diff --git "a/wandb/run-20220228_093705-yn2gmwrw/files/wandb-summary.json" "b/wandb/run-20220228_093705-yn2gmwrw/files/wandb-summary.json" --- "a/wandb/run-20220228_093705-yn2gmwrw/files/wandb-summary.json" +++ "b/wandb/run-20220228_093705-yn2gmwrw/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 4.3547, "train/learning_rate": 2.2429906542056077e-06, "train/epoch": 0.84, "train/global_step": 1500, "_runtime": 7672, "_timestamp": 1646048697, "_step": 1502, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 20.0, 954.0, 44.0], "bins": [-1042.8914794921875, -1026.2169189453125, -1009.54248046875, -992.867919921875, -976.1934204101562, -959.5189208984375, -942.8443603515625, -926.1698608398438, -909.495361328125, -892.8208618164062, -876.1463623046875, -859.4718017578125, -842.7973022460938, -826.122802734375, -809.4482421875, -792.7737426757812, -776.0992431640625, -759.4247436523438, -742.750244140625, -726.07568359375, -709.4011840820312, -692.7266845703125, -676.0521240234375, -659.3776245117188, -642.703125, -626.0286254882812, -609.3541259765625, -592.6795654296875, -576.0050659179688, -559.33056640625, -542.656005859375, -525.9815063476562, -509.3070068359375, -492.63250732421875, -475.9579772949219, -459.283447265625, -442.60894775390625, -425.9344482421875, -409.2599182128906, -392.58538818359375, -375.910888671875, -359.23638916015625, -342.5618591308594, -325.8873291015625, -309.21282958984375, -292.538330078125, -275.8638000488281, -259.18927001953125, -242.5147705078125, -225.8402557373047, -209.16574096679688, -192.49122619628906, -175.81671142578125, -159.14219665527344, -142.46768188476562, -125.79316711425781, -109.11865234375, -92.44413757324219, -75.76962280273438, -59.09510803222656, -42.42059326171875, -25.746078491210938, -9.071563720703125, 7.6029510498046875, 24.2774658203125]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 5.0, 2.0, 7.0, 12.0, 13.0, 12.0, 26.0, 23.0, 18.0, 41.0, 48.0, 50.0, 47.0, 41.0, 49.0, 50.0, 73.0, 64.0, 57.0, 57.0, 79.0, 50.0, 44.0, 23.0, 29.0, 21.0, 17.0, 15.0, 9.0, 10.0, 10.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.93453979492188, -91.27810668945312, -88.62166595458984, -85.9652328491211, -83.30879211425781, -80.65235900878906, -77.99591827392578, -75.33948516845703, -72.68304443359375, -70.026611328125, -67.37017059326172, -64.71373748779297, -62.05729675292969, -59.40086364746094, -56.74442672729492, -54.087989807128906, -51.431556701660156, -48.77511978149414, -46.118682861328125, -43.46224594116211, -40.805809020996094, -38.149375915527344, -35.49293899536133, -32.83650207519531, -30.180065155029297, -27.52362823486328, -24.867191314697266, -22.210756301879883, -19.554319381713867, -16.89788246154785, -14.241446495056152, -11.585010528564453, -8.928573608398438, -6.27213716506958, -3.6157007217407227, -0.9592642784118652, 1.6971721649169922, 4.353609085083008, 7.010045051574707, 9.666481018066406, 12.322917938232422, 14.979354858398438, 17.635791778564453, 20.292226791381836, 22.94866371154785, 25.605100631713867, 28.26153564453125, 30.917972564697266, 33.57440948486328, 36.2308464050293, 38.88728332519531, 41.54372024536133, 44.200157165527344, 46.856590270996094, 49.51302719116211, 52.169464111328125, 54.82590103149414, 57.482337951660156, 60.13877487182617, 62.79521179199219, 65.45164489746094, 68.10808563232422, 70.76451873779297, 73.42095947265625, 76.077392578125]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 4.0, 3.0, 6.0, 7.0, 8.0, 9.0, 11.0, 20.0, 9.0, 12.0, 12.0, 15.0, 11.0, 16.0, 22.0, 23.0, 25.0, 19.0, 31.0, 32.0, 25.0, 24.0, 37.0, 36.0, 39.0, 36.0, 29.0, 31.0, 34.0, 37.0, 32.0, 34.0, 30.0, 39.0, 30.0, 24.0, 27.0, 24.0, 23.0, 19.0, 20.0, 18.0, 14.0, 7.0, 7.0, 9.0, 3.0, 8.0, 5.0, 3.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 2.0], "bins": [-3.380859375, -3.278778076171875, -3.17669677734375, -3.074615478515625, -2.9725341796875, -2.870452880859375, -2.76837158203125, -2.666290283203125, -2.564208984375, -2.462127685546875, -2.36004638671875, -2.257965087890625, -2.1558837890625, -2.053802490234375, -1.95172119140625, -1.849639892578125, -1.74755859375, -1.645477294921875, -1.54339599609375, -1.441314697265625, -1.3392333984375, -1.237152099609375, -1.13507080078125, -1.032989501953125, -0.930908203125, -0.828826904296875, -0.72674560546875, -0.624664306640625, -0.5225830078125, -0.420501708984375, -0.31842041015625, -0.216339111328125, -0.1142578125, -0.012176513671875, 0.08990478515625, 0.191986083984375, 0.2940673828125, 0.396148681640625, 0.49822998046875, 0.600311279296875, 0.702392578125, 0.804473876953125, 0.90655517578125, 1.008636474609375, 1.1107177734375, 1.212799072265625, 1.31488037109375, 1.416961669921875, 1.51904296875, 1.621124267578125, 1.72320556640625, 1.825286865234375, 1.9273681640625, 2.029449462890625, 2.13153076171875, 2.233612060546875, 2.335693359375, 2.437774658203125, 2.53985595703125, 2.641937255859375, 2.7440185546875, 2.846099853515625, 2.94818115234375, 3.050262451171875, 3.15234375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 9.0, 7.0, 11.0, 16.0, 15.0, 23.0, 37.0, 44.0, 41.0, 61.0, 71.0, 87.0, 146.0, 177.0, 279.0, 346.0, 504.0, 732.0, 1158.0, 2007.0, 3525.0, 7184.0, 18456.0, 63660.0, 383879.0, 2143745.0, 1323670.0, 180670.0, 38049.0, 12720.0, 5509.0, 2749.0, 1549.0, 970.0, 602.0, 442.0, 324.0, 211.0, 147.0, 92.0, 96.0, 70.0, 46.0, 36.0, 31.0, 22.0, 13.0, 9.0, 8.0, 9.0, 3.0, 3.0, 4.0, 7.0, 3.0, 2.0, 4.0], "bins": [-10.578125, -10.2557373046875, -9.933349609375, -9.6109619140625, -9.28857421875, -8.9661865234375, -8.643798828125, -8.3214111328125, -7.9990234375, -7.6766357421875, -7.354248046875, -7.0318603515625, -6.70947265625, -6.3870849609375, -6.064697265625, -5.7423095703125, -5.419921875, -5.0975341796875, -4.775146484375, -4.4527587890625, -4.13037109375, -3.8079833984375, -3.485595703125, -3.1632080078125, -2.8408203125, -2.5184326171875, -2.196044921875, -1.8736572265625, -1.55126953125, -1.2288818359375, -0.906494140625, -0.5841064453125, -0.26171875, 0.0606689453125, 0.383056640625, 0.7054443359375, 1.02783203125, 1.3502197265625, 1.672607421875, 1.9949951171875, 2.3173828125, 2.6397705078125, 2.962158203125, 3.2845458984375, 3.60693359375, 3.9293212890625, 4.251708984375, 4.5740966796875, 4.896484375, 5.2188720703125, 5.541259765625, 5.8636474609375, 6.18603515625, 6.5084228515625, 6.830810546875, 7.1531982421875, 7.4755859375, 7.7979736328125, 8.120361328125, 8.4427490234375, 8.76513671875, 9.0875244140625, 9.409912109375, 9.7322998046875, 10.0546875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 3.0, 6.0, 13.0, 15.0, 54.0, 133.0, 243.0, 484.0, 1049.0, 1096.0, 566.0, 219.0, 99.0, 41.0, 26.0, 15.0, 9.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.84375, -40.74365234375, -39.6435546875, -38.54345703125, -37.443359375, -36.34326171875, -35.2431640625, -34.14306640625, -33.04296875, -31.94287109375, -30.8427734375, -29.74267578125, -28.642578125, -27.54248046875, -26.4423828125, -25.34228515625, -24.2421875, -23.14208984375, -22.0419921875, -20.94189453125, -19.841796875, -18.74169921875, -17.6416015625, -16.54150390625, -15.44140625, -14.34130859375, -13.2412109375, -12.14111328125, -11.041015625, -9.94091796875, -8.8408203125, -7.74072265625, -6.640625, -5.54052734375, -4.4404296875, -3.34033203125, -2.240234375, -1.14013671875, -0.0400390625, 1.06005859375, 2.16015625, 3.26025390625, 4.3603515625, 5.46044921875, 6.560546875, 7.66064453125, 8.7607421875, 9.86083984375, 10.9609375, 12.06103515625, 13.1611328125, 14.26123046875, 15.361328125, 16.46142578125, 17.5615234375, 18.66162109375, 19.76171875, 20.86181640625, 21.9619140625, 23.06201171875, 24.162109375, 25.26220703125, 26.3623046875, 27.46240234375, 28.5625]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 7.0, 7.0, 13.0, 20.0, 39.0, 66.0, 180.0, 499.0, 1317.0, 10476.0, 4167371.0, 12157.0, 1287.0, 482.0, 196.0, 91.0, 35.0, 18.0, 12.0, 2.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-126.4375, -122.6650390625, -118.892578125, -115.1201171875, -111.34765625, -107.5751953125, -103.802734375, -100.0302734375, -96.2578125, -92.4853515625, -88.712890625, -84.9404296875, -81.16796875, -77.3955078125, -73.623046875, -69.8505859375, -66.078125, -62.3056640625, -58.533203125, -54.7607421875, -50.98828125, -47.2158203125, -43.443359375, -39.6708984375, -35.8984375, -32.1259765625, -28.353515625, -24.5810546875, -20.80859375, -17.0361328125, -13.263671875, -9.4912109375, -5.71875, -1.9462890625, 1.826171875, 5.5986328125, 9.37109375, 13.1435546875, 16.916015625, 20.6884765625, 24.4609375, 28.2333984375, 32.005859375, 35.7783203125, 39.55078125, 43.3232421875, 47.095703125, 50.8681640625, 54.640625, 58.4130859375, 62.185546875, 65.9580078125, 69.73046875, 73.5029296875, 77.275390625, 81.0478515625, 84.8203125, 88.5927734375, 92.365234375, 96.1376953125, 99.91015625, 103.6826171875, 107.455078125, 111.2275390625, 115.0]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 314.0, 682.0, 16.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.01564025878906, -80.80253601074219, -69.58943176269531, -58.37632751464844, -47.16322326660156, -35.95011901855469, -24.737014770507812, -13.523910522460938, -2.3108062744140625, 8.902297973632812, 20.115402221679688, 31.328506469726562, 42.54161071777344, 53.75471496582031, 64.96781921386719, 76.18092346191406, 87.39402770996094, 98.60713195800781, 109.82023620605469, 121.03334045410156, 132.24644470214844, 143.4595489501953, 154.6726531982422, 165.88575744628906, 177.09886169433594, 188.3119659423828, 199.5250701904297, 210.73817443847656, 221.95127868652344, 233.1643829345703, 244.3774871826172, 255.59059143066406, 266.8037109375, 278.0168151855469, 289.22991943359375, 300.4430236816406, 311.6561279296875, 322.8692321777344, 334.08233642578125, 345.2954406738281, 356.508544921875, 367.7216491699219, 378.93475341796875, 390.1478576660156, 401.3609619140625, 412.5740661621094, 423.78717041015625, 435.0002746582031, 446.21337890625, 457.4264831542969, 468.63958740234375, 479.8526916503906, 491.0657958984375, 502.2789001464844, 513.4920043945312, 524.705078125, 535.918212890625, 547.13134765625, 558.3444213867188, 569.5574951171875, 580.7706298828125, 591.9837646484375, 603.1968383789062, 614.409912109375, 625.623046875]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 7.0, 4.0, 6.0, 7.0, 9.0, 6.0, 22.0, 19.0, 19.0, 16.0, 18.0, 31.0, 30.0, 31.0, 34.0, 43.0, 35.0, 29.0, 48.0, 37.0, 40.0, 37.0, 26.0, 42.0, 41.0, 46.0, 39.0, 34.0, 27.0, 28.0, 29.0, 30.0, 20.0, 19.0, 18.0, 23.0, 11.0, 10.0, 10.0, 8.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-41.481170654296875, -40.00740051269531, -38.53363037109375, -37.05986022949219, -35.586090087890625, -34.1123161315918, -32.638545989990234, -31.164775848388672, -29.69100570678711, -28.217235565185547, -26.743465423583984, -25.26969337463379, -23.795923233032227, -22.322153091430664, -20.84838104248047, -19.374610900878906, -17.900840759277344, -16.42707061767578, -14.953299522399902, -13.479528427124023, -12.005758285522461, -10.531988143920898, -9.05821704864502, -7.584445953369141, -6.110675811767578, -4.636905193328857, -3.1631345748901367, -1.689363956451416, -0.2155933380126953, 1.2581772804260254, 2.731947898864746, 4.205718994140625, 5.6794891357421875, 7.153259754180908, 8.627030372619629, 10.100801467895508, 11.57457160949707, 13.048341751098633, 14.522112846374512, 15.99588394165039, 17.469654083251953, 18.943424224853516, 20.417194366455078, 21.890966415405273, 23.364736557006836, 24.8385066986084, 26.312278747558594, 27.786048889160156, 29.25981903076172, 30.73358917236328, 32.207359313964844, 33.681129455566406, 35.15489959716797, 36.6286735534668, 38.10244369506836, 39.57621383666992, 41.049983978271484, 42.52375411987305, 43.99752426147461, 45.47129440307617, 46.945068359375, 48.41883850097656, 49.892608642578125, 51.36637878417969, 52.84014892578125]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 2.0, 2.0, 4.0, 3.0, 7.0, 5.0, 8.0, 8.0, 9.0, 24.0, 17.0, 21.0, 25.0, 19.0, 24.0, 24.0, 26.0, 26.0, 28.0, 25.0, 31.0, 39.0, 28.0, 36.0, 36.0, 42.0, 51.0, 42.0, 34.0, 35.0, 40.0, 28.0, 37.0, 29.0, 20.0, 28.0, 20.0, 16.0, 21.0, 14.0, 13.0, 13.0, 12.0, 7.0, 9.0, 9.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.05859375, -3.935302734375, -3.81201171875, -3.688720703125, -3.5654296875, -3.442138671875, -3.31884765625, -3.195556640625, -3.072265625, -2.948974609375, -2.82568359375, -2.702392578125, -2.5791015625, -2.455810546875, -2.33251953125, -2.209228515625, -2.0859375, -1.962646484375, -1.83935546875, -1.716064453125, -1.5927734375, -1.469482421875, -1.34619140625, -1.222900390625, -1.099609375, -0.976318359375, -0.85302734375, -0.729736328125, -0.6064453125, -0.483154296875, -0.35986328125, -0.236572265625, -0.11328125, 0.010009765625, 0.13330078125, 0.256591796875, 0.3798828125, 0.503173828125, 0.62646484375, 0.749755859375, 0.873046875, 0.996337890625, 1.11962890625, 1.242919921875, 1.3662109375, 1.489501953125, 1.61279296875, 1.736083984375, 1.859375, 1.982666015625, 2.10595703125, 2.229248046875, 2.3525390625, 2.475830078125, 2.59912109375, 2.722412109375, 2.845703125, 2.968994140625, 3.09228515625, 3.215576171875, 3.3388671875, 3.462158203125, 3.58544921875, 3.708740234375, 3.83203125]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 12.0, 13.0, 34.0, 33.0, 62.0, 87.0, 131.0, 199.0, 265.0, 477.0, 661.0, 1029.0, 1623.0, 2356.0, 3665.0, 5414.0, 8237.0, 12351.0, 17961.0, 26989.0, 39782.0, 60546.0, 93713.0, 152381.0, 201634.0, 148745.0, 91777.0, 59119.0, 39210.0, 26436.0, 17577.0, 12068.0, 7900.0, 5465.0, 3593.0, 2299.0, 1658.0, 959.0, 751.0, 456.0, 319.0, 171.0, 151.0, 76.0, 56.0, 40.0, 37.0, 9.0, 8.0, 5.0, 11.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.43359375, -0.4198188781738281, -0.40604400634765625, -0.3922691345214844, -0.3784942626953125, -0.3647193908691406, -0.35094451904296875, -0.3371696472167969, -0.323394775390625, -0.3096199035644531, -0.29584503173828125, -0.2820701599121094, -0.2682952880859375, -0.2545204162597656, -0.24074554443359375, -0.22697067260742188, -0.21319580078125, -0.19942092895507812, -0.18564605712890625, -0.17187118530273438, -0.1580963134765625, -0.14432144165039062, -0.13054656982421875, -0.11677169799804688, -0.102996826171875, -0.08922195434570312, -0.07544708251953125, -0.061672210693359375, -0.0478973388671875, -0.034122467041015625, -0.02034759521484375, -0.006572723388671875, 0.0072021484375, 0.020977020263671875, 0.03475189208984375, 0.048526763916015625, 0.0623016357421875, 0.07607650756835938, 0.08985137939453125, 0.10362625122070312, 0.117401123046875, 0.13117599487304688, 0.14495086669921875, 0.15872573852539062, 0.1725006103515625, 0.18627548217773438, 0.20005035400390625, 0.21382522583007812, 0.22760009765625, 0.24137496948242188, 0.25514984130859375, 0.2689247131347656, 0.2826995849609375, 0.2964744567871094, 0.31024932861328125, 0.3240242004394531, 0.337799072265625, 0.3515739440917969, 0.36534881591796875, 0.3791236877441406, 0.3928985595703125, 0.4066734313964844, 0.42044830322265625, 0.4342231750488281, 0.447998046875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 2.0, 4.0, 4.0, 3.0, 4.0, 6.0, 8.0, 14.0, 12.0, 13.0, 10.0, 11.0, 21.0, 22.0, 22.0, 29.0, 42.0, 36.0, 42.0, 46.0, 39.0, 40.0, 46.0, 1065.0, 43.0, 52.0, 49.0, 50.0, 34.0, 31.0, 41.0, 30.0, 19.0, 25.0, 20.0, 20.0, 12.0, 12.0, 10.0, 6.0, 9.0, 5.0, 7.0, 1.0, 4.0, 7.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.416015625, -2.327117919921875, -2.23822021484375, -2.149322509765625, -2.0604248046875, -1.971527099609375, -1.88262939453125, -1.793731689453125, -1.704833984375, -1.615936279296875, -1.52703857421875, -1.438140869140625, -1.3492431640625, -1.260345458984375, -1.17144775390625, -1.082550048828125, -0.99365234375, -0.904754638671875, -0.81585693359375, -0.726959228515625, -0.6380615234375, -0.549163818359375, -0.46026611328125, -0.371368408203125, -0.282470703125, -0.193572998046875, -0.10467529296875, -0.015777587890625, 0.0731201171875, 0.162017822265625, 0.25091552734375, 0.339813232421875, 0.4287109375, 0.517608642578125, 0.60650634765625, 0.695404052734375, 0.7843017578125, 0.873199462890625, 0.96209716796875, 1.050994873046875, 1.139892578125, 1.228790283203125, 1.31768798828125, 1.406585693359375, 1.4954833984375, 1.584381103515625, 1.67327880859375, 1.762176513671875, 1.85107421875, 1.939971923828125, 2.02886962890625, 2.117767333984375, 2.2066650390625, 2.295562744140625, 2.38446044921875, 2.473358154296875, 2.562255859375, 2.651153564453125, 2.74005126953125, 2.828948974609375, 2.9178466796875, 3.006744384765625, 3.09564208984375, 3.184539794921875, 3.2734375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 7.0, 1.0, 9.0, 10.0, 13.0, 27.0, 40.0, 45.0, 74.0, 108.0, 153.0, 242.0, 344.0, 525.0, 767.0, 1136.0, 1729.0, 2588.0, 4040.0, 6294.0, 9956.0, 16161.0, 26831.0, 47211.0, 81566.0, 144883.0, 1276040.0, 199978.0, 115021.0, 65059.0, 37432.0, 22184.0, 13250.0, 8257.0, 5234.0, 3266.0, 2213.0, 1433.0, 1022.0, 635.0, 420.0, 296.0, 211.0, 155.0, 92.0, 62.0, 47.0, 23.0, 20.0, 13.0, 8.0, 5.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.441162109375, -0.4263572692871094, -0.41155242919921875, -0.3967475891113281, -0.3819427490234375, -0.3671379089355469, -0.35233306884765625, -0.3375282287597656, -0.322723388671875, -0.3079185485839844, -0.29311370849609375, -0.2783088684082031, -0.2635040283203125, -0.24869918823242188, -0.23389434814453125, -0.21908950805664062, -0.20428466796875, -0.18947982788085938, -0.17467498779296875, -0.15987014770507812, -0.1450653076171875, -0.13026046752929688, -0.11545562744140625, -0.10065078735351562, -0.085845947265625, -0.07104110717773438, -0.05623626708984375, -0.041431427001953125, -0.0266265869140625, -0.011821746826171875, 0.00298309326171875, 0.017787933349609375, 0.0325927734375, 0.047397613525390625, 0.06220245361328125, 0.07700729370117188, 0.0918121337890625, 0.10661697387695312, 0.12142181396484375, 0.13622665405273438, 0.151031494140625, 0.16583633422851562, 0.18064117431640625, 0.19544601440429688, 0.2102508544921875, 0.22505569458007812, 0.23986053466796875, 0.2546653747558594, 0.26947021484375, 0.2842750549316406, 0.29907989501953125, 0.3138847351074219, 0.3286895751953125, 0.3434944152832031, 0.35829925537109375, 0.3731040954589844, 0.387908935546875, 0.4027137756347656, 0.41751861572265625, 0.4323234558105469, 0.4471282958984375, 0.4619331359863281, 0.47673797607421875, 0.4915428161621094, 0.50634765625]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 6.0, 6.0, 8.0, 5.0, 10.0, 6.0, 28.0, 27.0, 34.0, 32.0, 38.0, 50.0, 52.0, 70.0, 78.0, 69.0, 90.0, 76.0, 55.0, 51.0, 37.0, 36.0, 28.0, 24.0, 11.0, 14.0, 13.0, 6.0, 10.0, 6.0, 6.0, 5.0, 3.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020008087158203125, -0.0019198358058929443, -0.0018388628959655762, -0.001757889986038208, -0.0016769170761108398, -0.0015959441661834717, -0.0015149712562561035, -0.0014339983463287354, -0.0013530254364013672, -0.001272052526473999, -0.0011910796165466309, -0.0011101067066192627, -0.0010291337966918945, -0.0009481608867645264, -0.0008671879768371582, -0.00078621506690979, -0.0007052421569824219, -0.0006242692470550537, -0.0005432963371276855, -0.0004623234272003174, -0.0003813505172729492, -0.00030037760734558105, -0.0002194046974182129, -0.00013843178749084473, -5.745887756347656e-05, 2.35140323638916e-05, 0.00010448694229125977, 0.00018545985221862793, 0.0002664327621459961, 0.00034740567207336426, 0.0004283785820007324, 0.0005093514919281006, 0.0005903244018554688, 0.0006712973117828369, 0.0007522702217102051, 0.0008332431316375732, 0.0009142160415649414, 0.0009951889514923096, 0.0010761618614196777, 0.001157134771347046, 0.001238107681274414, 0.0013190805912017822, 0.0014000535011291504, 0.0014810264110565186, 0.0015619993209838867, 0.0016429722309112549, 0.001723945140838623, 0.0018049180507659912, 0.0018858909606933594, 0.0019668638706207275, 0.0020478367805480957, 0.002128809690475464, 0.002209782600402832, 0.0022907555103302, 0.0023717284202575684, 0.0024527013301849365, 0.0025336742401123047, 0.002614647150039673, 0.002695620059967041, 0.002776592969894409, 0.0028575658798217773, 0.0029385387897491455, 0.0030195116996765137, 0.003100484609603882, 0.00318145751953125]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 4.0, 6.0, 7.0, 7.0, 8.0, 12.0, 28.0, 32.0, 28.0, 41.0, 74.0, 96.0, 151.0, 198.0, 289.0, 482.0, 772.0, 993704.0, 50612.0, 706.0, 414.0, 260.0, 172.0, 115.0, 86.0, 75.0, 58.0, 35.0, 20.0, 10.0, 14.0, 14.0, 6.0, 10.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.063720703125, -0.06199359893798828, -0.06026649475097656, -0.058539390563964844, -0.056812286376953125, -0.055085182189941406, -0.05335807800292969, -0.05163097381591797, -0.04990386962890625, -0.04817676544189453, -0.04644966125488281, -0.044722557067871094, -0.042995452880859375, -0.041268348693847656, -0.03954124450683594, -0.03781414031982422, -0.0360870361328125, -0.03435993194580078, -0.03263282775878906, -0.030905723571777344, -0.029178619384765625, -0.027451515197753906, -0.025724411010742188, -0.02399730682373047, -0.02227020263671875, -0.02054309844970703, -0.018815994262695312, -0.017088890075683594, -0.015361785888671875, -0.013634681701660156, -0.011907577514648438, -0.010180473327636719, -0.008453369140625, -0.006726264953613281, -0.0049991607666015625, -0.0032720565795898438, -0.001544952392578125, 0.00018215179443359375, 0.0019092559814453125, 0.0036363601684570312, 0.00536346435546875, 0.007090568542480469, 0.008817672729492188, 0.010544776916503906, 0.012271881103515625, 0.013998985290527344, 0.015726089477539062, 0.01745319366455078, 0.0191802978515625, 0.02090740203857422, 0.022634506225585938, 0.024361610412597656, 0.026088714599609375, 0.027815818786621094, 0.029542922973632812, 0.03127002716064453, 0.03299713134765625, 0.03472423553466797, 0.03645133972167969, 0.038178443908691406, 0.039905548095703125, 0.041632652282714844, 0.04335975646972656, 0.04508686065673828, 0.04681396484375]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 10.0, 31.0, 176.0, 434.0, 268.0, 73.0, 19.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012770687462761998, -0.0012049650540575385, -0.0011328613618388772, -0.001060757669620216, -0.0009886539774015546, -0.0009165502851828933, -0.0008444466511718929, -0.0007723429589532316, -0.0007002392667345703, -0.000628135574515909, -0.0005560318822972476, -0.0004839282191824168, -0.0004118245269637555, -0.0003397208347450942, -0.00026761717163026333, -0.00019551347941160202, -0.0001234097871929407, -5.130610225023702e-05, 2.0797582692466676e-05, 9.290126035921276e-05, 0.00016500495257787406, 0.00023710864479653537, 0.0003092123079113662, 0.00038131600013002753, 0.00045341969234868884, 0.0005255233845673501, 0.0005976270767860115, 0.0006697307107970119, 0.0007418344030156732, 0.0008139380952343345, 0.0008860417874529958, 0.0009581454796716571, 0.0010302492883056402, 0.0011023529805243015, 0.0011744566727429628, 0.0012465603649616241, 0.0013186640571802855, 0.0013907677493989468, 0.001462871441617608, 0.0015349751338362694, 0.0016070788260549307, 0.001679182518273592, 0.0017512862104922533, 0.0018233899027109146, 0.001895493594929576, 0.0019675972871482372, 0.0020397009793668985, 0.00211180467158556, 0.0021839081309735775, 0.002256011823192239, 0.0023281155154109, 0.0024002192076295614, 0.0024723228998482227, 0.002544426592066884, 0.0026165302842855453, 0.0026886339765042067, 0.002760737668722868, 0.0028328413609415293, 0.0029049450531601906, 0.002977048745378852, 0.003049152437597513, 0.0031212561298161745, 0.003193359822034836, 0.003265463514253497, 0.0033375672064721584]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 1.0, 1.0, 5.0, 6.0, 7.0, 8.0, 8.0, 16.0, 17.0, 17.0, 19.0, 22.0, 26.0, 55.0, 33.0, 46.0, 49.0, 50.0, 45.0, 49.0, 58.0, 46.0, 46.0, 47.0, 47.0, 46.0, 27.0, 45.0, 26.0, 24.0, 19.0, 20.0, 18.0, 11.0, 11.0, 9.0, 5.0, 4.0, 8.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014643669128417969, -0.0014221537858247757, -0.0013799406588077545, -0.0013377275317907333, -0.0012955144047737122, -0.001253301277756691, -0.0012110881507396698, -0.0011688750237226486, -0.0011266618967056274, -0.0010844487696886063, -0.001042235642671585, -0.001000022515654564, -0.0009578093886375427, -0.0009155962616205215, -0.0008733831346035004, -0.0008311700075864792, -0.000788956880569458, -0.0007467437535524368, -0.0007045306265354156, -0.0006623174995183945, -0.0006201043725013733, -0.0005778912454843521, -0.0005356781184673309, -0.0004934649914503098, -0.0004512518644332886, -0.0004090387374162674, -0.0003668256103992462, -0.00032461248338222504, -0.00028239935636520386, -0.00024018622934818268, -0.0001979731023311615, -0.00015575997531414032, -0.00011354684829711914, -7.133372128009796e-05, -2.9120594263076782e-05, 1.3092532753944397e-05, 5.5305659770965576e-05, 9.751878678798676e-05, 0.00013973191380500793, 0.00018194504082202911, 0.0002241581678390503, 0.00026637129485607147, 0.00030858442187309265, 0.00035079754889011383, 0.000393010675907135, 0.0004352238029241562, 0.00047743692994117737, 0.0005196500569581985, 0.0005618631839752197, 0.0006040763109922409, 0.0006462894380092621, 0.0006885025650262833, 0.0007307156920433044, 0.0007729288190603256, 0.0008151419460773468, 0.000857355073094368, 0.0008995682001113892, 0.0009417813271284103, 0.0009839944541454315, 0.0010262075811624527, 0.0010684207081794739, 0.001110633835196495, 0.0011528469622135162, 0.0011950600892305374, 0.0012372732162475586]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 2.0, 2.0, 4.0, 3.0, 7.0, 5.0, 8.0, 8.0, 9.0, 24.0, 17.0, 21.0, 25.0, 19.0, 23.0, 25.0, 26.0, 26.0, 28.0, 25.0, 31.0, 39.0, 28.0, 36.0, 36.0, 42.0, 51.0, 42.0, 34.0, 35.0, 40.0, 28.0, 37.0, 29.0, 20.0, 28.0, 20.0, 16.0, 21.0, 14.0, 13.0, 13.0, 12.0, 7.0, 9.0, 9.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.05859375, -3.935302734375, -3.81201171875, -3.688720703125, -3.5654296875, -3.442138671875, -3.31884765625, -3.195556640625, -3.072265625, -2.948974609375, -2.82568359375, -2.702392578125, -2.5791015625, -2.455810546875, -2.33251953125, -2.209228515625, -2.0859375, -1.962646484375, -1.83935546875, -1.716064453125, -1.5927734375, -1.469482421875, -1.34619140625, -1.222900390625, -1.099609375, -0.976318359375, -0.85302734375, -0.729736328125, -0.6064453125, -0.483154296875, -0.35986328125, -0.236572265625, -0.11328125, 0.010009765625, 0.13330078125, 0.256591796875, 0.3798828125, 0.503173828125, 0.62646484375, 0.749755859375, 0.873046875, 0.996337890625, 1.11962890625, 1.242919921875, 1.3662109375, 1.489501953125, 1.61279296875, 1.736083984375, 1.859375, 1.982666015625, 2.10595703125, 2.229248046875, 2.3525390625, 2.475830078125, 2.59912109375, 2.722412109375, 2.845703125, 2.968994140625, 3.09228515625, 3.215576171875, 3.3388671875, 3.462158203125, 3.58544921875, 3.708740234375, 3.83203125]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 0.0, 9.0, 4.0, 10.0, 11.0, 12.0, 21.0, 29.0, 35.0, 54.0, 56.0, 68.0, 110.0, 147.0, 184.0, 218.0, 331.0, 433.0, 605.0, 814.0, 1161.0, 1546.0, 2172.0, 3533.0, 5829.0, 11167.0, 31708.0, 650041.0, 289106.0, 23753.0, 9565.0, 5132.0, 3188.0, 2069.0, 1498.0, 1016.0, 752.0, 553.0, 393.0, 312.0, 215.0, 175.0, 140.0, 101.0, 73.0, 50.0, 38.0, 28.0, 24.0, 16.0, 21.0, 9.0, 11.0, 6.0, 7.0, 2.0, 1.0, 2.0, 3.0, 1.0], "bins": [-25.609375, -24.806396484375, -24.00341796875, -23.200439453125, -22.3974609375, -21.594482421875, -20.79150390625, -19.988525390625, -19.185546875, -18.382568359375, -17.57958984375, -16.776611328125, -15.9736328125, -15.170654296875, -14.36767578125, -13.564697265625, -12.76171875, -11.958740234375, -11.15576171875, -10.352783203125, -9.5498046875, -8.746826171875, -7.94384765625, -7.140869140625, -6.337890625, -5.534912109375, -4.73193359375, -3.928955078125, -3.1259765625, -2.322998046875, -1.52001953125, -0.717041015625, 0.0859375, 0.888916015625, 1.69189453125, 2.494873046875, 3.2978515625, 4.100830078125, 4.90380859375, 5.706787109375, 6.509765625, 7.312744140625, 8.11572265625, 8.918701171875, 9.7216796875, 10.524658203125, 11.32763671875, 12.130615234375, 12.93359375, 13.736572265625, 14.53955078125, 15.342529296875, 16.1455078125, 16.948486328125, 17.75146484375, 18.554443359375, 19.357421875, 20.160400390625, 20.96337890625, 21.766357421875, 22.5693359375, 23.372314453125, 24.17529296875, 24.978271484375, 25.78125]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 9.0, 8.0, 9.0, 14.0, 9.0, 17.0, 9.0, 18.0, 14.0, 21.0, 35.0, 28.0, 23.0, 26.0, 40.0, 55.0, 36.0, 61.0, 82.0, 163.0, 1477.0, 307.0, 122.0, 70.0, 55.0, 51.0, 41.0, 26.0, 14.0, 25.0, 28.0, 21.0, 20.0, 21.0, 22.0, 12.0, 9.0, 11.0, 8.0, 7.0, 3.0, 5.0, 6.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-12.1015625, -11.721435546875, -11.34130859375, -10.961181640625, -10.5810546875, -10.200927734375, -9.82080078125, -9.440673828125, -9.060546875, -8.680419921875, -8.30029296875, -7.920166015625, -7.5400390625, -7.159912109375, -6.77978515625, -6.399658203125, -6.01953125, -5.639404296875, -5.25927734375, -4.879150390625, -4.4990234375, -4.118896484375, -3.73876953125, -3.358642578125, -2.978515625, -2.598388671875, -2.21826171875, -1.838134765625, -1.4580078125, -1.077880859375, -0.69775390625, -0.317626953125, 0.0625, 0.442626953125, 0.82275390625, 1.202880859375, 1.5830078125, 1.963134765625, 2.34326171875, 2.723388671875, 3.103515625, 3.483642578125, 3.86376953125, 4.243896484375, 4.6240234375, 5.004150390625, 5.38427734375, 5.764404296875, 6.14453125, 6.524658203125, 6.90478515625, 7.284912109375, 7.6650390625, 8.045166015625, 8.42529296875, 8.805419921875, 9.185546875, 9.565673828125, 9.94580078125, 10.325927734375, 10.7060546875, 11.086181640625, 11.46630859375, 11.846435546875, 12.2265625]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 6.0, 3.0, 6.0, 5.0, 5.0, 8.0, 3.0, 14.0, 12.0, 14.0, 19.0, 12.0, 31.0, 24.0, 25.0, 25.0, 30.0, 58.0, 73.0, 128.0, 331.0, 995.0, 17923.0, 3118246.0, 6114.0, 807.0, 276.0, 119.0, 76.0, 48.0, 44.0, 34.0, 23.0, 23.0, 26.0, 20.0, 12.0, 16.0, 12.0, 11.0, 13.0, 10.0, 5.0, 8.0, 4.0, 5.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-55.90625, -54.18115234375, -52.4560546875, -50.73095703125, -49.005859375, -47.28076171875, -45.5556640625, -43.83056640625, -42.10546875, -40.38037109375, -38.6552734375, -36.93017578125, -35.205078125, -33.47998046875, -31.7548828125, -30.02978515625, -28.3046875, -26.57958984375, -24.8544921875, -23.12939453125, -21.404296875, -19.67919921875, -17.9541015625, -16.22900390625, -14.50390625, -12.77880859375, -11.0537109375, -9.32861328125, -7.603515625, -5.87841796875, -4.1533203125, -2.42822265625, -0.703125, 1.02197265625, 2.7470703125, 4.47216796875, 6.197265625, 7.92236328125, 9.6474609375, 11.37255859375, 13.09765625, 14.82275390625, 16.5478515625, 18.27294921875, 19.998046875, 21.72314453125, 23.4482421875, 25.17333984375, 26.8984375, 28.62353515625, 30.3486328125, 32.07373046875, 33.798828125, 35.52392578125, 37.2490234375, 38.97412109375, 40.69921875, 42.42431640625, 44.1494140625, 45.87451171875, 47.599609375, 49.32470703125, 51.0498046875, 52.77490234375, 54.5]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1007.0, 13.0, 1.0], "bins": [-846.1148071289062, -832.4221801757812, -818.7295532226562, -805.0369262695312, -791.34423828125, -777.651611328125, -763.958984375, -750.266357421875, -736.57373046875, -722.881103515625, -709.1884765625, -695.495849609375, -681.8031616210938, -668.1105346679688, -654.4179077148438, -640.7252807617188, -627.0326538085938, -613.3400268554688, -599.6473999023438, -585.9547729492188, -572.2620849609375, -558.5694580078125, -544.8768310546875, -531.1842041015625, -517.4915771484375, -503.7989501953125, -490.1062927246094, -476.4136657714844, -462.7210388183594, -449.02838134765625, -435.33575439453125, -421.64312744140625, -407.9504699707031, -394.2578430175781, -380.565185546875, -366.87255859375, -353.179931640625, -339.4873046875, -325.7946472167969, -312.1020202636719, -298.4093933105469, -284.7167663574219, -271.02410888671875, -257.33148193359375, -243.63885498046875, -229.9462127685547, -216.25357055664062, -202.56094360351562, -188.86830139160156, -175.1756591796875, -161.4830322265625, -147.79039001464844, -134.09776306152344, -120.40512084960938, -106.71248626708984, -93.01985168457031, -79.32722473144531, -65.63459014892578, -51.94195556640625, -38.24931716918945, -24.556682586669922, -10.864044189453125, 2.8285903930664062, 16.521224975585938, 30.213863372802734]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 9.0, 10.0, 12.0, 16.0, 11.0, 18.0, 17.0, 19.0, 16.0, 34.0, 32.0, 30.0, 37.0, 25.0, 33.0, 37.0, 31.0, 53.0, 35.0, 39.0, 50.0, 31.0, 36.0, 33.0, 28.0, 29.0, 41.0, 22.0, 30.0, 22.0, 19.0, 26.0, 13.0, 18.0, 14.0, 15.0, 14.0, 8.0, 7.0, 7.0, 5.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-44.53876495361328, -43.30615234375, -42.07353973388672, -40.8409309387207, -39.60831832885742, -38.37570571899414, -37.143096923828125, -35.910484313964844, -34.67787170410156, -33.44525909423828, -32.212646484375, -30.980037689208984, -29.747425079345703, -28.514812469482422, -27.282201766967773, -26.049591064453125, -24.816978454589844, -23.584365844726562, -22.351755142211914, -21.119144439697266, -19.886531829833984, -18.653919219970703, -17.421308517456055, -16.188697814941406, -14.956085205078125, -13.72347354888916, -12.490861892700195, -11.25825023651123, -10.025638580322266, -8.7930269241333, -7.560415267944336, -6.327803611755371, -5.095191955566406, -3.8625802993774414, -2.6299686431884766, -1.3973569869995117, -0.16474533081054688, 1.067866325378418, 2.300477981567383, 3.5330896377563477, 4.7657012939453125, 5.998312950134277, 7.230924606323242, 8.463536262512207, 9.696147918701172, 10.928759574890137, 12.161371231079102, 13.393982887268066, 14.626594543457031, 15.859206199645996, 17.09181785583496, 18.32442855834961, 19.55704116821289, 20.789653778076172, 22.02226448059082, 23.25487518310547, 24.48748779296875, 25.72010040283203, 26.95271110534668, 28.185321807861328, 29.41793441772461, 30.65054702758789, 31.88315773010254, 33.11576843261719, 34.34838104248047]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 5.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 10.0, 8.0, 7.0, 10.0, 22.0, 28.0, 11.0, 24.0, 21.0, 17.0, 22.0, 17.0, 32.0, 22.0, 33.0, 29.0, 32.0, 25.0, 33.0, 33.0, 45.0, 41.0, 49.0, 36.0, 36.0, 37.0, 27.0, 37.0, 34.0, 18.0, 30.0, 29.0, 19.0, 15.0, 15.0, 18.0, 14.0, 8.0, 11.0, 11.0, 9.0, 6.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-4.09765625, -3.9716796875, -3.845703125, -3.7197265625, -3.59375, -3.4677734375, -3.341796875, -3.2158203125, -3.08984375, -2.9638671875, -2.837890625, -2.7119140625, -2.5859375, -2.4599609375, -2.333984375, -2.2080078125, -2.08203125, -1.9560546875, -1.830078125, -1.7041015625, -1.578125, -1.4521484375, -1.326171875, -1.2001953125, -1.07421875, -0.9482421875, -0.822265625, -0.6962890625, -0.5703125, -0.4443359375, -0.318359375, -0.1923828125, -0.06640625, 0.0595703125, 0.185546875, 0.3115234375, 0.4375, 0.5634765625, 0.689453125, 0.8154296875, 0.94140625, 1.0673828125, 1.193359375, 1.3193359375, 1.4453125, 1.5712890625, 1.697265625, 1.8232421875, 1.94921875, 2.0751953125, 2.201171875, 2.3271484375, 2.453125, 2.5791015625, 2.705078125, 2.8310546875, 2.95703125, 3.0830078125, 3.208984375, 3.3349609375, 3.4609375, 3.5869140625, 3.712890625, 3.8388671875, 3.96484375]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 5.0, 5.0, 5.0, 5.0, 6.0, 15.0, 16.0, 17.0, 30.0, 41.0, 57.0, 90.0, 104.0, 172.0, 301.0, 512.0, 953.0, 1790.0, 3648.0, 7986.0, 20526.0, 86463.0, 2149479.0, 1809101.0, 77585.0, 19515.0, 7872.0, 3623.0, 1882.0, 972.0, 540.0, 346.0, 184.0, 119.0, 94.0, 67.0, 39.0, 23.0, 28.0, 17.0, 14.0, 8.0, 7.0, 5.0, 5.0, 4.0, 6.0, 4.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-25.46875, -24.646484375, -23.82421875, -23.001953125, -22.1796875, -21.357421875, -20.53515625, -19.712890625, -18.890625, -18.068359375, -17.24609375, -16.423828125, -15.6015625, -14.779296875, -13.95703125, -13.134765625, -12.3125, -11.490234375, -10.66796875, -9.845703125, -9.0234375, -8.201171875, -7.37890625, -6.556640625, -5.734375, -4.912109375, -4.08984375, -3.267578125, -2.4453125, -1.623046875, -0.80078125, 0.021484375, 0.84375, 1.666015625, 2.48828125, 3.310546875, 4.1328125, 4.955078125, 5.77734375, 6.599609375, 7.421875, 8.244140625, 9.06640625, 9.888671875, 10.7109375, 11.533203125, 12.35546875, 13.177734375, 14.0, 14.822265625, 15.64453125, 16.466796875, 17.2890625, 18.111328125, 18.93359375, 19.755859375, 20.578125, 21.400390625, 22.22265625, 23.044921875, 23.8671875, 24.689453125, 25.51171875, 26.333984375, 27.15625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 2.0, 8.0, 4.0, 10.0, 14.0, 13.0, 37.0, 58.0, 61.0, 144.0, 184.0, 373.0, 565.0, 864.0, 729.0, 455.0, 244.0, 134.0, 70.0, 42.0, 25.0, 19.0, 13.0, 7.0, 5.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.84375, -37.8134765625, -36.783203125, -35.7529296875, -34.72265625, -33.6923828125, -32.662109375, -31.6318359375, -30.6015625, -29.5712890625, -28.541015625, -27.5107421875, -26.48046875, -25.4501953125, -24.419921875, -23.3896484375, -22.359375, -21.3291015625, -20.298828125, -19.2685546875, -18.23828125, -17.2080078125, -16.177734375, -15.1474609375, -14.1171875, -13.0869140625, -12.056640625, -11.0263671875, -9.99609375, -8.9658203125, -7.935546875, -6.9052734375, -5.875, -4.8447265625, -3.814453125, -2.7841796875, -1.75390625, -0.7236328125, 0.306640625, 1.3369140625, 2.3671875, 3.3974609375, 4.427734375, 5.4580078125, 6.48828125, 7.5185546875, 8.548828125, 9.5791015625, 10.609375, 11.6396484375, 12.669921875, 13.7001953125, 14.73046875, 15.7607421875, 16.791015625, 17.8212890625, 18.8515625, 19.8818359375, 20.912109375, 21.9423828125, 22.97265625, 24.0029296875, 25.033203125, 26.0634765625, 27.09375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 7.0, 10.0, 18.0, 43.0, 49.0, 96.0, 191.0, 408.0, 2452.0, 4183934.0, 5864.0, 586.0, 247.0, 152.0, 95.0, 31.0, 38.0, 26.0, 15.0, 8.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-142.75, -137.380859375, -132.01171875, -126.642578125, -121.2734375, -115.904296875, -110.53515625, -105.166015625, -99.796875, -94.427734375, -89.05859375, -83.689453125, -78.3203125, -72.951171875, -67.58203125, -62.212890625, -56.84375, -51.474609375, -46.10546875, -40.736328125, -35.3671875, -29.998046875, -24.62890625, -19.259765625, -13.890625, -8.521484375, -3.15234375, 2.216796875, 7.5859375, 12.955078125, 18.32421875, 23.693359375, 29.0625, 34.431640625, 39.80078125, 45.169921875, 50.5390625, 55.908203125, 61.27734375, 66.646484375, 72.015625, 77.384765625, 82.75390625, 88.123046875, 93.4921875, 98.861328125, 104.23046875, 109.599609375, 114.96875, 120.337890625, 125.70703125, 131.076171875, 136.4453125, 141.814453125, 147.18359375, 152.552734375, 157.921875, 163.291015625, 168.66015625, 174.029296875, 179.3984375, 184.767578125, 190.13671875, 195.505859375, 200.875]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 36.0, 767.0, 214.0, 2.0, 0.0, 0.0, 2.0], "bins": [-705.835693359375, -693.8153686523438, -681.7950439453125, -669.7747192382812, -657.75439453125, -645.7340698242188, -633.7137451171875, -621.6934204101562, -609.673095703125, -597.6527709960938, -585.6324462890625, -573.6121215820312, -561.591796875, -549.5714721679688, -537.5511474609375, -525.5308227539062, -513.510498046875, -501.49017333984375, -489.4698486328125, -477.44952392578125, -465.42919921875, -453.40887451171875, -441.3885498046875, -429.36822509765625, -417.3479309082031, -405.3276062011719, -393.3072814941406, -381.2869567871094, -369.2666320800781, -357.2463073730469, -345.2259826660156, -333.2056579589844, -321.1853332519531, -309.1650085449219, -297.1446838378906, -285.1243591308594, -273.1040344238281, -261.0837097167969, -249.06338500976562, -237.04306030273438, -225.02273559570312, -213.00241088867188, -200.98208618164062, -188.96176147460938, -176.94143676757812, -164.92111206054688, -152.90078735351562, -140.88046264648438, -128.86013793945312, -116.83981323242188, -104.81948852539062, -92.79916381835938, -80.77883911132812, -68.75851440429688, -56.738197326660156, -44.717872619628906, -32.69755554199219, -20.677230834960938, -8.65690803527832, 3.363414764404297, 15.383739471435547, 27.404064178466797, 39.42438507080078, 51.44470977783203, 63.46503448486328]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 8.0, 8.0, 10.0, 13.0, 8.0, 12.0, 15.0, 15.0, 21.0, 16.0, 21.0, 34.0, 22.0, 28.0, 44.0, 25.0, 39.0, 36.0, 37.0, 46.0, 50.0, 45.0, 43.0, 32.0, 40.0, 36.0, 33.0, 42.0, 27.0, 30.0, 29.0, 16.0, 15.0, 27.0, 13.0, 14.0, 10.0, 16.0, 2.0, 4.0, 3.0, 5.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-80.68278503417969, -78.1534423828125, -75.62409973144531, -73.09475708007812, -70.56542205810547, -68.03607940673828, -65.5067367553711, -62.977394104003906, -60.44805145263672, -57.91870880126953, -55.38936996459961, -52.86002731323242, -50.330684661865234, -47.80134582519531, -45.272003173828125, -42.74266052246094, -40.213321685791016, -37.68397903442383, -35.154640197753906, -32.62529754638672, -30.09595489501953, -27.566614151000977, -25.037273406982422, -22.507930755615234, -19.97859001159668, -17.449249267578125, -14.919906616210938, -12.390565872192383, -9.861224174499512, -7.331882476806641, -4.802541732788086, -2.2731990814208984, 0.25614166259765625, 2.7854831218719482, 5.31482458114624, 7.844165802001953, 10.373507499694824, 12.902849197387695, 15.43218994140625, 17.961532592773438, 20.490873336791992, 23.020214080810547, 25.549556732177734, 28.07889747619629, 30.608238220214844, 33.13758087158203, 35.66692352294922, 38.196266174316406, 40.72560501098633, 43.254947662353516, 45.78428649902344, 48.313629150390625, 50.84297180175781, 53.372314453125, 55.90165328979492, 58.43099594116211, 60.96033477783203, 63.48967742919922, 66.0190200805664, 68.54835510253906, 71.07769775390625, 73.60704040527344, 76.13638305664062, 78.66572570800781, 81.195068359375]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 6.0, 3.0, 1.0, 6.0, 11.0, 9.0, 9.0, 10.0, 16.0, 30.0, 16.0, 20.0, 30.0, 29.0, 25.0, 26.0, 24.0, 28.0, 33.0, 42.0, 33.0, 24.0, 43.0, 52.0, 45.0, 35.0, 43.0, 47.0, 40.0, 30.0, 33.0, 24.0, 29.0, 26.0, 21.0, 27.0, 17.0, 12.0, 14.0, 5.0, 8.0, 4.0, 6.0, 4.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.3203125, -4.1805419921875, -4.040771484375, -3.9010009765625, -3.76123046875, -3.6214599609375, -3.481689453125, -3.3419189453125, -3.2021484375, -3.0623779296875, -2.922607421875, -2.7828369140625, -2.64306640625, -2.5032958984375, -2.363525390625, -2.2237548828125, -2.083984375, -1.9442138671875, -1.804443359375, -1.6646728515625, -1.52490234375, -1.3851318359375, -1.245361328125, -1.1055908203125, -0.9658203125, -0.8260498046875, -0.686279296875, -0.5465087890625, -0.40673828125, -0.2669677734375, -0.127197265625, 0.0125732421875, 0.15234375, 0.2921142578125, 0.431884765625, 0.5716552734375, 0.71142578125, 0.8511962890625, 0.990966796875, 1.1307373046875, 1.2705078125, 1.4102783203125, 1.550048828125, 1.6898193359375, 1.82958984375, 1.9693603515625, 2.109130859375, 2.2489013671875, 2.388671875, 2.5284423828125, 2.668212890625, 2.8079833984375, 2.94775390625, 3.0875244140625, 3.227294921875, 3.3670654296875, 3.5068359375, 3.6466064453125, 3.786376953125, 3.9261474609375, 4.06591796875, 4.2056884765625, 4.345458984375, 4.4852294921875, 4.625]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 4.0, 12.0, 24.0, 37.0, 47.0, 71.0, 105.0, 172.0, 245.0, 411.0, 609.0, 886.0, 1330.0, 2060.0, 3077.0, 4525.0, 6993.0, 10788.0, 15831.0, 24279.0, 37128.0, 56181.0, 86655.0, 133351.0, 194549.0, 163021.0, 106120.0, 68098.0, 44849.0, 29789.0, 19468.0, 12675.0, 8638.0, 5646.0, 3746.0, 2398.0, 1629.0, 1049.0, 724.0, 495.0, 302.0, 196.0, 125.0, 65.0, 52.0, 36.0, 31.0, 12.0, 9.0, 8.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.4775390625, -0.4624900817871094, -0.44744110107421875, -0.4323921203613281, -0.4173431396484375, -0.4022941589355469, -0.38724517822265625, -0.3721961975097656, -0.357147216796875, -0.3420982360839844, -0.32704925537109375, -0.3120002746582031, -0.2969512939453125, -0.2819023132324219, -0.26685333251953125, -0.2518043518066406, -0.23675537109375, -0.22170639038085938, -0.20665740966796875, -0.19160842895507812, -0.1765594482421875, -0.16151046752929688, -0.14646148681640625, -0.13141250610351562, -0.116363525390625, -0.10131454467773438, -0.08626556396484375, -0.07121658325195312, -0.0561676025390625, -0.041118621826171875, -0.02606964111328125, -0.011020660400390625, 0.0040283203125, 0.019077301025390625, 0.03412628173828125, 0.049175262451171875, 0.0642242431640625, 0.07927322387695312, 0.09432220458984375, 0.10937118530273438, 0.124420166015625, 0.13946914672851562, 0.15451812744140625, 0.16956710815429688, 0.1846160888671875, 0.19966506958007812, 0.21471405029296875, 0.22976303100585938, 0.24481201171875, 0.2598609924316406, 0.27490997314453125, 0.2899589538574219, 0.3050079345703125, 0.3200569152832031, 0.33510589599609375, 0.3501548767089844, 0.365203857421875, 0.3802528381347656, 0.39530181884765625, 0.4103507995605469, 0.4253997802734375, 0.4404487609863281, 0.45549774169921875, 0.4705467224121094, 0.485595703125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 4.0, 11.0, 12.0, 9.0, 14.0, 21.0, 20.0, 19.0, 24.0, 22.0, 24.0, 29.0, 36.0, 37.0, 41.0, 54.0, 33.0, 40.0, 1064.0, 45.0, 34.0, 36.0, 35.0, 35.0, 29.0, 32.0, 29.0, 21.0, 35.0, 23.0, 22.0, 14.0, 14.0, 16.0, 18.0, 7.0, 11.0, 7.0, 7.0, 12.0, 2.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-2.8046875, -2.721282958984375, -2.63787841796875, -2.554473876953125, -2.4710693359375, -2.387664794921875, -2.30426025390625, -2.220855712890625, -2.137451171875, -2.054046630859375, -1.97064208984375, -1.887237548828125, -1.8038330078125, -1.720428466796875, -1.63702392578125, -1.553619384765625, -1.47021484375, -1.386810302734375, -1.30340576171875, -1.220001220703125, -1.1365966796875, -1.053192138671875, -0.96978759765625, -0.886383056640625, -0.802978515625, -0.719573974609375, -0.63616943359375, -0.552764892578125, -0.4693603515625, -0.385955810546875, -0.30255126953125, -0.219146728515625, -0.1357421875, -0.052337646484375, 0.03106689453125, 0.114471435546875, 0.1978759765625, 0.281280517578125, 0.36468505859375, 0.448089599609375, 0.531494140625, 0.614898681640625, 0.69830322265625, 0.781707763671875, 0.8651123046875, 0.948516845703125, 1.03192138671875, 1.115325927734375, 1.19873046875, 1.282135009765625, 1.36553955078125, 1.448944091796875, 1.5323486328125, 1.615753173828125, 1.69915771484375, 1.782562255859375, 1.865966796875, 1.949371337890625, 2.03277587890625, 2.116180419921875, 2.1995849609375, 2.282989501953125, 2.36639404296875, 2.449798583984375, 2.533203125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 15.0, 19.0, 20.0, 45.0, 38.0, 48.0, 94.0, 141.0, 187.0, 240.0, 339.0, 520.0, 753.0, 1065.0, 1619.0, 2135.0, 3149.0, 4770.0, 7041.0, 10459.0, 15949.0, 24494.0, 37731.0, 58067.0, 91780.0, 146534.0, 1249415.0, 158744.0, 99286.0, 63209.0, 40182.0, 26353.0, 17359.0, 11362.0, 7652.0, 5005.0, 3501.0, 2411.0, 1627.0, 1088.0, 807.0, 526.0, 402.0, 285.0, 200.0, 131.0, 95.0, 69.0, 49.0, 55.0, 24.0, 10.0, 8.0, 11.0, 9.0, 3.0, 4.0], "bins": [-0.438720703125, -0.4256591796875, -0.41259765625, -0.3995361328125, -0.386474609375, -0.3734130859375, -0.3603515625, -0.3472900390625, -0.334228515625, -0.3211669921875, -0.30810546875, -0.2950439453125, -0.281982421875, -0.2689208984375, -0.255859375, -0.2427978515625, -0.229736328125, -0.2166748046875, -0.20361328125, -0.1905517578125, -0.177490234375, -0.1644287109375, -0.1513671875, -0.1383056640625, -0.125244140625, -0.1121826171875, -0.09912109375, -0.0860595703125, -0.072998046875, -0.0599365234375, -0.046875, -0.0338134765625, -0.020751953125, -0.0076904296875, 0.00537109375, 0.0184326171875, 0.031494140625, 0.0445556640625, 0.0576171875, 0.0706787109375, 0.083740234375, 0.0968017578125, 0.10986328125, 0.1229248046875, 0.135986328125, 0.1490478515625, 0.162109375, 0.1751708984375, 0.188232421875, 0.2012939453125, 0.21435546875, 0.2274169921875, 0.240478515625, 0.2535400390625, 0.2666015625, 0.2796630859375, 0.292724609375, 0.3057861328125, 0.31884765625, 0.3319091796875, 0.344970703125, 0.3580322265625, 0.37109375, 0.3841552734375, 0.397216796875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 7.0, 7.0, 10.0, 10.0, 14.0, 25.0, 28.0, 29.0, 31.0, 50.0, 53.0, 66.0, 70.0, 70.0, 76.0, 71.0, 55.0, 47.0, 42.0, 41.0, 30.0, 33.0, 27.0, 26.0, 18.0, 16.0, 8.0, 5.0, 7.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0020904541015625, -0.0020299404859542847, -0.0019694268703460693, -0.001908913254737854, -0.0018483996391296387, -0.0017878860235214233, -0.001727372407913208, -0.0016668587923049927, -0.0016063451766967773, -0.001545831561088562, -0.0014853179454803467, -0.0014248043298721313, -0.001364290714263916, -0.0013037770986557007, -0.0012432634830474854, -0.00118274986743927, -0.0011222362518310547, -0.0010617226362228394, -0.001001209020614624, -0.0009406954050064087, -0.0008801817893981934, -0.000819668173789978, -0.0007591545581817627, -0.0006986409425735474, -0.000638127326965332, -0.0005776137113571167, -0.0005171000957489014, -0.00045658648014068604, -0.0003960728645324707, -0.00033555924892425537, -0.00027504563331604004, -0.0002145320177078247, -0.00015401840209960938, -9.350478649139404e-05, -3.299117088317871e-05, 2.752244472503662e-05, 8.803606033325195e-05, 0.00014854967594146729, 0.00020906329154968262, 0.00026957690715789795, 0.0003300905227661133, 0.0003906041383743286, 0.00045111775398254395, 0.0005116313695907593, 0.0005721449851989746, 0.0006326586008071899, 0.0006931722164154053, 0.0007536858320236206, 0.0008141994476318359, 0.0008747130632400513, 0.0009352266788482666, 0.000995740294456482, 0.0010562539100646973, 0.0011167675256729126, 0.001177281141281128, 0.0012377947568893433, 0.0012983083724975586, 0.001358821988105774, 0.0014193356037139893, 0.0014798492193222046, 0.00154036283493042, 0.0016008764505386353, 0.0016613900661468506, 0.001721903681755066, 0.0017824172973632812]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 4.0, 5.0, 7.0, 12.0, 22.0, 16.0, 26.0, 32.0, 38.0, 49.0, 113.0, 129.0, 302.0, 722.0, 875622.0, 170009.0, 655.0, 310.0, 170.0, 79.0, 57.0, 41.0, 37.0, 19.0, 13.0, 13.0, 13.0, 3.0, 11.0, 6.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.057373046875, -0.05557727813720703, -0.05378150939941406, -0.051985740661621094, -0.050189971923828125, -0.048394203186035156, -0.04659843444824219, -0.04480266571044922, -0.04300689697265625, -0.04121112823486328, -0.03941535949707031, -0.037619590759277344, -0.035823822021484375, -0.034028053283691406, -0.03223228454589844, -0.03043651580810547, -0.0286407470703125, -0.02684497833251953, -0.025049209594726562, -0.023253440856933594, -0.021457672119140625, -0.019661903381347656, -0.017866134643554688, -0.01607036590576172, -0.01427459716796875, -0.012478828430175781, -0.010683059692382812, -0.008887290954589844, -0.007091522216796875, -0.005295753479003906, -0.0034999847412109375, -0.0017042160034179688, 9.1552734375e-05, 0.0018873214721679688, 0.0036830902099609375, 0.005478858947753906, 0.007274627685546875, 0.009070396423339844, 0.010866165161132812, 0.012661933898925781, 0.01445770263671875, 0.01625347137451172, 0.018049240112304688, 0.019845008850097656, 0.021640777587890625, 0.023436546325683594, 0.025232315063476562, 0.02702808380126953, 0.0288238525390625, 0.03061962127685547, 0.03241539001464844, 0.034211158752441406, 0.036006927490234375, 0.037802696228027344, 0.03959846496582031, 0.04139423370361328, 0.04319000244140625, 0.04498577117919922, 0.04678153991699219, 0.048577308654785156, 0.050373077392578125, 0.052168846130371094, 0.05396461486816406, 0.05576038360595703, 0.05755615234375]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 13.0, 68.0, 289.0, 392.0, 191.0, 46.0, 9.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008266618242487311, -0.0007598712691105902, -0.0006930807139724493, -0.0006262901006266475, -0.0005594996036961675, -0.0004927089903503656, -0.0004259184352122247, -0.0003591278800740838, -0.0002923373249359429, -0.00022554676979780197, -0.00015875620010774583, -9.196563041768968e-05, -2.5175075279548764e-05, 4.161547985859215e-05, 0.00010840606410056353, 0.00017519661923870444, 0.00024198717437684536, 0.0003087777295149863, 0.0003755682846531272, 0.00044235886889509857, 0.000509149394929409, 0.0005759400082752109, 0.0006427305634133518, 0.0007095211185514927, 0.0007763116736896336, 0.0008431022288277745, 0.0009098927839659154, 0.0009766833391040564, 0.0010434739524498582, 0.0011102644493803382, 0.00117705506272614, 0.00124384555965662, 0.0013106360565871, 0.0013774266699329019, 0.0014442171668633819, 0.0015110077802091837, 0.0015777982771396637, 0.0016445888904854655, 0.0017113795038312674, 0.0017781700007617474, 0.0018449604976922274, 0.0019117511110380292, 0.001978541724383831, 0.002045332221314311, 0.002112122718244791, 0.002178913215175271, 0.0022457039449363947, 0.0023124944418668747, 0.0023792851716279984, 0.0024460756685584784, 0.002512866398319602, 0.002579656895250082, 0.002646447392180562, 0.002713237889111042, 0.0027800286188721657, 0.0028468191158026457, 0.0029136096127331257, 0.0029804001096636057, 0.0030471908394247293, 0.0031139813363552094, 0.0031807718332856894, 0.0032475623302161694, 0.003314353059977293, 0.003381143556907773, 0.003447934053838253]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 12.0, 5.0, 10.0, 13.0, 15.0, 8.0, 21.0, 15.0, 14.0, 43.0, 33.0, 31.0, 25.0, 20.0, 37.0, 33.0, 45.0, 43.0, 36.0, 43.0, 48.0, 47.0, 45.0, 39.0, 27.0, 31.0, 37.0, 29.0, 23.0, 35.0, 22.0, 21.0, 11.0, 16.0, 10.0, 9.0, 15.0, 8.0, 6.0, 7.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0009709000587463379, -0.0009409431368112564, -0.0009109862148761749, -0.0008810292929410934, -0.000851072371006012, -0.0008211154490709305, -0.000791158527135849, -0.0007612016052007675, -0.000731244683265686, -0.0007012877613306046, -0.0006713308393955231, -0.0006413739174604416, -0.0006114169955253601, -0.0005814600735902786, -0.0005515031516551971, -0.0005215462297201157, -0.0004915893077850342, -0.0004616323858499527, -0.0004316754639148712, -0.00040171854197978973, -0.00037176162004470825, -0.00034180469810962677, -0.0003118477761745453, -0.0002818908542394638, -0.0002519339323043823, -0.00022197701036930084, -0.00019202008843421936, -0.00016206316649913788, -0.0001321062445640564, -0.00010214932262897491, -7.219240069389343e-05, -4.223547875881195e-05, -1.2278556823730469e-05, 1.7678365111351013e-05, 4.7635287046432495e-05, 7.759220898151398e-05, 0.00010754913091659546, 0.00013750605285167694, 0.00016746297478675842, 0.0001974198967218399, 0.0002273768186569214, 0.00025733374059200287, 0.00028729066252708435, 0.00031724758446216583, 0.0003472045063972473, 0.0003771614283323288, 0.0004071183502674103, 0.00043707527220249176, 0.00046703219413757324, 0.0004969891160726547, 0.0005269460380077362, 0.0005569029599428177, 0.0005868598818778992, 0.0006168168038129807, 0.0006467737257480621, 0.0006767306476831436, 0.0007066875696182251, 0.0007366444915533066, 0.0007666014134883881, 0.0007965583354234695, 0.000826515257358551, 0.0008564721792936325, 0.000886429101228714, 0.0009163860231637955, 0.000946342945098877]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 6.0, 3.0, 1.0, 6.0, 11.0, 9.0, 9.0, 10.0, 16.0, 30.0, 16.0, 20.0, 30.0, 29.0, 25.0, 26.0, 24.0, 28.0, 33.0, 42.0, 33.0, 24.0, 43.0, 52.0, 45.0, 35.0, 43.0, 47.0, 40.0, 30.0, 33.0, 24.0, 29.0, 26.0, 21.0, 27.0, 17.0, 12.0, 14.0, 5.0, 8.0, 4.0, 6.0, 4.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.3203125, -4.1805419921875, -4.040771484375, -3.9010009765625, -3.76123046875, -3.6214599609375, -3.481689453125, -3.3419189453125, -3.2021484375, -3.0623779296875, -2.922607421875, -2.7828369140625, -2.64306640625, -2.5032958984375, -2.363525390625, -2.2237548828125, -2.083984375, -1.9442138671875, -1.804443359375, -1.6646728515625, -1.52490234375, -1.3851318359375, -1.245361328125, -1.1055908203125, -0.9658203125, -0.8260498046875, -0.686279296875, -0.5465087890625, -0.40673828125, -0.2669677734375, -0.127197265625, 0.0125732421875, 0.15234375, 0.2921142578125, 0.431884765625, 0.5716552734375, 0.71142578125, 0.8511962890625, 0.990966796875, 1.1307373046875, 1.2705078125, 1.4102783203125, 1.550048828125, 1.6898193359375, 1.82958984375, 1.9693603515625, 2.109130859375, 2.2489013671875, 2.388671875, 2.5284423828125, 2.668212890625, 2.8079833984375, 2.94775390625, 3.0875244140625, 3.227294921875, 3.3670654296875, 3.5068359375, 3.6466064453125, 3.786376953125, 3.9261474609375, 4.06591796875, 4.2056884765625, 4.345458984375, 4.4852294921875, 4.625]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 6.0, 6.0, 9.0, 7.0, 20.0, 22.0, 22.0, 39.0, 44.0, 70.0, 95.0, 110.0, 154.0, 246.0, 344.0, 480.0, 820.0, 1445.0, 2948.0, 6948.0, 18469.0, 55186.0, 187165.0, 461940.0, 213692.0, 62456.0, 20478.0, 7829.0, 3315.0, 1594.0, 882.0, 517.0, 360.0, 208.0, 183.0, 124.0, 92.0, 61.0, 49.0, 36.0, 25.0, 15.0, 18.0, 7.0, 7.0, 6.0, 5.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.05859375, -3.9212646484375, -3.783935546875, -3.6466064453125, -3.50927734375, -3.3719482421875, -3.234619140625, -3.0972900390625, -2.9599609375, -2.8226318359375, -2.685302734375, -2.5479736328125, -2.41064453125, -2.2733154296875, -2.135986328125, -1.9986572265625, -1.861328125, -1.7239990234375, -1.586669921875, -1.4493408203125, -1.31201171875, -1.1746826171875, -1.037353515625, -0.9000244140625, -0.7626953125, -0.6253662109375, -0.488037109375, -0.3507080078125, -0.21337890625, -0.0760498046875, 0.061279296875, 0.1986083984375, 0.3359375, 0.4732666015625, 0.610595703125, 0.7479248046875, 0.88525390625, 1.0225830078125, 1.159912109375, 1.2972412109375, 1.4345703125, 1.5718994140625, 1.709228515625, 1.8465576171875, 1.98388671875, 2.1212158203125, 2.258544921875, 2.3958740234375, 2.533203125, 2.6705322265625, 2.807861328125, 2.9451904296875, 3.08251953125, 3.2198486328125, 3.357177734375, 3.4945068359375, 3.6318359375, 3.7691650390625, 3.906494140625, 4.0438232421875, 4.18115234375, 4.3184814453125, 4.455810546875, 4.5931396484375, 4.73046875]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 5.0, 7.0, 6.0, 6.0, 13.0, 9.0, 17.0, 16.0, 13.0, 18.0, 22.0, 29.0, 20.0, 21.0, 28.0, 41.0, 26.0, 39.0, 52.0, 51.0, 165.0, 1704.0, 244.0, 75.0, 52.0, 44.0, 38.0, 26.0, 36.0, 29.0, 36.0, 22.0, 31.0, 14.0, 18.0, 18.0, 12.0, 10.0, 9.0, 8.0, 3.0, 9.0, 5.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-15.15625, -14.677001953125, -14.19775390625, -13.718505859375, -13.2392578125, -12.760009765625, -12.28076171875, -11.801513671875, -11.322265625, -10.843017578125, -10.36376953125, -9.884521484375, -9.4052734375, -8.926025390625, -8.44677734375, -7.967529296875, -7.48828125, -7.009033203125, -6.52978515625, -6.050537109375, -5.5712890625, -5.092041015625, -4.61279296875, -4.133544921875, -3.654296875, -3.175048828125, -2.69580078125, -2.216552734375, -1.7373046875, -1.258056640625, -0.77880859375, -0.299560546875, 0.1796875, 0.658935546875, 1.13818359375, 1.617431640625, 2.0966796875, 2.575927734375, 3.05517578125, 3.534423828125, 4.013671875, 4.492919921875, 4.97216796875, 5.451416015625, 5.9306640625, 6.409912109375, 6.88916015625, 7.368408203125, 7.84765625, 8.326904296875, 8.80615234375, 9.285400390625, 9.7646484375, 10.243896484375, 10.72314453125, 11.202392578125, 11.681640625, 12.160888671875, 12.64013671875, 13.119384765625, 13.5986328125, 14.077880859375, 14.55712890625, 15.036376953125, 15.515625]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 3.0, 6.0, 3.0, 8.0, 14.0, 10.0, 10.0, 20.0, 15.0, 22.0, 31.0, 30.0, 37.0, 42.0, 61.0, 67.0, 116.0, 244.0, 515.0, 2018.0, 282653.0, 2855070.0, 3233.0, 648.0, 279.0, 144.0, 83.0, 60.0, 43.0, 33.0, 32.0, 25.0, 23.0, 17.0, 13.0, 15.0, 16.0, 7.0, 11.0, 7.0, 7.0, 5.0, 4.0, 0.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-35.40625, -34.3037109375, -33.201171875, -32.0986328125, -30.99609375, -29.8935546875, -28.791015625, -27.6884765625, -26.5859375, -25.4833984375, -24.380859375, -23.2783203125, -22.17578125, -21.0732421875, -19.970703125, -18.8681640625, -17.765625, -16.6630859375, -15.560546875, -14.4580078125, -13.35546875, -12.2529296875, -11.150390625, -10.0478515625, -8.9453125, -7.8427734375, -6.740234375, -5.6376953125, -4.53515625, -3.4326171875, -2.330078125, -1.2275390625, -0.125, 0.9775390625, 2.080078125, 3.1826171875, 4.28515625, 5.3876953125, 6.490234375, 7.5927734375, 8.6953125, 9.7978515625, 10.900390625, 12.0029296875, 13.10546875, 14.2080078125, 15.310546875, 16.4130859375, 17.515625, 18.6181640625, 19.720703125, 20.8232421875, 21.92578125, 23.0283203125, 24.130859375, 25.2333984375, 26.3359375, 27.4384765625, 28.541015625, 29.6435546875, 30.74609375, 31.8486328125, 32.951171875, 34.0537109375, 35.15625]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [2.0, 1.0, 78.0, 923.0, 15.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.770471572875977, -9.697038650512695, -5.623604774475098, -1.5501708984375, 2.5232620239257812, 6.5966949462890625, 10.670129776000977, 14.743562698364258, 18.81699562072754, 22.89042854309082, 26.963863372802734, 31.037296295166016, 35.1107292175293, 39.18416213989258, 43.257598876953125, 47.331031799316406, 51.40446472167969, 55.47789764404297, 59.55133056640625, 63.62476348876953, 67.69819641113281, 71.7716293334961, 75.84506225585938, 79.91850280761719, 83.99192810058594, 88.06536102294922, 92.1387939453125, 96.21222686767578, 100.28565979003906, 104.35909271240234, 108.43252563476562, 112.50596618652344, 116.57939147949219, 120.65282440185547, 124.72625732421875, 128.79969787597656, 132.8731231689453, 136.94656372070312, 141.01998901367188, 145.0934295654297, 149.16685485839844, 153.24029541015625, 157.313720703125, 161.3871612548828, 165.46058654785156, 169.53402709960938, 173.60745239257812, 177.68089294433594, 181.75433349609375, 185.82777404785156, 189.9011993408203, 193.97463989257812, 198.04806518554688, 202.1215057373047, 206.19493103027344, 210.26837158203125, 214.341796875, 218.4152374267578, 222.48866271972656, 226.56210327148438, 230.63552856445312, 234.70896911621094, 238.7823944091797, 242.8558349609375, 246.92926025390625]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 3.0, 3.0, 2.0, 3.0, 7.0, 6.0, 8.0, 9.0, 12.0, 11.0, 10.0, 13.0, 19.0, 26.0, 24.0, 36.0, 23.0, 37.0, 38.0, 43.0, 44.0, 43.0, 45.0, 43.0, 38.0, 39.0, 39.0, 49.0, 42.0, 32.0, 31.0, 34.0, 22.0, 24.0, 24.0, 18.0, 18.0, 13.0, 15.0, 13.0, 9.0, 10.0, 6.0, 7.0, 6.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-47.40852355957031, -45.94264221191406, -44.47676086425781, -43.01087951660156, -41.54499816894531, -40.07911682128906, -38.61323547363281, -37.1473503112793, -35.68146896362305, -34.2155876159668, -32.74970626831055, -31.283824920654297, -29.817941665649414, -28.352060317993164, -26.886178970336914, -25.42029571533203, -23.954416275024414, -22.488534927368164, -21.022653579711914, -19.55677032470703, -18.09088897705078, -16.62500762939453, -15.159126281738281, -13.693243980407715, -12.227362632751465, -10.761481285095215, -9.295598983764648, -7.829717636108398, -6.36383581161499, -4.897953987121582, -3.432072639465332, -1.9661903381347656, -0.5003089904785156, 0.965572714805603, 2.4314544200897217, 3.897336006164551, 5.363217830657959, 6.829099655151367, 8.294981002807617, 9.760863304138184, 11.226744651794434, 12.692625999450684, 14.15850830078125, 15.6243896484375, 17.09027099609375, 18.55615234375, 20.02203369140625, 21.487916946411133, 22.953798294067383, 24.419679641723633, 25.885560989379883, 27.351444244384766, 28.817325592041016, 30.283206939697266, 31.749088287353516, 33.214969635009766, 34.680850982666016, 36.146732330322266, 37.612613677978516, 39.078495025634766, 40.544376373291016, 42.01026153564453, 43.47614288330078, 44.94202423095703, 46.40790557861328]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 6.0, 5.0, 7.0, 10.0, 6.0, 10.0, 14.0, 15.0, 22.0, 18.0, 34.0, 23.0, 28.0, 27.0, 21.0, 33.0, 32.0, 29.0, 47.0, 34.0, 36.0, 43.0, 50.0, 41.0, 38.0, 50.0, 42.0, 34.0, 31.0, 38.0, 23.0, 25.0, 28.0, 22.0, 25.0, 11.0, 10.0, 7.0, 8.0, 4.0, 6.0, 7.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.64453125, -4.496826171875, -4.34912109375, -4.201416015625, -4.0537109375, -3.906005859375, -3.75830078125, -3.610595703125, -3.462890625, -3.315185546875, -3.16748046875, -3.019775390625, -2.8720703125, -2.724365234375, -2.57666015625, -2.428955078125, -2.28125, -2.133544921875, -1.98583984375, -1.838134765625, -1.6904296875, -1.542724609375, -1.39501953125, -1.247314453125, -1.099609375, -0.951904296875, -0.80419921875, -0.656494140625, -0.5087890625, -0.361083984375, -0.21337890625, -0.065673828125, 0.08203125, 0.229736328125, 0.37744140625, 0.525146484375, 0.6728515625, 0.820556640625, 0.96826171875, 1.115966796875, 1.263671875, 1.411376953125, 1.55908203125, 1.706787109375, 1.8544921875, 2.002197265625, 2.14990234375, 2.297607421875, 2.4453125, 2.593017578125, 2.74072265625, 2.888427734375, 3.0361328125, 3.183837890625, 3.33154296875, 3.479248046875, 3.626953125, 3.774658203125, 3.92236328125, 4.070068359375, 4.2177734375, 4.365478515625, 4.51318359375, 4.660888671875, 4.80859375]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 4.0, 3.0, 4.0, 7.0, 6.0, 13.0, 15.0, 15.0, 21.0, 22.0, 22.0, 44.0, 47.0, 57.0, 89.0, 130.0, 210.0, 392.0, 978.0, 4148.0, 28999.0, 423687.0, 2990239.0, 694952.0, 42176.0, 5569.0, 1240.0, 435.0, 238.0, 136.0, 102.0, 76.0, 50.0, 23.0, 36.0, 17.0, 15.0, 12.0, 11.0, 10.0, 11.0, 8.0, 4.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.703125, -13.2236328125, -12.744140625, -12.2646484375, -11.78515625, -11.3056640625, -10.826171875, -10.3466796875, -9.8671875, -9.3876953125, -8.908203125, -8.4287109375, -7.94921875, -7.4697265625, -6.990234375, -6.5107421875, -6.03125, -5.5517578125, -5.072265625, -4.5927734375, -4.11328125, -3.6337890625, -3.154296875, -2.6748046875, -2.1953125, -1.7158203125, -1.236328125, -0.7568359375, -0.27734375, 0.2021484375, 0.681640625, 1.1611328125, 1.640625, 2.1201171875, 2.599609375, 3.0791015625, 3.55859375, 4.0380859375, 4.517578125, 4.9970703125, 5.4765625, 5.9560546875, 6.435546875, 6.9150390625, 7.39453125, 7.8740234375, 8.353515625, 8.8330078125, 9.3125, 9.7919921875, 10.271484375, 10.7509765625, 11.23046875, 11.7099609375, 12.189453125, 12.6689453125, 13.1484375, 13.6279296875, 14.107421875, 14.5869140625, 15.06640625, 15.5458984375, 16.025390625, 16.5048828125, 16.984375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 7.0, 11.0, 11.0, 16.0, 23.0, 27.0, 27.0, 64.0, 51.0, 95.0, 134.0, 186.0, 246.0, 344.0, 399.0, 466.0, 479.0, 375.0, 304.0, 225.0, 136.0, 117.0, 91.0, 69.0, 39.0, 31.0, 35.0, 14.0, 4.0, 13.0, 11.0, 7.0, 4.0, 6.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-19.65625, -19.1231689453125, -18.590087890625, -18.0570068359375, -17.52392578125, -16.9908447265625, -16.457763671875, -15.9246826171875, -15.3916015625, -14.8585205078125, -14.325439453125, -13.7923583984375, -13.25927734375, -12.7261962890625, -12.193115234375, -11.6600341796875, -11.126953125, -10.5938720703125, -10.060791015625, -9.5277099609375, -8.99462890625, -8.4615478515625, -7.928466796875, -7.3953857421875, -6.8623046875, -6.3292236328125, -5.796142578125, -5.2630615234375, -4.72998046875, -4.1968994140625, -3.663818359375, -3.1307373046875, -2.59765625, -2.0645751953125, -1.531494140625, -0.9984130859375, -0.46533203125, 0.0677490234375, 0.600830078125, 1.1339111328125, 1.6669921875, 2.2000732421875, 2.733154296875, 3.2662353515625, 3.79931640625, 4.3323974609375, 4.865478515625, 5.3985595703125, 5.931640625, 6.4647216796875, 6.997802734375, 7.5308837890625, 8.06396484375, 8.5970458984375, 9.130126953125, 9.6632080078125, 10.1962890625, 10.7293701171875, 11.262451171875, 11.7955322265625, 12.32861328125, 12.8616943359375, 13.394775390625, 13.9278564453125, 14.4609375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 6.0, 4.0, 18.0, 16.0, 22.0, 30.0, 51.0, 97.0, 111.0, 190.0, 362.0, 882.0, 8763.0, 4011956.0, 168810.0, 1754.0, 514.0, 230.0, 141.0, 111.0, 71.0, 51.0, 30.0, 14.0, 15.0, 18.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.9375, -54.5380859375, -52.138671875, -49.7392578125, -47.33984375, -44.9404296875, -42.541015625, -40.1416015625, -37.7421875, -35.3427734375, -32.943359375, -30.5439453125, -28.14453125, -25.7451171875, -23.345703125, -20.9462890625, -18.546875, -16.1474609375, -13.748046875, -11.3486328125, -8.94921875, -6.5498046875, -4.150390625, -1.7509765625, 0.6484375, 3.0478515625, 5.447265625, 7.8466796875, 10.24609375, 12.6455078125, 15.044921875, 17.4443359375, 19.84375, 22.2431640625, 24.642578125, 27.0419921875, 29.44140625, 31.8408203125, 34.240234375, 36.6396484375, 39.0390625, 41.4384765625, 43.837890625, 46.2373046875, 48.63671875, 51.0361328125, 53.435546875, 55.8349609375, 58.234375, 60.6337890625, 63.033203125, 65.4326171875, 67.83203125, 70.2314453125, 72.630859375, 75.0302734375, 77.4296875, 79.8291015625, 82.228515625, 84.6279296875, 87.02734375, 89.4267578125, 91.826171875, 94.2255859375, 96.625]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 34.0, 211.0, 509.0, 225.0, 30.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.22755432128906, -99.2098617553711, -93.19216918945312, -87.17448425292969, -81.15679168701172, -75.13909912109375, -69.12141418457031, -63.103721618652344, -57.086029052734375, -51.068336486816406, -45.0506477355957, -39.032958984375, -33.01526641845703, -26.997575759887695, -20.97988510131836, -14.962196350097656, -8.944503784179688, -2.9268131256103516, 3.0908775329589844, 9.10856819152832, 15.126258850097656, 21.143949508666992, 27.161640167236328, 33.17932891845703, 39.197021484375, 45.21471405029297, 51.23240280151367, 57.250091552734375, 63.267784118652344, 69.28547668457031, 75.30316162109375, 81.32085418701172, 87.33853149414062, 93.3562240600586, 99.37391662597656, 105.3916015625, 111.40929412841797, 117.42698669433594, 123.44467163085938, 129.46237182617188, 135.4800567626953, 141.49774169921875, 147.51544189453125, 153.5331268310547, 159.55081176757812, 165.56851196289062, 171.58619689941406, 177.6038818359375, 183.62158203125, 189.63926696777344, 195.65696716308594, 201.67465209960938, 207.69235229492188, 213.7100372314453, 219.72772216796875, 225.74542236328125, 231.7631072998047, 237.78079223632812, 243.79849243164062, 249.81617736816406, 255.8338623046875, 261.8515625, 267.8692626953125, 273.8869323730469, 279.9046325683594]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 5.0, 2.0, 9.0, 9.0, 12.0, 14.0, 15.0, 13.0, 26.0, 12.0, 21.0, 31.0, 19.0, 26.0, 36.0, 37.0, 37.0, 36.0, 48.0, 27.0, 37.0, 42.0, 45.0, 41.0, 46.0, 46.0, 36.0, 31.0, 35.0, 31.0, 20.0, 16.0, 14.0, 25.0, 20.0, 18.0, 13.0, 10.0, 9.0, 8.0, 6.0, 7.0, 2.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-59.109344482421875, -57.363704681396484, -55.618064880371094, -53.8724250793457, -52.12678527832031, -50.38114547729492, -48.63550567626953, -46.889869689941406, -45.14422607421875, -43.39858627319336, -41.65294647216797, -39.90730667114258, -38.16166687011719, -36.4160270690918, -34.670387268066406, -32.92475128173828, -31.17911148071289, -29.4334716796875, -27.68783187866211, -25.94219207763672, -24.196552276611328, -22.450912475585938, -20.70527458190918, -18.95963478088379, -17.2139949798584, -15.468355178833008, -13.722715377807617, -11.977076530456543, -10.231436729431152, -8.485796928405762, -6.7401580810546875, -4.994518280029297, -3.2488784790039062, -1.5032389163970947, 0.2424006462097168, 1.9880399703979492, 3.73367977142334, 5.4793195724487305, 7.224958419799805, 8.970598220825195, 10.716238021850586, 12.461877822875977, 14.207517623901367, 15.953156471252441, 17.698795318603516, 19.444435119628906, 21.190074920654297, 22.935714721679688, 24.681354522705078, 26.42699432373047, 28.17263412475586, 29.91827392578125, 31.66391372680664, 33.40955352783203, 35.155189514160156, 36.90083312988281, 38.64646911621094, 40.39210891723633, 42.13774871826172, 43.88338851928711, 45.6290283203125, 47.37466812133789, 49.12030792236328, 50.865943908691406, 52.61158752441406]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 6.0, 4.0, 6.0, 7.0, 9.0, 15.0, 6.0, 12.0, 15.0, 14.0, 21.0, 26.0, 29.0, 29.0, 33.0, 27.0, 30.0, 37.0, 36.0, 49.0, 48.0, 45.0, 42.0, 47.0, 39.0, 43.0, 38.0, 38.0, 32.0, 36.0, 40.0, 25.0, 33.0, 24.0, 13.0, 12.0, 13.0, 8.0, 10.0, 6.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3359375, -5.17401123046875, -5.0120849609375, -4.85015869140625, -4.688232421875, -4.52630615234375, -4.3643798828125, -4.20245361328125, -4.04052734375, -3.87860107421875, -3.7166748046875, -3.55474853515625, -3.392822265625, -3.23089599609375, -3.0689697265625, -2.90704345703125, -2.7451171875, -2.58319091796875, -2.4212646484375, -2.25933837890625, -2.097412109375, -1.93548583984375, -1.7735595703125, -1.61163330078125, -1.44970703125, -1.28778076171875, -1.1258544921875, -0.96392822265625, -0.802001953125, -0.64007568359375, -0.4781494140625, -0.31622314453125, -0.154296875, 0.00762939453125, 0.1695556640625, 0.33148193359375, 0.493408203125, 0.65533447265625, 0.8172607421875, 0.97918701171875, 1.14111328125, 1.30303955078125, 1.4649658203125, 1.62689208984375, 1.788818359375, 1.95074462890625, 2.1126708984375, 2.27459716796875, 2.4365234375, 2.59844970703125, 2.7603759765625, 2.92230224609375, 3.084228515625, 3.24615478515625, 3.4080810546875, 3.57000732421875, 3.73193359375, 3.89385986328125, 4.0557861328125, 4.21771240234375, 4.379638671875, 4.54156494140625, 4.7034912109375, 4.86541748046875, 5.02734375]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 8.0, 6.0, 6.0, 17.0, 19.0, 39.0, 70.0, 83.0, 130.0, 209.0, 317.0, 451.0, 666.0, 1083.0, 1615.0, 2527.0, 3690.0, 5767.0, 8675.0, 13183.0, 20189.0, 30854.0, 46008.0, 71113.0, 110651.0, 172175.0, 192349.0, 129064.0, 81814.0, 53140.0, 35018.0, 23204.0, 15112.0, 10069.0, 6630.0, 4233.0, 2840.0, 1862.0, 1303.0, 796.0, 535.0, 340.0, 246.0, 152.0, 98.0, 73.0, 44.0, 28.0, 27.0, 10.0, 9.0, 5.0, 2.0, 5.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.49609375, -0.4806709289550781, -0.46524810791015625, -0.4498252868652344, -0.4344024658203125, -0.4189796447753906, -0.40355682373046875, -0.3881340026855469, -0.372711181640625, -0.3572883605957031, -0.34186553955078125, -0.3264427185058594, -0.3110198974609375, -0.2955970764160156, -0.28017425537109375, -0.2647514343261719, -0.24932861328125, -0.23390579223632812, -0.21848297119140625, -0.20306015014648438, -0.1876373291015625, -0.17221450805664062, -0.15679168701171875, -0.14136886596679688, -0.125946044921875, -0.11052322387695312, -0.09510040283203125, -0.07967758178710938, -0.0642547607421875, -0.048831939697265625, -0.03340911865234375, -0.017986297607421875, -0.0025634765625, 0.012859344482421875, 0.02828216552734375, 0.043704986572265625, 0.0591278076171875, 0.07455062866210938, 0.08997344970703125, 0.10539627075195312, 0.120819091796875, 0.13624191284179688, 0.15166473388671875, 0.16708755493164062, 0.1825103759765625, 0.19793319702148438, 0.21335601806640625, 0.22877883911132812, 0.24420166015625, 0.2596244812011719, 0.27504730224609375, 0.2904701232910156, 0.3058929443359375, 0.3213157653808594, 0.33673858642578125, 0.3521614074707031, 0.367584228515625, 0.3830070495605469, 0.39842987060546875, 0.4138526916503906, 0.4292755126953125, 0.4446983337402344, 0.46012115478515625, 0.4755439758300781, 0.490966796875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 5.0, 3.0, 1.0, 4.0, 4.0, 8.0, 7.0, 9.0, 11.0, 6.0, 7.0, 17.0, 15.0, 22.0, 18.0, 33.0, 19.0, 36.0, 29.0, 22.0, 36.0, 25.0, 29.0, 33.0, 40.0, 26.0, 1064.0, 34.0, 45.0, 36.0, 42.0, 27.0, 36.0, 34.0, 38.0, 31.0, 22.0, 22.0, 17.0, 17.0, 18.0, 17.0, 16.0, 15.0, 6.0, 8.0, 7.0, 7.0, 8.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.673828125, -2.58270263671875, -2.4915771484375, -2.40045166015625, -2.309326171875, -2.21820068359375, -2.1270751953125, -2.03594970703125, -1.94482421875, -1.85369873046875, -1.7625732421875, -1.67144775390625, -1.580322265625, -1.48919677734375, -1.3980712890625, -1.30694580078125, -1.2158203125, -1.12469482421875, -1.0335693359375, -0.94244384765625, -0.851318359375, -0.76019287109375, -0.6690673828125, -0.57794189453125, -0.48681640625, -0.39569091796875, -0.3045654296875, -0.21343994140625, -0.122314453125, -0.03118896484375, 0.0599365234375, 0.15106201171875, 0.2421875, 0.33331298828125, 0.4244384765625, 0.51556396484375, 0.606689453125, 0.69781494140625, 0.7889404296875, 0.88006591796875, 0.97119140625, 1.06231689453125, 1.1534423828125, 1.24456787109375, 1.335693359375, 1.42681884765625, 1.5179443359375, 1.60906982421875, 1.7001953125, 1.79132080078125, 1.8824462890625, 1.97357177734375, 2.064697265625, 2.15582275390625, 2.2469482421875, 2.33807373046875, 2.42919921875, 2.52032470703125, 2.6114501953125, 2.70257568359375, 2.793701171875, 2.88482666015625, 2.9759521484375, 3.06707763671875, 3.158203125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 5.0, 6.0, 9.0, 5.0, 14.0, 23.0, 26.0, 50.0, 89.0, 110.0, 163.0, 213.0, 329.0, 456.0, 713.0, 1012.0, 1568.0, 2173.0, 3053.0, 4742.0, 6767.0, 10446.0, 15575.0, 23927.0, 36324.0, 56118.0, 87787.0, 140212.0, 1250196.0, 162999.0, 102405.0, 65279.0, 42382.0, 27546.0, 17967.0, 11900.0, 7942.0, 5310.0, 3584.0, 2410.0, 1590.0, 1141.0, 787.0, 539.0, 422.0, 265.0, 200.0, 114.0, 77.0, 61.0, 39.0, 30.0, 20.0, 10.0, 5.0, 8.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.42578125, -0.41143035888671875, -0.3970794677734375, -0.38272857666015625, -0.368377685546875, -0.35402679443359375, -0.3396759033203125, -0.32532501220703125, -0.31097412109375, -0.29662322998046875, -0.2822723388671875, -0.26792144775390625, -0.253570556640625, -0.23921966552734375, -0.2248687744140625, -0.21051788330078125, -0.1961669921875, -0.18181610107421875, -0.1674652099609375, -0.15311431884765625, -0.138763427734375, -0.12441253662109375, -0.1100616455078125, -0.09571075439453125, -0.08135986328125, -0.06700897216796875, -0.0526580810546875, -0.03830718994140625, -0.023956298828125, -0.00960540771484375, 0.0047454833984375, 0.01909637451171875, 0.033447265625, 0.04779815673828125, 0.0621490478515625, 0.07649993896484375, 0.090850830078125, 0.10520172119140625, 0.1195526123046875, 0.13390350341796875, 0.14825439453125, 0.16260528564453125, 0.1769561767578125, 0.19130706787109375, 0.205657958984375, 0.22000885009765625, 0.2343597412109375, 0.24871063232421875, 0.2630615234375, 0.27741241455078125, 0.2917633056640625, 0.30611419677734375, 0.320465087890625, 0.33481597900390625, 0.3491668701171875, 0.36351776123046875, 0.37786865234375, 0.39221954345703125, 0.4065704345703125, 0.42092132568359375, 0.435272216796875, 0.44962310791015625, 0.4639739990234375, 0.47832489013671875, 0.49267578125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 7.0, 4.0, 9.0, 6.0, 7.0, 14.0, 18.0, 19.0, 25.0, 20.0, 48.0, 40.0, 53.0, 61.0, 93.0, 68.0, 73.0, 84.0, 76.0, 59.0, 34.0, 29.0, 36.0, 28.0, 18.0, 16.0, 7.0, 10.0, 4.0, 7.0, 6.0, 6.0, 2.0, 4.0, 3.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00304412841796875, -0.002959132194519043, -0.002874135971069336, -0.002789139747619629, -0.002704143524169922, -0.002619147300720215, -0.002534151077270508, -0.0024491548538208008, -0.0023641586303710938, -0.0022791624069213867, -0.0021941661834716797, -0.0021091699600219727, -0.0020241737365722656, -0.0019391775131225586, -0.0018541812896728516, -0.0017691850662231445, -0.0016841888427734375, -0.0015991926193237305, -0.0015141963958740234, -0.0014292001724243164, -0.0013442039489746094, -0.0012592077255249023, -0.0011742115020751953, -0.0010892152786254883, -0.0010042190551757812, -0.0009192228317260742, -0.0008342266082763672, -0.0007492303848266602, -0.0006642341613769531, -0.0005792379379272461, -0.0004942417144775391, -0.00040924549102783203, -0.000324249267578125, -0.00023925304412841797, -0.00015425682067871094, -6.92605972290039e-05, 1.5735626220703125e-05, 0.00010073184967041016, 0.0001857280731201172, 0.0002707242965698242, 0.00035572052001953125, 0.0004407167434692383, 0.0005257129669189453, 0.0006107091903686523, 0.0006957054138183594, 0.0007807016372680664, 0.0008656978607177734, 0.0009506940841674805, 0.0010356903076171875, 0.0011206865310668945, 0.0012056827545166016, 0.0012906789779663086, 0.0013756752014160156, 0.0014606714248657227, 0.0015456676483154297, 0.0016306638717651367, 0.0017156600952148438, 0.0018006563186645508, 0.0018856525421142578, 0.001970648765563965, 0.002055644989013672, 0.002140641212463379, 0.002225637435913086, 0.002310633659362793, 0.0023956298828125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 1.0, 6.0, 4.0, 4.0, 12.0, 11.0, 14.0, 16.0, 24.0, 31.0, 59.0, 52.0, 111.0, 211.0, 439.0, 2969.0, 1043016.0, 839.0, 296.0, 138.0, 97.0, 52.0, 28.0, 26.0, 23.0, 19.0, 16.0, 6.0, 7.0, 4.0, 3.0, 3.0, 4.0, 7.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07177734375, -0.06940841674804688, -0.06703948974609375, -0.06467056274414062, -0.0623016357421875, -0.059932708740234375, -0.05756378173828125, -0.055194854736328125, -0.052825927734375, -0.050457000732421875, -0.04808807373046875, -0.045719146728515625, -0.0433502197265625, -0.040981292724609375, -0.03861236572265625, -0.036243438720703125, -0.03387451171875, -0.031505584716796875, -0.02913665771484375, -0.026767730712890625, -0.0243988037109375, -0.022029876708984375, -0.01966094970703125, -0.017292022705078125, -0.014923095703125, -0.012554168701171875, -0.01018524169921875, -0.007816314697265625, -0.0054473876953125, -0.003078460693359375, -0.00070953369140625, 0.001659393310546875, 0.0040283203125, 0.006397247314453125, 0.00876617431640625, 0.011135101318359375, 0.0135040283203125, 0.015872955322265625, 0.01824188232421875, 0.020610809326171875, 0.022979736328125, 0.025348663330078125, 0.02771759033203125, 0.030086517333984375, 0.0324554443359375, 0.034824371337890625, 0.03719329833984375, 0.039562225341796875, 0.04193115234375, 0.044300079345703125, 0.04666900634765625, 0.049037933349609375, 0.0514068603515625, 0.053775787353515625, 0.05614471435546875, 0.058513641357421875, 0.060882568359375, 0.06325149536132812, 0.06562042236328125, 0.06798934936523438, 0.0703582763671875, 0.07272720336914062, 0.07509613037109375, 0.07746505737304688, 0.079833984375]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 213.0, 720.0, 78.0, 2.0, 3.0], "bins": [-0.012231012806296349, -0.012028365395963192, -0.011825717985630035, -0.011623071506619453, -0.011420424096286297, -0.01121777668595314, -0.011015129275619984, -0.010812481865286827, -0.01060983445495367, -0.010407187044620514, -0.010204539634287357, -0.0100018922239542, -0.009799245744943619, -0.009596598334610462, -0.009393950924277306, -0.009191303513944149, -0.008988657034933567, -0.00878600962460041, -0.008583362214267254, -0.008380714803934097, -0.008178068324923515, -0.007975420914590359, -0.007772773504257202, -0.0075701260939240456, -0.007367478683590889, -0.007164831273257732, -0.006962184328585863, -0.0067595369182527065, -0.00655688950791955, -0.006354242563247681, -0.006151595152914524, -0.0059489477425813675, -0.005746300332248211, -0.005543652921915054, -0.005341005977243185, -0.0051383585669100285, -0.004935711156576872, -0.004733064211905003, -0.004530416801571846, -0.004327769391238689, -0.00412512244656682, -0.0039224750362336636, -0.0037198278587311506, -0.0035171806812286377, -0.0033145335037261248, -0.003111886326223612, -0.0029092389158904552, -0.0027065917383879423, -0.0025039445608854294, -0.0023012973833829165, -0.00209864997304976, -0.001896002795547247, -0.001693355618044734, -0.0014907083241268992, -0.0012880610302090645, -0.0010854138527065516, -0.0008827665587887168, -0.000680119323078543, -0.00047747205826453865, -0.00027482479345053434, -7.21775577403605e-05, 0.00013046967796981335, 0.0003331169718876481, 0.000535764149390161, 0.0007384114433079958]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 6.0, 8.0, 5.0, 8.0, 4.0, 7.0, 9.0, 13.0, 13.0, 12.0, 18.0, 20.0, 30.0, 20.0, 31.0, 28.0, 38.0, 34.0, 35.0, 32.0, 35.0, 38.0, 34.0, 37.0, 51.0, 42.0, 36.0, 38.0, 35.0, 36.0, 35.0, 19.0, 37.0, 19.0, 23.0, 20.0, 16.0, 12.0, 14.0, 12.0, 12.0, 6.0, 8.0, 5.0, 5.0, 1.0, 4.0, 2.0, 4.0, 4.0, 0.0, 2.0, 2.0], "bins": [-0.0012970566749572754, -0.0012590046972036362, -0.001220952719449997, -0.0011829007416963577, -0.0011448487639427185, -0.0011067967861890793, -0.00106874480843544, -0.0010306928306818008, -0.0009926408529281616, -0.0009545888751745224, -0.0009165368974208832, -0.000878484919667244, -0.0008404329419136047, -0.0008023809641599655, -0.0007643289864063263, -0.0007262770086526871, -0.0006882250308990479, -0.0006501730531454086, -0.0006121210753917694, -0.0005740690976381302, -0.000536017119884491, -0.0004979651421308517, -0.0004599131643772125, -0.0004218611866235733, -0.0003838092088699341, -0.00034575723111629486, -0.00030770525336265564, -0.0002696532756090164, -0.0002316012978553772, -0.00019354932010173798, -0.00015549734234809875, -0.00011744536459445953, -7.939338684082031e-05, -4.134140908718109e-05, -3.28943133354187e-06, 3.476254642009735e-05, 7.281452417373657e-05, 0.0001108665019273758, 0.00014891847968101501, 0.00018697045743465424, 0.00022502243518829346, 0.0002630744129419327, 0.0003011263906955719, 0.0003391783684492111, 0.00037723034620285034, 0.00041528232395648956, 0.0004533343017101288, 0.000491386279463768, 0.0005294382572174072, 0.0005674902349710464, 0.0006055422127246857, 0.0006435941904783249, 0.0006816461682319641, 0.0007196981459856033, 0.0007577501237392426, 0.0007958021014928818, 0.000833854079246521, 0.0008719060570001602, 0.0009099580347537994, 0.0009480100125074387, 0.0009860619902610779, 0.001024113968014717, 0.0010621659457683563, 0.0011002179235219955, 0.0011382699012756348]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 6.0, 4.0, 6.0, 7.0, 9.0, 15.0, 6.0, 12.0, 15.0, 14.0, 21.0, 26.0, 29.0, 29.0, 33.0, 27.0, 30.0, 37.0, 36.0, 49.0, 48.0, 45.0, 42.0, 47.0, 39.0, 43.0, 38.0, 38.0, 32.0, 36.0, 40.0, 25.0, 33.0, 24.0, 13.0, 12.0, 13.0, 8.0, 10.0, 6.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3359375, -5.17401123046875, -5.0120849609375, -4.85015869140625, -4.688232421875, -4.52630615234375, -4.3643798828125, -4.20245361328125, -4.04052734375, -3.87860107421875, -3.7166748046875, -3.55474853515625, -3.392822265625, -3.23089599609375, -3.0689697265625, -2.90704345703125, -2.7451171875, -2.58319091796875, -2.4212646484375, -2.25933837890625, -2.097412109375, -1.93548583984375, -1.7735595703125, -1.61163330078125, -1.44970703125, -1.28778076171875, -1.1258544921875, -0.96392822265625, -0.802001953125, -0.64007568359375, -0.4781494140625, -0.31622314453125, -0.154296875, 0.00762939453125, 0.1695556640625, 0.33148193359375, 0.493408203125, 0.65533447265625, 0.8172607421875, 0.97918701171875, 1.14111328125, 1.30303955078125, 1.4649658203125, 1.62689208984375, 1.788818359375, 1.95074462890625, 2.1126708984375, 2.27459716796875, 2.4365234375, 2.59844970703125, 2.7603759765625, 2.92230224609375, 3.084228515625, 3.24615478515625, 3.4080810546875, 3.57000732421875, 3.73193359375, 3.89385986328125, 4.0557861328125, 4.21771240234375, 4.379638671875, 4.54156494140625, 4.7034912109375, 4.86541748046875, 5.02734375]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 0.0, 11.0, 11.0, 13.0, 20.0, 38.0, 48.0, 57.0, 93.0, 128.0, 169.0, 263.0, 405.0, 685.0, 1075.0, 1848.0, 3260.0, 6079.0, 11827.0, 25069.0, 62176.0, 184637.0, 459244.0, 180201.0, 60756.0, 24390.0, 11915.0, 5992.0, 3221.0, 1780.0, 1145.0, 695.0, 455.0, 273.0, 198.0, 104.0, 90.0, 43.0, 36.0, 35.0, 11.0, 14.0, 13.0, 12.0, 8.0, 7.0, 4.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.49609375, -3.38848876953125, -3.2808837890625, -3.17327880859375, -3.065673828125, -2.95806884765625, -2.8504638671875, -2.74285888671875, -2.63525390625, -2.52764892578125, -2.4200439453125, -2.31243896484375, -2.204833984375, -2.09722900390625, -1.9896240234375, -1.88201904296875, -1.7744140625, -1.66680908203125, -1.5592041015625, -1.45159912109375, -1.343994140625, -1.23638916015625, -1.1287841796875, -1.02117919921875, -0.91357421875, -0.80596923828125, -0.6983642578125, -0.59075927734375, -0.483154296875, -0.37554931640625, -0.2679443359375, -0.16033935546875, -0.052734375, 0.05487060546875, 0.1624755859375, 0.27008056640625, 0.377685546875, 0.48529052734375, 0.5928955078125, 0.70050048828125, 0.80810546875, 0.91571044921875, 1.0233154296875, 1.13092041015625, 1.238525390625, 1.34613037109375, 1.4537353515625, 1.56134033203125, 1.6689453125, 1.77655029296875, 1.8841552734375, 1.99176025390625, 2.099365234375, 2.20697021484375, 2.3145751953125, 2.42218017578125, 2.52978515625, 2.63739013671875, 2.7449951171875, 2.85260009765625, 2.960205078125, 3.06781005859375, 3.1754150390625, 3.28302001953125, 3.390625]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 5.0, 4.0, 4.0, 4.0, 5.0, 6.0, 10.0, 11.0, 14.0, 17.0, 14.0, 25.0, 19.0, 24.0, 23.0, 27.0, 32.0, 45.0, 47.0, 29.0, 42.0, 52.0, 68.0, 202.0, 1773.0, 110.0, 56.0, 47.0, 42.0, 19.0, 37.0, 27.0, 31.0, 31.0, 19.0, 19.0, 21.0, 14.0, 14.0, 13.0, 9.0, 6.0, 6.0, 9.0, 5.0, 4.0, 5.0, 1.0, 2.0, 1.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.265625, -13.7783203125, -13.291015625, -12.8037109375, -12.31640625, -11.8291015625, -11.341796875, -10.8544921875, -10.3671875, -9.8798828125, -9.392578125, -8.9052734375, -8.41796875, -7.9306640625, -7.443359375, -6.9560546875, -6.46875, -5.9814453125, -5.494140625, -5.0068359375, -4.51953125, -4.0322265625, -3.544921875, -3.0576171875, -2.5703125, -2.0830078125, -1.595703125, -1.1083984375, -0.62109375, -0.1337890625, 0.353515625, 0.8408203125, 1.328125, 1.8154296875, 2.302734375, 2.7900390625, 3.27734375, 3.7646484375, 4.251953125, 4.7392578125, 5.2265625, 5.7138671875, 6.201171875, 6.6884765625, 7.17578125, 7.6630859375, 8.150390625, 8.6376953125, 9.125, 9.6123046875, 10.099609375, 10.5869140625, 11.07421875, 11.5615234375, 12.048828125, 12.5361328125, 13.0234375, 13.5107421875, 13.998046875, 14.4853515625, 14.97265625, 15.4599609375, 15.947265625, 16.4345703125, 16.921875]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 4.0, 4.0, 3.0, 6.0, 6.0, 9.0, 5.0, 14.0, 12.0, 15.0, 14.0, 27.0, 25.0, 26.0, 45.0, 45.0, 75.0, 93.0, 132.0, 283.0, 533.0, 1765.0, 31308.0, 3055110.0, 52266.0, 2322.0, 588.0, 307.0, 172.0, 129.0, 58.0, 51.0, 43.0, 36.0, 26.0, 25.0, 25.0, 14.0, 17.0, 16.0, 12.0, 13.0, 5.0, 3.0, 8.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-28.734375, -27.90283203125, -27.0712890625, -26.23974609375, -25.408203125, -24.57666015625, -23.7451171875, -22.91357421875, -22.08203125, -21.25048828125, -20.4189453125, -19.58740234375, -18.755859375, -17.92431640625, -17.0927734375, -16.26123046875, -15.4296875, -14.59814453125, -13.7666015625, -12.93505859375, -12.103515625, -11.27197265625, -10.4404296875, -9.60888671875, -8.77734375, -7.94580078125, -7.1142578125, -6.28271484375, -5.451171875, -4.61962890625, -3.7880859375, -2.95654296875, -2.125, -1.29345703125, -0.4619140625, 0.36962890625, 1.201171875, 2.03271484375, 2.8642578125, 3.69580078125, 4.52734375, 5.35888671875, 6.1904296875, 7.02197265625, 7.853515625, 8.68505859375, 9.5166015625, 10.34814453125, 11.1796875, 12.01123046875, 12.8427734375, 13.67431640625, 14.505859375, 15.33740234375, 16.1689453125, 17.00048828125, 17.83203125, 18.66357421875, 19.4951171875, 20.32666015625, 21.158203125, 21.98974609375, 22.8212890625, 23.65283203125, 24.484375]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 14.0, 318.0, 622.0, 60.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-161.39930725097656, -158.36636352539062, -155.3334197998047, -152.30047607421875, -149.26754760742188, -146.23460388183594, -143.20166015625, -140.16871643066406, -137.13577270507812, -134.1028289794922, -131.06988525390625, -128.03695678710938, -125.0040054321289, -121.9710693359375, -118.93812561035156, -115.90518188476562, -112.87224578857422, -109.83930206298828, -106.80636596679688, -103.77342224121094, -100.740478515625, -97.70753479003906, -94.67459869384766, -91.64165496826172, -88.60871887207031, -85.57577514648438, -82.54283905029297, -79.50989532470703, -76.4769515991211, -73.44401550292969, -70.41107177734375, -67.37812805175781, -64.34517669677734, -61.31223678588867, -58.279293060302734, -55.24635314941406, -52.213409423828125, -49.18046951293945, -46.14752960205078, -43.114585876464844, -40.08164596557617, -37.0487060546875, -34.01576232910156, -30.98282241821289, -27.949880599975586, -24.91693878173828, -21.88399887084961, -18.851057052612305, -15.818115234375, -12.785173416137695, -9.752232551574707, -6.719291687011719, -3.686349868774414, -0.6534080505371094, 2.3795318603515625, 5.412473678588867, 8.445415496826172, 11.478357315063477, 14.511298179626465, 17.544239044189453, 20.577180862426758, 23.610122680664062, 26.643062591552734, 29.67600440979004, 32.708946228027344]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 6.0, 6.0, 6.0, 6.0, 12.0, 16.0, 15.0, 13.0, 25.0, 19.0, 31.0, 27.0, 26.0, 37.0, 46.0, 33.0, 40.0, 45.0, 59.0, 45.0, 46.0, 40.0, 32.0, 32.0, 42.0, 40.0, 36.0, 40.0, 20.0, 15.0, 36.0, 19.0, 12.0, 20.0, 15.0, 7.0, 10.0, 7.0, 4.0, 1.0, 6.0, 5.0, 1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-54.60726547241211, -52.830650329589844, -51.054039001464844, -49.27742385864258, -47.50080871582031, -45.72419357299805, -43.94757843017578, -42.17096710205078, -40.394351959228516, -38.61773681640625, -36.84112548828125, -35.064510345458984, -33.28789520263672, -31.511280059814453, -29.73466682434082, -27.958053588867188, -26.181438446044922, -24.404823303222656, -22.628210067749023, -20.85159683227539, -19.074981689453125, -17.29836654663086, -15.521753311157227, -13.745139122009277, -11.968524932861328, -10.191910743713379, -8.41529655456543, -6.6386823654174805, -4.862068176269531, -3.085453987121582, -1.3088397979736328, 0.4677743911743164, 2.2443923950195312, 4.0210065841674805, 5.79762077331543, 7.574234962463379, 9.350849151611328, 11.127463340759277, 12.904077529907227, 14.680691719055176, 16.457305908203125, 18.23392105102539, 20.010534286499023, 21.787147521972656, 23.563762664794922, 25.340377807617188, 27.11699104309082, 28.893604278564453, 30.67021942138672, 32.446834564208984, 34.22344970703125, 36.00006103515625, 37.776676177978516, 39.55329132080078, 41.32990264892578, 43.10651779174805, 44.88313293457031, 46.65974807739258, 48.436363220214844, 50.212974548339844, 51.98958969116211, 53.766204833984375, 55.542816162109375, 57.31943130493164, 59.096046447753906]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 6.0, 5.0, 13.0, 9.0, 14.0, 9.0, 12.0, 19.0, 23.0, 28.0, 26.0, 31.0, 24.0, 25.0, 38.0, 33.0, 41.0, 52.0, 45.0, 48.0, 37.0, 45.0, 45.0, 38.0, 38.0, 41.0, 28.0, 33.0, 35.0, 46.0, 21.0, 18.0, 22.0, 9.0, 14.0, 10.0, 8.0, 4.0, 5.0, 4.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.47265625, -5.30621337890625, -5.1397705078125, -4.97332763671875, -4.806884765625, -4.64044189453125, -4.4739990234375, -4.30755615234375, -4.14111328125, -3.97467041015625, -3.8082275390625, -3.64178466796875, -3.475341796875, -3.30889892578125, -3.1424560546875, -2.97601318359375, -2.8095703125, -2.64312744140625, -2.4766845703125, -2.31024169921875, -2.143798828125, -1.97735595703125, -1.8109130859375, -1.64447021484375, -1.47802734375, -1.31158447265625, -1.1451416015625, -0.97869873046875, -0.812255859375, -0.64581298828125, -0.4793701171875, -0.31292724609375, -0.146484375, 0.01995849609375, 0.1864013671875, 0.35284423828125, 0.519287109375, 0.68572998046875, 0.8521728515625, 1.01861572265625, 1.18505859375, 1.35150146484375, 1.5179443359375, 1.68438720703125, 1.850830078125, 2.01727294921875, 2.1837158203125, 2.35015869140625, 2.5166015625, 2.68304443359375, 2.8494873046875, 3.01593017578125, 3.182373046875, 3.34881591796875, 3.5152587890625, 3.68170166015625, 3.84814453125, 4.01458740234375, 4.1810302734375, 4.34747314453125, 4.513916015625, 4.68035888671875, 4.8468017578125, 5.01324462890625, 5.1796875]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 7.0, 8.0, 11.0, 7.0, 10.0, 15.0, 12.0, 12.0, 22.0, 17.0, 28.0, 27.0, 25.0, 32.0, 23.0, 33.0, 65.0, 151.0, 582.0, 9086.0, 1439022.0, 2726421.0, 17285.0, 826.0, 167.0, 72.0, 47.0, 32.0, 33.0, 29.0, 31.0, 31.0, 22.0, 21.0, 21.0, 9.0, 3.0, 10.0, 7.0, 9.0, 8.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-34.65625, -33.66845703125, -32.6806640625, -31.69287109375, -30.705078125, -29.71728515625, -28.7294921875, -27.74169921875, -26.75390625, -25.76611328125, -24.7783203125, -23.79052734375, -22.802734375, -21.81494140625, -20.8271484375, -19.83935546875, -18.8515625, -17.86376953125, -16.8759765625, -15.88818359375, -14.900390625, -13.91259765625, -12.9248046875, -11.93701171875, -10.94921875, -9.96142578125, -8.9736328125, -7.98583984375, -6.998046875, -6.01025390625, -5.0224609375, -4.03466796875, -3.046875, -2.05908203125, -1.0712890625, -0.08349609375, 0.904296875, 1.89208984375, 2.8798828125, 3.86767578125, 4.85546875, 5.84326171875, 6.8310546875, 7.81884765625, 8.806640625, 9.79443359375, 10.7822265625, 11.77001953125, 12.7578125, 13.74560546875, 14.7333984375, 15.72119140625, 16.708984375, 17.69677734375, 18.6845703125, 19.67236328125, 20.66015625, 21.64794921875, 22.6357421875, 23.62353515625, 24.611328125, 25.59912109375, 26.5869140625, 27.57470703125, 28.5625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 5.0, 5.0, 8.0, 18.0, 25.0, 26.0, 39.0, 55.0, 78.0, 108.0, 158.0, 192.0, 263.0, 372.0, 475.0, 519.0, 440.0, 342.0, 289.0, 182.0, 133.0, 109.0, 52.0, 55.0, 37.0, 28.0, 11.0, 14.0, 9.0, 10.0, 3.0, 2.0, 6.0, 1.0, 1.0, 3.0, 1.0], "bins": [-21.71875, -21.20751953125, -20.6962890625, -20.18505859375, -19.673828125, -19.16259765625, -18.6513671875, -18.14013671875, -17.62890625, -17.11767578125, -16.6064453125, -16.09521484375, -15.583984375, -15.07275390625, -14.5615234375, -14.05029296875, -13.5390625, -13.02783203125, -12.5166015625, -12.00537109375, -11.494140625, -10.98291015625, -10.4716796875, -9.96044921875, -9.44921875, -8.93798828125, -8.4267578125, -7.91552734375, -7.404296875, -6.89306640625, -6.3818359375, -5.87060546875, -5.359375, -4.84814453125, -4.3369140625, -3.82568359375, -3.314453125, -2.80322265625, -2.2919921875, -1.78076171875, -1.26953125, -0.75830078125, -0.2470703125, 0.26416015625, 0.775390625, 1.28662109375, 1.7978515625, 2.30908203125, 2.8203125, 3.33154296875, 3.8427734375, 4.35400390625, 4.865234375, 5.37646484375, 5.8876953125, 6.39892578125, 6.91015625, 7.42138671875, 7.9326171875, 8.44384765625, 8.955078125, 9.46630859375, 9.9775390625, 10.48876953125, 11.0]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 8.0, 4.0, 14.0, 13.0, 20.0, 21.0, 35.0, 47.0, 76.0, 105.0, 168.0, 267.0, 534.0, 2353.0, 800685.0, 3384235.0, 4104.0, 655.0, 331.0, 194.0, 119.0, 86.0, 68.0, 44.0, 35.0, 24.0, 12.0, 8.0, 6.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.875, -44.419921875, -41.96484375, -39.509765625, -37.0546875, -34.599609375, -32.14453125, -29.689453125, -27.234375, -24.779296875, -22.32421875, -19.869140625, -17.4140625, -14.958984375, -12.50390625, -10.048828125, -7.59375, -5.138671875, -2.68359375, -0.228515625, 2.2265625, 4.681640625, 7.13671875, 9.591796875, 12.046875, 14.501953125, 16.95703125, 19.412109375, 21.8671875, 24.322265625, 26.77734375, 29.232421875, 31.6875, 34.142578125, 36.59765625, 39.052734375, 41.5078125, 43.962890625, 46.41796875, 48.873046875, 51.328125, 53.783203125, 56.23828125, 58.693359375, 61.1484375, 63.603515625, 66.05859375, 68.513671875, 70.96875, 73.423828125, 75.87890625, 78.333984375, 80.7890625, 83.244140625, 85.69921875, 88.154296875, 90.609375, 93.064453125, 95.51953125, 97.974609375, 100.4296875, 102.884765625, 105.33984375, 107.794921875, 110.25]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 7.0, 59.0, 445.0, 431.0, 69.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-128.150146484375, -120.15019989013672, -112.15025329589844, -104.15031433105469, -96.1503677368164, -88.15042114257812, -80.15048217773438, -72.1505355834961, -64.15058898925781, -56.15064239501953, -48.150699615478516, -40.1507568359375, -32.15081024169922, -24.150863647460938, -16.150920867919922, -8.150978088378906, -0.151031494140625, 7.848913192749023, 15.848857879638672, 23.84880256652832, 31.84874725341797, 39.84869384765625, 47.848636627197266, 55.84857940673828, 63.84852600097656, 71.84847259521484, 79.84841918945312, 87.84835815429688, 95.84830474853516, 103.84825134277344, 111.84819030761719, 119.84813690185547, 127.84808349609375, 135.8480224609375, 143.8479766845703, 151.84791564941406, 159.84786987304688, 167.84780883789062, 175.84774780273438, 183.84768676757812, 191.84764099121094, 199.8475799560547, 207.8475341796875, 215.84747314453125, 223.847412109375, 231.8473663330078, 239.84730529785156, 247.84725952148438, 255.84719848632812, 263.8471374511719, 271.8470764160156, 279.8470458984375, 287.84698486328125, 295.846923828125, 303.84686279296875, 311.8468017578125, 319.84674072265625, 327.8466796875, 335.84661865234375, 343.8465881347656, 351.8465270996094, 359.8464660644531, 367.8464050292969, 375.8463439941406, 383.8463134765625]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 8.0, 9.0, 11.0, 10.0, 11.0, 13.0, 14.0, 15.0, 15.0, 27.0, 27.0, 24.0, 31.0, 34.0, 24.0, 34.0, 34.0, 35.0, 40.0, 47.0, 42.0, 40.0, 32.0, 38.0, 35.0, 42.0, 29.0, 29.0, 29.0, 22.0, 25.0, 30.0, 13.0, 24.0, 17.0, 15.0, 18.0, 15.0, 9.0, 10.0, 4.0, 5.0, 5.0, 5.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-49.097076416015625, -47.36965560913086, -45.642234802246094, -43.91481018066406, -42.1873893737793, -40.45996856689453, -38.7325439453125, -37.005123138427734, -35.27770233154297, -33.5502815246582, -31.822858810424805, -30.095436096191406, -28.36801528930664, -26.640594482421875, -24.913171768188477, -23.185749053955078, -21.458328247070312, -19.730907440185547, -18.00348472595215, -16.27606201171875, -14.548641204833984, -12.821219444274902, -11.09379768371582, -9.366375923156738, -7.638954162597656, -5.911532402038574, -4.184110641479492, -2.45668888092041, -0.7292671203613281, 0.9981546401977539, 2.725576400756836, 4.452998161315918, 6.180419921875, 7.907841682434082, 9.635263442993164, 11.362685203552246, 13.090106964111328, 14.81752872467041, 16.544950485229492, 18.27237319946289, 19.999794006347656, 21.727214813232422, 23.45463752746582, 25.18206024169922, 26.909481048583984, 28.63690185546875, 30.36432456970215, 32.09174728393555, 33.81916809082031, 35.54658889770508, 37.274009704589844, 39.001434326171875, 40.72885513305664, 42.456275939941406, 44.18370056152344, 45.9111213684082, 47.63854217529297, 49.365962982177734, 51.0933837890625, 52.82080841064453, 54.5482292175293, 56.27565002441406, 58.003074645996094, 59.73049545288086, 61.457916259765625]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 3.0, 7.0, 7.0, 6.0, 12.0, 8.0, 14.0, 14.0, 15.0, 28.0, 15.0, 25.0, 29.0, 29.0, 24.0, 31.0, 29.0, 32.0, 50.0, 40.0, 38.0, 31.0, 42.0, 41.0, 46.0, 40.0, 35.0, 31.0, 28.0, 33.0, 26.0, 34.0, 16.0, 22.0, 19.0, 31.0, 18.0, 8.0, 9.0, 9.0, 12.0, 3.0, 4.0, 4.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.9375, -4.78363037109375, -4.6297607421875, -4.47589111328125, -4.322021484375, -4.16815185546875, -4.0142822265625, -3.86041259765625, -3.70654296875, -3.55267333984375, -3.3988037109375, -3.24493408203125, -3.091064453125, -2.93719482421875, -2.7833251953125, -2.62945556640625, -2.4755859375, -2.32171630859375, -2.1678466796875, -2.01397705078125, -1.860107421875, -1.70623779296875, -1.5523681640625, -1.39849853515625, -1.24462890625, -1.09075927734375, -0.9368896484375, -0.78302001953125, -0.629150390625, -0.47528076171875, -0.3214111328125, -0.16754150390625, -0.013671875, 0.14019775390625, 0.2940673828125, 0.44793701171875, 0.601806640625, 0.75567626953125, 0.9095458984375, 1.06341552734375, 1.21728515625, 1.37115478515625, 1.5250244140625, 1.67889404296875, 1.832763671875, 1.98663330078125, 2.1405029296875, 2.29437255859375, 2.4482421875, 2.60211181640625, 2.7559814453125, 2.90985107421875, 3.063720703125, 3.21759033203125, 3.3714599609375, 3.52532958984375, 3.67919921875, 3.83306884765625, 3.9869384765625, 4.14080810546875, 4.294677734375, 4.44854736328125, 4.6024169921875, 4.75628662109375, 4.91015625]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 9.0, 6.0, 14.0, 20.0, 16.0, 37.0, 41.0, 73.0, 112.0, 157.0, 255.0, 381.0, 532.0, 906.0, 1394.0, 2212.0, 3382.0, 5332.0, 8492.0, 13373.0, 21153.0, 33558.0, 54255.0, 89727.0, 150189.0, 221562.0, 172094.0, 103791.0, 62089.0, 38231.0, 23831.0, 15127.0, 9558.0, 5932.0, 3713.0, 2428.0, 1588.0, 1060.0, 629.0, 452.0, 288.0, 182.0, 134.0, 77.0, 53.0, 49.0, 22.0, 15.0, 10.0, 11.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.572265625, -0.5541763305664062, -0.5360870361328125, -0.5179977416992188, -0.499908447265625, -0.48181915283203125, -0.4637298583984375, -0.44564056396484375, -0.42755126953125, -0.40946197509765625, -0.3913726806640625, -0.37328338623046875, -0.355194091796875, -0.33710479736328125, -0.3190155029296875, -0.30092620849609375, -0.2828369140625, -0.26474761962890625, -0.2466583251953125, -0.22856903076171875, -0.210479736328125, -0.19239044189453125, -0.1743011474609375, -0.15621185302734375, -0.13812255859375, -0.12003326416015625, -0.1019439697265625, -0.08385467529296875, -0.065765380859375, -0.04767608642578125, -0.0295867919921875, -0.01149749755859375, 0.006591796875, 0.02468109130859375, 0.0427703857421875, 0.06085968017578125, 0.078948974609375, 0.09703826904296875, 0.1151275634765625, 0.13321685791015625, 0.15130615234375, 0.16939544677734375, 0.1874847412109375, 0.20557403564453125, 0.223663330078125, 0.24175262451171875, 0.2598419189453125, 0.27793121337890625, 0.2960205078125, 0.31410980224609375, 0.3321990966796875, 0.35028839111328125, 0.368377685546875, 0.38646697998046875, 0.4045562744140625, 0.42264556884765625, 0.44073486328125, 0.45882415771484375, 0.4769134521484375, 0.49500274658203125, 0.513092041015625, 0.5311813354492188, 0.5492706298828125, 0.5673599243164062, 0.58544921875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 6.0, 4.0, 9.0, 4.0, 12.0, 16.0, 12.0, 25.0, 21.0, 22.0, 34.0, 33.0, 29.0, 24.0, 48.0, 42.0, 42.0, 39.0, 40.0, 1065.0, 39.0, 37.0, 39.0, 36.0, 55.0, 34.0, 28.0, 29.0, 33.0, 14.0, 20.0, 19.0, 27.0, 8.0, 15.0, 9.0, 12.0, 9.0, 9.0, 6.0, 9.0, 1.0, 3.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.138671875, -3.036712646484375, -2.93475341796875, -2.832794189453125, -2.7308349609375, -2.628875732421875, -2.52691650390625, -2.424957275390625, -2.322998046875, -2.221038818359375, -2.11907958984375, -2.017120361328125, -1.9151611328125, -1.813201904296875, -1.71124267578125, -1.609283447265625, -1.50732421875, -1.405364990234375, -1.30340576171875, -1.201446533203125, -1.0994873046875, -0.997528076171875, -0.89556884765625, -0.793609619140625, -0.691650390625, -0.589691162109375, -0.48773193359375, -0.385772705078125, -0.2838134765625, -0.181854248046875, -0.07989501953125, 0.022064208984375, 0.1240234375, 0.225982666015625, 0.32794189453125, 0.429901123046875, 0.5318603515625, 0.633819580078125, 0.73577880859375, 0.837738037109375, 0.939697265625, 1.041656494140625, 1.14361572265625, 1.245574951171875, 1.3475341796875, 1.449493408203125, 1.55145263671875, 1.653411865234375, 1.75537109375, 1.857330322265625, 1.95928955078125, 2.061248779296875, 2.1632080078125, 2.265167236328125, 2.36712646484375, 2.469085693359375, 2.571044921875, 2.673004150390625, 2.77496337890625, 2.876922607421875, 2.9788818359375, 3.080841064453125, 3.18280029296875, 3.284759521484375, 3.38671875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 5.0, 2.0, 5.0, 6.0, 21.0, 19.0, 32.0, 46.0, 51.0, 80.0, 108.0, 155.0, 243.0, 369.0, 515.0, 725.0, 1102.0, 1520.0, 2261.0, 3317.0, 5081.0, 7575.0, 11510.0, 17988.0, 28061.0, 43777.0, 68922.0, 111522.0, 181347.0, 1248374.0, 133552.0, 82231.0, 51798.0, 33159.0, 21159.0, 13503.0, 8899.0, 5814.0, 3892.0, 2689.0, 1724.0, 1287.0, 834.0, 566.0, 353.0, 286.0, 196.0, 150.0, 109.0, 65.0, 39.0, 32.0, 14.0, 22.0, 16.0, 6.0, 6.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.47705078125, -0.46175384521484375, -0.4464569091796875, -0.43115997314453125, -0.415863037109375, -0.40056610107421875, -0.3852691650390625, -0.36997222900390625, -0.35467529296875, -0.33937835693359375, -0.3240814208984375, -0.30878448486328125, -0.293487548828125, -0.27819061279296875, -0.2628936767578125, -0.24759674072265625, -0.2322998046875, -0.21700286865234375, -0.2017059326171875, -0.18640899658203125, -0.171112060546875, -0.15581512451171875, -0.1405181884765625, -0.12522125244140625, -0.10992431640625, -0.09462738037109375, -0.0793304443359375, -0.06403350830078125, -0.048736572265625, -0.03343963623046875, -0.0181427001953125, -0.00284576416015625, 0.012451171875, 0.02774810791015625, 0.0430450439453125, 0.05834197998046875, 0.073638916015625, 0.08893585205078125, 0.1042327880859375, 0.11952972412109375, 0.13482666015625, 0.15012359619140625, 0.1654205322265625, 0.18071746826171875, 0.196014404296875, 0.21131134033203125, 0.2266082763671875, 0.24190521240234375, 0.2572021484375, 0.27249908447265625, 0.2877960205078125, 0.30309295654296875, 0.318389892578125, 0.33368682861328125, 0.3489837646484375, 0.36428070068359375, 0.37957763671875, 0.39487457275390625, 0.4101715087890625, 0.42546844482421875, 0.440765380859375, 0.45606231689453125, 0.4713592529296875, 0.48665618896484375, 0.501953125]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 7.0, 9.0, 10.0, 12.0, 10.0, 9.0, 12.0, 17.0, 23.0, 35.0, 38.0, 42.0, 61.0, 73.0, 70.0, 60.0, 82.0, 80.0, 69.0, 48.0, 46.0, 41.0, 31.0, 29.0, 21.0, 13.0, 16.0, 5.0, 4.0, 3.0, 5.0, 7.0, 1.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00250244140625, -0.0024181008338928223, -0.0023337602615356445, -0.002249419689178467, -0.002165079116821289, -0.0020807385444641113, -0.0019963979721069336, -0.0019120573997497559, -0.0018277168273925781, -0.0017433762550354004, -0.0016590356826782227, -0.001574695110321045, -0.0014903545379638672, -0.0014060139656066895, -0.0013216733932495117, -0.001237332820892334, -0.0011529922485351562, -0.0010686516761779785, -0.0009843111038208008, -0.000899970531463623, -0.0008156299591064453, -0.0007312893867492676, -0.0006469488143920898, -0.0005626082420349121, -0.0004782676696777344, -0.00039392709732055664, -0.0003095865249633789, -0.00022524595260620117, -0.00014090538024902344, -5.65648078918457e-05, 2.777576446533203e-05, 0.00011211633682250977, 0.0001964569091796875, 0.00028079748153686523, 0.00036513805389404297, 0.0004494786262512207, 0.0005338191986083984, 0.0006181597709655762, 0.0007025003433227539, 0.0007868409156799316, 0.0008711814880371094, 0.0009555220603942871, 0.0010398626327514648, 0.0011242032051086426, 0.0012085437774658203, 0.001292884349822998, 0.0013772249221801758, 0.0014615654945373535, 0.0015459060668945312, 0.001630246639251709, 0.0017145872116088867, 0.0017989277839660645, 0.0018832683563232422, 0.00196760892868042, 0.0020519495010375977, 0.0021362900733947754, 0.002220630645751953, 0.002304971218109131, 0.0023893117904663086, 0.0024736523628234863, 0.002557992935180664, 0.002642333507537842, 0.0027266740798950195, 0.0028110146522521973, 0.002895355224609375]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 5.0, 4.0, 5.0, 5.0, 8.0, 16.0, 10.0, 17.0, 38.0, 32.0, 56.0, 61.0, 148.0, 281.0, 650.0, 814811.0, 231058.0, 674.0, 265.0, 145.0, 73.0, 45.0, 29.0, 21.0, 12.0, 14.0, 14.0, 15.0, 13.0, 3.0, 8.0, 5.0, 3.0, 7.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.08575439453125, -0.0834341049194336, -0.08111381530761719, -0.07879352569580078, -0.07647323608398438, -0.07415294647216797, -0.07183265686035156, -0.06951236724853516, -0.06719207763671875, -0.06487178802490234, -0.06255149841308594, -0.06023120880126953, -0.057910919189453125, -0.05559062957763672, -0.05327033996582031, -0.050950050354003906, -0.0486297607421875, -0.046309471130371094, -0.04398918151855469, -0.04166889190673828, -0.039348602294921875, -0.03702831268310547, -0.03470802307128906, -0.032387733459472656, -0.03006744384765625, -0.027747154235839844, -0.025426864624023438, -0.02310657501220703, -0.020786285400390625, -0.01846599578857422, -0.016145706176757812, -0.013825416564941406, -0.011505126953125, -0.009184837341308594, -0.0068645477294921875, -0.004544258117675781, -0.002223968505859375, 9.632110595703125e-05, 0.0024166107177734375, 0.004736900329589844, 0.00705718994140625, 0.009377479553222656, 0.011697769165039062, 0.014018058776855469, 0.016338348388671875, 0.01865863800048828, 0.020978927612304688, 0.023299217224121094, 0.0256195068359375, 0.027939796447753906, 0.030260086059570312, 0.03258037567138672, 0.034900665283203125, 0.03722095489501953, 0.03954124450683594, 0.041861534118652344, 0.04418182373046875, 0.046502113342285156, 0.04882240295410156, 0.05114269256591797, 0.053462982177734375, 0.05578327178955078, 0.05810356140136719, 0.060423851013183594, 0.062744140625]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [8.0, 327.0, 681.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007851768168620765, -0.00041619138210080564, -4.720594733953476e-05, 0.00032177945831790566, 0.000690764922183007, 0.0010597503278404474, 0.001428735675290227, 0.00179772125557065, 0.0021667066030204296, 0.002535691950470209, 0.0029046775307506323, 0.003273662878200412, 0.003642648458480835, 0.0040116338059306145, 0.004380619153380394, 0.0047496045008301735, 0.00511859031394124, 0.00548757566139102, 0.005856561008840799, 0.006225546821951866, 0.006594532169401646, 0.006963517516851425, 0.007332502864301205, 0.007701488211750984, 0.008070473559200764, 0.008439458906650543, 0.008808444254100323, 0.009177429601550102, 0.009546414948999882, 0.009915400296449661, 0.010284386575222015, 0.010653371922671795, 0.011022356338799, 0.01139134168624878, 0.011760327033698559, 0.012129312381148338, 0.012498297728598118, 0.012867283076047897, 0.013236269354820251, 0.013605254702270031, 0.01397424004971981, 0.01434322539716959, 0.01471221074461937, 0.015081196092069149, 0.015450181439518929, 0.015819167718291283, 0.016188152134418488, 0.01655713841319084, 0.016926122829318047, 0.0172951091080904, 0.017664093524217606, 0.01803307980298996, 0.018402064219117165, 0.01877105049788952, 0.019140034914016724, 0.019509021192789078, 0.019878007471561432, 0.020246993750333786, 0.02061597816646099, 0.020984964445233345, 0.02135394886136055, 0.021722935140132904, 0.02209191955626011, 0.022460905835032463, 0.022829890251159668]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 4.0, 4.0, 4.0, 6.0, 2.0, 9.0, 7.0, 13.0, 12.0, 10.0, 21.0, 21.0, 17.0, 28.0, 39.0, 17.0, 32.0, 33.0, 52.0, 33.0, 32.0, 38.0, 37.0, 32.0, 33.0, 37.0, 44.0, 35.0, 31.0, 52.0, 26.0, 30.0, 32.0, 25.0, 24.0, 22.0, 15.0, 21.0, 14.0, 16.0, 6.0, 4.0, 13.0, 9.0, 2.0, 1.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.001103043556213379, -0.0010671885684132576, -0.0010313335806131363, -0.000995478592813015, -0.0009596236050128937, -0.0009237686172127724, -0.0008879136294126511, -0.0008520586416125298, -0.0008162036538124084, -0.0007803486660122871, -0.0007444936782121658, -0.0007086386904120445, -0.0006727837026119232, -0.0006369287148118019, -0.0006010737270116806, -0.0005652187392115593, -0.000529363751411438, -0.0004935087636113167, -0.0004576537758111954, -0.00042179878801107407, -0.00038594380021095276, -0.00035008881241083145, -0.00031423382461071014, -0.00027837883681058884, -0.00024252384901046753, -0.00020666886121034622, -0.00017081387341022491, -0.0001349588856101036, -9.91038978099823e-05, -6.324891000986099e-05, -2.7393922209739685e-05, 8.461065590381622e-06, 4.431605339050293e-05, 8.017104119062424e-05, 0.00011602602899074554, 0.00015188101679086685, 0.00018773600459098816, 0.00022359099239110947, 0.0002594459801912308, 0.0002953009679913521, 0.0003311559557914734, 0.0003670109435915947, 0.000402865931391716, 0.0004387209191918373, 0.0004745759069919586, 0.0005104308947920799, 0.0005462858825922012, 0.0005821408703923225, 0.0006179958581924438, 0.0006538508459925652, 0.0006897058337926865, 0.0007255608215928078, 0.0007614158093929291, 0.0007972707971930504, 0.0008331257849931717, 0.000868980772793293, 0.0009048357605934143, 0.0009406907483935356, 0.0009765457361936569, 0.0010124007239937782, 0.0010482557117938995, 0.0010841106995940208, 0.0011199656873941422, 0.0011558206751942635, 0.0011916756629943848]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 3.0, 7.0, 7.0, 6.0, 12.0, 8.0, 14.0, 14.0, 15.0, 28.0, 15.0, 25.0, 29.0, 29.0, 24.0, 31.0, 29.0, 32.0, 50.0, 40.0, 38.0, 32.0, 41.0, 41.0, 46.0, 40.0, 35.0, 31.0, 28.0, 33.0, 26.0, 34.0, 16.0, 22.0, 19.0, 31.0, 18.0, 8.0, 9.0, 9.0, 12.0, 3.0, 4.0, 4.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.9375, -4.78363037109375, -4.6297607421875, -4.47589111328125, -4.322021484375, -4.16815185546875, -4.0142822265625, -3.86041259765625, -3.70654296875, -3.55267333984375, -3.3988037109375, -3.24493408203125, -3.091064453125, -2.93719482421875, -2.7833251953125, -2.62945556640625, -2.4755859375, -2.32171630859375, -2.1678466796875, -2.01397705078125, -1.860107421875, -1.70623779296875, -1.5523681640625, -1.39849853515625, -1.24462890625, -1.09075927734375, -0.9368896484375, -0.78302001953125, -0.629150390625, -0.47528076171875, -0.3214111328125, -0.16754150390625, -0.013671875, 0.14019775390625, 0.2940673828125, 0.44793701171875, 0.601806640625, 0.75567626953125, 0.9095458984375, 1.06341552734375, 1.21728515625, 1.37115478515625, 1.5250244140625, 1.67889404296875, 1.832763671875, 1.98663330078125, 2.1405029296875, 2.29437255859375, 2.4482421875, 2.60211181640625, 2.7559814453125, 2.90985107421875, 3.063720703125, 3.21759033203125, 3.3714599609375, 3.52532958984375, 3.67919921875, 3.83306884765625, 3.9869384765625, 4.14080810546875, 4.294677734375, 4.44854736328125, 4.6024169921875, 4.75628662109375, 4.91015625]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 5.0, 7.0, 5.0, 13.0, 18.0, 33.0, 41.0, 53.0, 95.0, 141.0, 196.0, 270.0, 400.0, 626.0, 1019.0, 1714.0, 3083.0, 6218.0, 14781.0, 43310.0, 154604.0, 484424.0, 237164.0, 62908.0, 20157.0, 8048.0, 3767.0, 2064.0, 1171.0, 760.0, 460.0, 324.0, 215.0, 144.0, 96.0, 80.0, 45.0, 38.0, 22.0, 9.0, 7.0, 9.0, 6.0, 2.0, 4.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.546875, -3.423095703125, -3.29931640625, -3.175537109375, -3.0517578125, -2.927978515625, -2.80419921875, -2.680419921875, -2.556640625, -2.432861328125, -2.30908203125, -2.185302734375, -2.0615234375, -1.937744140625, -1.81396484375, -1.690185546875, -1.56640625, -1.442626953125, -1.31884765625, -1.195068359375, -1.0712890625, -0.947509765625, -0.82373046875, -0.699951171875, -0.576171875, -0.452392578125, -0.32861328125, -0.204833984375, -0.0810546875, 0.042724609375, 0.16650390625, 0.290283203125, 0.4140625, 0.537841796875, 0.66162109375, 0.785400390625, 0.9091796875, 1.032958984375, 1.15673828125, 1.280517578125, 1.404296875, 1.528076171875, 1.65185546875, 1.775634765625, 1.8994140625, 2.023193359375, 2.14697265625, 2.270751953125, 2.39453125, 2.518310546875, 2.64208984375, 2.765869140625, 2.8896484375, 3.013427734375, 3.13720703125, 3.260986328125, 3.384765625, 3.508544921875, 3.63232421875, 3.756103515625, 3.8798828125, 4.003662109375, 4.12744140625, 4.251220703125, 4.375]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 6.0, 6.0, 10.0, 11.0, 13.0, 18.0, 21.0, 15.0, 25.0, 21.0, 31.0, 21.0, 34.0, 36.0, 52.0, 43.0, 35.0, 91.0, 1655.0, 435.0, 81.0, 43.0, 59.0, 33.0, 41.0, 31.0, 32.0, 30.0, 18.0, 32.0, 12.0, 14.0, 13.0, 11.0, 7.0, 2.0, 4.0, 1.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.25, -18.60693359375, -17.9638671875, -17.32080078125, -16.677734375, -16.03466796875, -15.3916015625, -14.74853515625, -14.10546875, -13.46240234375, -12.8193359375, -12.17626953125, -11.533203125, -10.89013671875, -10.2470703125, -9.60400390625, -8.9609375, -8.31787109375, -7.6748046875, -7.03173828125, -6.388671875, -5.74560546875, -5.1025390625, -4.45947265625, -3.81640625, -3.17333984375, -2.5302734375, -1.88720703125, -1.244140625, -0.60107421875, 0.0419921875, 0.68505859375, 1.328125, 1.97119140625, 2.6142578125, 3.25732421875, 3.900390625, 4.54345703125, 5.1865234375, 5.82958984375, 6.47265625, 7.11572265625, 7.7587890625, 8.40185546875, 9.044921875, 9.68798828125, 10.3310546875, 10.97412109375, 11.6171875, 12.26025390625, 12.9033203125, 13.54638671875, 14.189453125, 14.83251953125, 15.4755859375, 16.11865234375, 16.76171875, 17.40478515625, 18.0478515625, 18.69091796875, 19.333984375, 19.97705078125, 20.6201171875, 21.26318359375, 21.90625]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 2.0, 5.0, 2.0, 5.0, 7.0, 11.0, 14.0, 15.0, 12.0, 27.0, 33.0, 34.0, 50.0, 59.0, 67.0, 138.0, 224.0, 436.0, 1582.0, 46892.0, 3085285.0, 8859.0, 911.0, 346.0, 226.0, 125.0, 81.0, 49.0, 31.0, 36.0, 22.0, 20.0, 15.0, 25.0, 16.0, 14.0, 7.0, 11.0, 3.0, 6.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-34.21875, -33.1923828125, -32.166015625, -31.1396484375, -30.11328125, -29.0869140625, -28.060546875, -27.0341796875, -26.0078125, -24.9814453125, -23.955078125, -22.9287109375, -21.90234375, -20.8759765625, -19.849609375, -18.8232421875, -17.796875, -16.7705078125, -15.744140625, -14.7177734375, -13.69140625, -12.6650390625, -11.638671875, -10.6123046875, -9.5859375, -8.5595703125, -7.533203125, -6.5068359375, -5.48046875, -4.4541015625, -3.427734375, -2.4013671875, -1.375, -0.3486328125, 0.677734375, 1.7041015625, 2.73046875, 3.7568359375, 4.783203125, 5.8095703125, 6.8359375, 7.8623046875, 8.888671875, 9.9150390625, 10.94140625, 11.9677734375, 12.994140625, 14.0205078125, 15.046875, 16.0732421875, 17.099609375, 18.1259765625, 19.15234375, 20.1787109375, 21.205078125, 22.2314453125, 23.2578125, 24.2841796875, 25.310546875, 26.3369140625, 27.36328125, 28.3896484375, 29.416015625, 30.4423828125, 31.46875]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 176.0, 830.0, 11.0], "bins": [-297.5321044921875, -292.7522888183594, -287.9725036621094, -283.19268798828125, -278.4128723144531, -273.633056640625, -268.853271484375, -264.0734558105469, -259.29364013671875, -254.5138397216797, -249.73402404785156, -244.9542236328125, -240.17440795898438, -235.3946075439453, -230.6147918701172, -225.83499145507812, -221.05519104003906, -216.275390625, -211.49557495117188, -206.7157745361328, -201.9359588623047, -197.15615844726562, -192.3763427734375, -187.59654235839844, -182.81674194335938, -178.0369415283203, -173.2571258544922, -168.47732543945312, -163.697509765625, -158.91770935058594, -154.1378936767578, -149.35809326171875, -144.57827758789062, -139.79847717285156, -135.01866149902344, -130.23886108398438, -125.45904541015625, -120.67924499511719, -115.8994369506836, -111.11962890625, -106.33982849121094, -101.56002044677734, -96.78021240234375, -92.00040435791016, -87.22059631347656, -82.4407958984375, -77.6609878540039, -72.88117980957031, -68.10137176513672, -63.321563720703125, -58.54175567626953, -53.7619514465332, -48.98214340209961, -44.202335357666016, -39.42253112792969, -34.642723083496094, -29.8629150390625, -25.083106994628906, -20.303300857543945, -15.523493766784668, -10.74368667602539, -5.963878631591797, -1.184072494506836, 3.595733642578125, 8.375542640686035]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 2.0, 2.0, 2.0, 6.0, 6.0, 3.0, 16.0, 9.0, 11.0, 13.0, 17.0, 15.0, 24.0, 25.0, 25.0, 28.0, 27.0, 36.0, 37.0, 34.0, 32.0, 35.0, 43.0, 43.0, 33.0, 37.0, 41.0, 41.0, 40.0, 24.0, 40.0, 43.0, 19.0, 24.0, 21.0, 16.0, 23.0, 12.0, 19.0, 13.0, 11.0, 12.0, 11.0, 10.0, 8.0, 4.0, 3.0, 3.0, 0.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.67430877685547, -50.972103118896484, -49.2698974609375, -47.567691802978516, -45.86548614501953, -44.16328048706055, -42.46107482910156, -40.75886917114258, -39.056663513183594, -37.35445785522461, -35.652252197265625, -33.95004653930664, -32.247840881347656, -30.545635223388672, -28.843429565429688, -27.141223907470703, -25.43901824951172, -23.736812591552734, -22.03460693359375, -20.332401275634766, -18.63019561767578, -16.927989959716797, -15.225784301757812, -13.523578643798828, -11.821372985839844, -10.11916732788086, -8.416961669921875, -6.714756011962891, -5.012550354003906, -3.310344696044922, -1.6081390380859375, 0.09406661987304688, 1.7962760925292969, 3.4984817504882812, 5.200687408447266, 6.90289306640625, 8.605098724365234, 10.307304382324219, 12.009510040283203, 13.711715698242188, 15.413921356201172, 17.116127014160156, 18.81833267211914, 20.520538330078125, 22.22274398803711, 23.924949645996094, 25.627155303955078, 27.329360961914062, 29.031566619873047, 30.73377227783203, 32.435977935791016, 34.13818359375, 35.840389251708984, 37.54259490966797, 39.24480056762695, 40.94700622558594, 42.64921188354492, 44.351417541503906, 46.05362319946289, 47.755828857421875, 49.45803451538086, 51.160240173339844, 52.86244583129883, 54.56465148925781, 56.2668571472168]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 5.0, 9.0, 4.0, 9.0, 11.0, 7.0, 11.0, 25.0, 8.0, 19.0, 26.0, 25.0, 27.0, 34.0, 29.0, 23.0, 43.0, 27.0, 46.0, 37.0, 42.0, 47.0, 31.0, 47.0, 45.0, 38.0, 29.0, 32.0, 32.0, 25.0, 36.0, 24.0, 23.0, 22.0, 21.0, 21.0, 13.0, 9.0, 15.0, 11.0, 5.0, 6.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.078125, -4.9185791015625, -4.759033203125, -4.5994873046875, -4.43994140625, -4.2803955078125, -4.120849609375, -3.9613037109375, -3.8017578125, -3.6422119140625, -3.482666015625, -3.3231201171875, -3.16357421875, -3.0040283203125, -2.844482421875, -2.6849365234375, -2.525390625, -2.3658447265625, -2.206298828125, -2.0467529296875, -1.88720703125, -1.7276611328125, -1.568115234375, -1.4085693359375, -1.2490234375, -1.0894775390625, -0.929931640625, -0.7703857421875, -0.61083984375, -0.4512939453125, -0.291748046875, -0.1322021484375, 0.02734375, 0.1868896484375, 0.346435546875, 0.5059814453125, 0.66552734375, 0.8250732421875, 0.984619140625, 1.1441650390625, 1.3037109375, 1.4632568359375, 1.622802734375, 1.7823486328125, 1.94189453125, 2.1014404296875, 2.260986328125, 2.4205322265625, 2.580078125, 2.7396240234375, 2.899169921875, 3.0587158203125, 3.21826171875, 3.3778076171875, 3.537353515625, 3.6968994140625, 3.8564453125, 4.0159912109375, 4.175537109375, 4.3350830078125, 4.49462890625, 4.6541748046875, 4.813720703125, 4.9732666015625, 5.1328125]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 4.0, 7.0, 9.0, 9.0, 7.0, 7.0, 18.0, 11.0, 21.0, 28.0, 42.0, 61.0, 81.0, 103.0, 205.0, 456.0, 1428.0, 4870.0, 21706.0, 133498.0, 1113465.0, 2299938.0, 536597.0, 64585.0, 12262.0, 3094.0, 892.0, 326.0, 177.0, 118.0, 68.0, 46.0, 34.0, 23.0, 24.0, 16.0, 12.0, 13.0, 8.0, 7.0, 4.0, 6.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.71875, -10.37646484375, -10.0341796875, -9.69189453125, -9.349609375, -9.00732421875, -8.6650390625, -8.32275390625, -7.98046875, -7.63818359375, -7.2958984375, -6.95361328125, -6.611328125, -6.26904296875, -5.9267578125, -5.58447265625, -5.2421875, -4.89990234375, -4.5576171875, -4.21533203125, -3.873046875, -3.53076171875, -3.1884765625, -2.84619140625, -2.50390625, -2.16162109375, -1.8193359375, -1.47705078125, -1.134765625, -0.79248046875, -0.4501953125, -0.10791015625, 0.234375, 0.57666015625, 0.9189453125, 1.26123046875, 1.603515625, 1.94580078125, 2.2880859375, 2.63037109375, 2.97265625, 3.31494140625, 3.6572265625, 3.99951171875, 4.341796875, 4.68408203125, 5.0263671875, 5.36865234375, 5.7109375, 6.05322265625, 6.3955078125, 6.73779296875, 7.080078125, 7.42236328125, 7.7646484375, 8.10693359375, 8.44921875, 8.79150390625, 9.1337890625, 9.47607421875, 9.818359375, 10.16064453125, 10.5029296875, 10.84521484375, 11.1875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 6.0, 8.0, 8.0, 10.0, 10.0, 19.0, 17.0, 34.0, 64.0, 93.0, 115.0, 176.0, 220.0, 370.0, 514.0, 633.0, 556.0, 393.0, 237.0, 186.0, 138.0, 92.0, 51.0, 41.0, 28.0, 24.0, 14.0, 8.0, 3.0, 1.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.0, -22.387451171875, -21.77490234375, -21.162353515625, -20.5498046875, -19.937255859375, -19.32470703125, -18.712158203125, -18.099609375, -17.487060546875, -16.87451171875, -16.261962890625, -15.6494140625, -15.036865234375, -14.42431640625, -13.811767578125, -13.19921875, -12.586669921875, -11.97412109375, -11.361572265625, -10.7490234375, -10.136474609375, -9.52392578125, -8.911376953125, -8.298828125, -7.686279296875, -7.07373046875, -6.461181640625, -5.8486328125, -5.236083984375, -4.62353515625, -4.010986328125, -3.3984375, -2.785888671875, -2.17333984375, -1.560791015625, -0.9482421875, -0.335693359375, 0.27685546875, 0.889404296875, 1.501953125, 2.114501953125, 2.72705078125, 3.339599609375, 3.9521484375, 4.564697265625, 5.17724609375, 5.789794921875, 6.40234375, 7.014892578125, 7.62744140625, 8.239990234375, 8.8525390625, 9.465087890625, 10.07763671875, 10.690185546875, 11.302734375, 11.915283203125, 12.52783203125, 13.140380859375, 13.7529296875, 14.365478515625, 14.97802734375, 15.590576171875, 16.203125]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 5.0, 11.0, 5.0, 18.0, 35.0, 29.0, 75.0, 80.0, 140.0, 266.0, 632.0, 3771.0, 3802075.0, 384205.0, 1929.0, 447.0, 207.0, 122.0, 71.0, 58.0, 29.0, 28.0, 15.0, 5.0, 6.0, 5.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.375, -60.4755859375, -57.576171875, -54.6767578125, -51.77734375, -48.8779296875, -45.978515625, -43.0791015625, -40.1796875, -37.2802734375, -34.380859375, -31.4814453125, -28.58203125, -25.6826171875, -22.783203125, -19.8837890625, -16.984375, -14.0849609375, -11.185546875, -8.2861328125, -5.38671875, -2.4873046875, 0.412109375, 3.3115234375, 6.2109375, 9.1103515625, 12.009765625, 14.9091796875, 17.80859375, 20.7080078125, 23.607421875, 26.5068359375, 29.40625, 32.3056640625, 35.205078125, 38.1044921875, 41.00390625, 43.9033203125, 46.802734375, 49.7021484375, 52.6015625, 55.5009765625, 58.400390625, 61.2998046875, 64.19921875, 67.0986328125, 69.998046875, 72.8974609375, 75.796875, 78.6962890625, 81.595703125, 84.4951171875, 87.39453125, 90.2939453125, 93.193359375, 96.0927734375, 98.9921875, 101.8916015625, 104.791015625, 107.6904296875, 110.58984375, 113.4892578125, 116.388671875, 119.2880859375, 122.1875]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 50.0, 275.0, 463.0, 197.0, 20.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-367.4720153808594, -360.58819580078125, -353.7043762207031, -346.820556640625, -339.9367370605469, -333.05291748046875, -326.1690979003906, -319.2852783203125, -312.4014587402344, -305.51763916015625, -298.6338195800781, -291.75, -284.8661804199219, -277.98236083984375, -271.0985412597656, -264.2147216796875, -257.33087158203125, -250.44705200195312, -243.563232421875, -236.67941284179688, -229.79559326171875, -222.91177368164062, -216.0279541015625, -209.14413452148438, -202.26031494140625, -195.37649536132812, -188.49267578125, -181.60885620117188, -174.72503662109375, -167.84121704101562, -160.9573974609375, -154.07357788085938, -147.1897735595703, -140.3059539794922, -133.42213439941406, -126.53831481933594, -119.65449523925781, -112.77067565917969, -105.88684844970703, -99.0030288696289, -92.11920928955078, -85.23538970947266, -78.35157012939453, -71.46774291992188, -64.58392333984375, -57.70010757446289, -50.8162841796875, -43.932464599609375, -37.04864501953125, -30.164825439453125, -23.281003952026367, -16.39718246459961, -9.513362884521484, -2.6295433044433594, 4.254280090332031, 11.138099670410156, 18.02191925048828, 24.905738830566406, 31.789560317993164, 38.67338180541992, 45.55720138549805, 52.44102096557617, 59.32484436035156, 66.20866394042969, 73.09248352050781]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 2.0, 9.0, 5.0, 5.0, 8.0, 17.0, 15.0, 18.0, 15.0, 21.0, 24.0, 24.0, 40.0, 45.0, 28.0, 31.0, 44.0, 35.0, 29.0, 35.0, 38.0, 35.0, 49.0, 45.0, 42.0, 40.0, 42.0, 42.0, 32.0, 28.0, 25.0, 20.0, 21.0, 27.0, 13.0, 16.0, 14.0, 9.0, 6.0, 3.0, 1.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.37615966796875, -46.57379913330078, -44.77143478393555, -42.96907424926758, -41.166709899902344, -39.364349365234375, -37.561988830566406, -35.75962829589844, -33.9572639465332, -32.154903411865234, -30.3525390625, -28.55017852783203, -26.74781608581543, -24.945453643798828, -23.14309310913086, -21.340730667114258, -19.538368225097656, -17.736005783081055, -15.93364429473877, -14.131282806396484, -12.328920364379883, -10.526557922363281, -8.724196434020996, -6.921834945678711, -5.119472503662109, -3.317110538482666, -1.5147485733032227, 0.2876133918762207, 2.089975357055664, 3.8923377990722656, 5.694699287414551, 7.497060775756836, 9.299423217773438, 11.101785659790039, 12.904147148132324, 14.70650863647461, 16.50887107849121, 18.311233520507812, 20.11359405517578, 21.915956497192383, 23.718318939208984, 25.520681381225586, 27.323043823242188, 29.125404357910156, 30.927766799926758, 32.73012924194336, 34.53248977661133, 36.33485412597656, 38.13721466064453, 39.9395751953125, 41.741939544677734, 43.5443000793457, 45.34666442871094, 47.149024963378906, 48.951385498046875, 50.753746032714844, 52.55611038208008, 54.35847091674805, 56.16083526611328, 57.96319580078125, 59.76555633544922, 61.56792068481445, 63.37028121948242, 65.17264556884766, 66.97500610351562]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 6.0, 12.0, 6.0, 8.0, 7.0, 13.0, 13.0, 17.0, 20.0, 15.0, 18.0, 35.0, 26.0, 33.0, 35.0, 37.0, 34.0, 31.0, 44.0, 45.0, 44.0, 47.0, 40.0, 34.0, 42.0, 40.0, 33.0, 33.0, 39.0, 32.0, 27.0, 23.0, 21.0, 18.0, 18.0, 11.0, 12.0, 6.0, 12.0, 5.0, 4.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.43359375, -5.26409912109375, -5.0946044921875, -4.92510986328125, -4.755615234375, -4.58612060546875, -4.4166259765625, -4.24713134765625, -4.07763671875, -3.90814208984375, -3.7386474609375, -3.56915283203125, -3.399658203125, -3.23016357421875, -3.0606689453125, -2.89117431640625, -2.7216796875, -2.55218505859375, -2.3826904296875, -2.21319580078125, -2.043701171875, -1.87420654296875, -1.7047119140625, -1.53521728515625, -1.36572265625, -1.19622802734375, -1.0267333984375, -0.85723876953125, -0.687744140625, -0.51824951171875, -0.3487548828125, -0.17926025390625, -0.009765625, 0.15972900390625, 0.3292236328125, 0.49871826171875, 0.668212890625, 0.83770751953125, 1.0072021484375, 1.17669677734375, 1.34619140625, 1.51568603515625, 1.6851806640625, 1.85467529296875, 2.024169921875, 2.19366455078125, 2.3631591796875, 2.53265380859375, 2.7021484375, 2.87164306640625, 3.0411376953125, 3.21063232421875, 3.380126953125, 3.54962158203125, 3.7191162109375, 3.88861083984375, 4.05810546875, 4.22760009765625, 4.3970947265625, 4.56658935546875, 4.736083984375, 4.90557861328125, 5.0750732421875, 5.24456787109375, 5.4140625]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 7.0, 8.0, 13.0, 12.0, 19.0, 34.0, 41.0, 73.0, 96.0, 172.0, 219.0, 387.0, 566.0, 809.0, 1212.0, 1913.0, 2903.0, 4350.0, 6837.0, 10667.0, 16457.0, 25859.0, 40486.0, 63060.0, 99092.0, 159821.0, 211381.0, 146771.0, 92039.0, 57965.0, 37532.0, 24140.0, 15416.0, 9924.0, 6345.0, 4103.0, 2615.0, 1793.0, 1142.0, 743.0, 515.0, 337.0, 215.0, 170.0, 92.0, 75.0, 52.0, 32.0, 17.0, 20.0, 7.0, 7.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.58984375, -0.5716476440429688, -0.5534515380859375, -0.5352554321289062, -0.517059326171875, -0.49886322021484375, -0.4806671142578125, -0.46247100830078125, -0.44427490234375, -0.42607879638671875, -0.4078826904296875, -0.38968658447265625, -0.371490478515625, -0.35329437255859375, -0.3350982666015625, -0.31690216064453125, -0.2987060546875, -0.28050994873046875, -0.2623138427734375, -0.24411773681640625, -0.225921630859375, -0.20772552490234375, -0.1895294189453125, -0.17133331298828125, -0.15313720703125, -0.13494110107421875, -0.1167449951171875, -0.09854888916015625, -0.080352783203125, -0.06215667724609375, -0.0439605712890625, -0.02576446533203125, -0.007568359375, 0.01062774658203125, 0.0288238525390625, 0.04701995849609375, 0.065216064453125, 0.08341217041015625, 0.1016082763671875, 0.11980438232421875, 0.13800048828125, 0.15619659423828125, 0.1743927001953125, 0.19258880615234375, 0.210784912109375, 0.22898101806640625, 0.2471771240234375, 0.26537322998046875, 0.2835693359375, 0.30176544189453125, 0.3199615478515625, 0.33815765380859375, 0.356353759765625, 0.37454986572265625, 0.3927459716796875, 0.41094207763671875, 0.42913818359375, 0.44733428955078125, 0.4655303955078125, 0.48372650146484375, 0.501922607421875, 0.5201187133789062, 0.5383148193359375, 0.5565109252929688, 0.57470703125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 7.0, 6.0, 3.0, 7.0, 10.0, 11.0, 14.0, 13.0, 17.0, 17.0, 20.0, 33.0, 26.0, 29.0, 34.0, 43.0, 32.0, 47.0, 47.0, 33.0, 32.0, 1070.0, 42.0, 40.0, 51.0, 33.0, 31.0, 36.0, 33.0, 32.0, 29.0, 23.0, 22.0, 13.0, 22.0, 14.0, 11.0, 10.0, 7.0, 4.0, 5.0, 4.0, 1.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.005859375, -2.898529052734375, -2.79119873046875, -2.683868408203125, -2.5765380859375, -2.469207763671875, -2.36187744140625, -2.254547119140625, -2.147216796875, -2.039886474609375, -1.93255615234375, -1.825225830078125, -1.7178955078125, -1.610565185546875, -1.50323486328125, -1.395904541015625, -1.28857421875, -1.181243896484375, -1.07391357421875, -0.966583251953125, -0.8592529296875, -0.751922607421875, -0.64459228515625, -0.537261962890625, -0.429931640625, -0.322601318359375, -0.21527099609375, -0.107940673828125, -0.0006103515625, 0.106719970703125, 0.21405029296875, 0.321380615234375, 0.4287109375, 0.536041259765625, 0.64337158203125, 0.750701904296875, 0.8580322265625, 0.965362548828125, 1.07269287109375, 1.180023193359375, 1.287353515625, 1.394683837890625, 1.50201416015625, 1.609344482421875, 1.7166748046875, 1.824005126953125, 1.93133544921875, 2.038665771484375, 2.14599609375, 2.253326416015625, 2.36065673828125, 2.467987060546875, 2.5753173828125, 2.682647705078125, 2.78997802734375, 2.897308349609375, 3.004638671875, 3.111968994140625, 3.21929931640625, 3.326629638671875, 3.4339599609375, 3.541290283203125, 3.64862060546875, 3.755950927734375, 3.86328125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 7.0, 4.0, 10.0, 10.0, 15.0, 28.0, 46.0, 49.0, 60.0, 100.0, 157.0, 208.0, 334.0, 454.0, 671.0, 947.0, 1523.0, 2273.0, 3461.0, 5468.0, 8552.0, 13744.0, 22083.0, 36020.0, 59206.0, 97595.0, 159932.0, 1270708.0, 160944.0, 96662.0, 59108.0, 36579.0, 22182.0, 13747.0, 8564.0, 5318.0, 3539.0, 2277.0, 1440.0, 955.0, 726.0, 448.0, 298.0, 214.0, 152.0, 104.0, 65.0, 45.0, 31.0, 28.0, 14.0, 17.0, 7.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.521484375, -0.5038070678710938, -0.4861297607421875, -0.46845245361328125, -0.450775146484375, -0.43309783935546875, -0.4154205322265625, -0.39774322509765625, -0.38006591796875, -0.36238861083984375, -0.3447113037109375, -0.32703399658203125, -0.309356689453125, -0.29167938232421875, -0.2740020751953125, -0.25632476806640625, -0.2386474609375, -0.22097015380859375, -0.2032928466796875, -0.18561553955078125, -0.167938232421875, -0.15026092529296875, -0.1325836181640625, -0.11490631103515625, -0.09722900390625, -0.07955169677734375, -0.0618743896484375, -0.04419708251953125, -0.026519775390625, -0.00884246826171875, 0.0088348388671875, 0.02651214599609375, 0.044189453125, 0.06186676025390625, 0.0795440673828125, 0.09722137451171875, 0.114898681640625, 0.13257598876953125, 0.1502532958984375, 0.16793060302734375, 0.18560791015625, 0.20328521728515625, 0.2209625244140625, 0.23863983154296875, 0.256317138671875, 0.27399444580078125, 0.2916717529296875, 0.30934906005859375, 0.3270263671875, 0.34470367431640625, 0.3623809814453125, 0.38005828857421875, 0.397735595703125, 0.41541290283203125, 0.4330902099609375, 0.45076751708984375, 0.46844482421875, 0.48612213134765625, 0.5037994384765625, 0.5214767456054688, 0.539154052734375, 0.5568313598632812, 0.5745086669921875, 0.5921859741210938, 0.60986328125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 6.0, 3.0, 6.0, 9.0, 5.0, 20.0, 10.0, 28.0, 34.0, 48.0, 53.0, 65.0, 75.0, 99.0, 90.0, 76.0, 74.0, 66.0, 61.0, 37.0, 35.0, 23.0, 24.0, 13.0, 7.0, 12.0, 6.0, 5.0, 1.0, 0.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0029811859130859375, -0.002869337797164917, -0.0027574896812438965, -0.002645641565322876, -0.0025337934494018555, -0.002421945333480835, -0.0023100972175598145, -0.002198249101638794, -0.0020864009857177734, -0.001974552869796753, -0.0018627047538757324, -0.001750856637954712, -0.0016390085220336914, -0.001527160406112671, -0.0014153122901916504, -0.0013034641742706299, -0.0011916160583496094, -0.0010797679424285889, -0.0009679198265075684, -0.0008560717105865479, -0.0007442235946655273, -0.0006323754787445068, -0.0005205273628234863, -0.0004086792469024658, -0.0002968311309814453, -0.0001849830150604248, -7.31348991394043e-05, 3.871321678161621e-05, 0.00015056133270263672, 0.0002624094486236572, 0.00037425756454467773, 0.00048610568046569824, 0.0005979537963867188, 0.0007098019123077393, 0.0008216500282287598, 0.0009334981441497803, 0.0010453462600708008, 0.0011571943759918213, 0.0012690424919128418, 0.0013808906078338623, 0.0014927387237548828, 0.0016045868396759033, 0.0017164349555969238, 0.0018282830715179443, 0.0019401311874389648, 0.0020519793033599854, 0.002163827419281006, 0.0022756755352020264, 0.002387523651123047, 0.0024993717670440674, 0.002611219882965088, 0.0027230679988861084, 0.002834916114807129, 0.0029467642307281494, 0.00305861234664917, 0.0031704604625701904, 0.003282308578491211, 0.0033941566944122314, 0.003506004810333252, 0.0036178529262542725, 0.003729701042175293, 0.0038415491580963135, 0.003953397274017334, 0.0040652453899383545, 0.004177093505859375]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 7.0, 2.0, 2.0, 4.0, 5.0, 8.0, 10.0, 17.0, 14.0, 28.0, 37.0, 44.0, 73.0, 117.0, 274.0, 937.0, 1043395.0, 2700.0, 415.0, 157.0, 97.0, 53.0, 43.0, 33.0, 26.0, 13.0, 16.0, 5.0, 6.0, 4.0, 8.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0], "bins": [-0.11578369140625, -0.11286544799804688, -0.10994720458984375, -0.10702896118164062, -0.1041107177734375, -0.10119247436523438, -0.09827423095703125, -0.09535598754882812, -0.092437744140625, -0.08951950073242188, -0.08660125732421875, -0.08368301391601562, -0.0807647705078125, -0.07784652709960938, -0.07492828369140625, -0.07201004028320312, -0.069091796875, -0.06617355346679688, -0.06325531005859375, -0.060337066650390625, -0.0574188232421875, -0.054500579833984375, -0.05158233642578125, -0.048664093017578125, -0.045745849609375, -0.042827606201171875, -0.03990936279296875, -0.036991119384765625, -0.0340728759765625, -0.031154632568359375, -0.02823638916015625, -0.025318145751953125, -0.02239990234375, -0.019481658935546875, -0.01656341552734375, -0.013645172119140625, -0.0107269287109375, -0.007808685302734375, -0.00489044189453125, -0.001972198486328125, 0.000946044921875, 0.003864288330078125, 0.00678253173828125, 0.009700775146484375, 0.0126190185546875, 0.015537261962890625, 0.01845550537109375, 0.021373748779296875, 0.0242919921875, 0.027210235595703125, 0.03012847900390625, 0.033046722412109375, 0.0359649658203125, 0.038883209228515625, 0.04180145263671875, 0.044719696044921875, 0.047637939453125, 0.050556182861328125, 0.05347442626953125, 0.056392669677734375, 0.0593109130859375, 0.062229156494140625, 0.06514739990234375, 0.06806564331054688, 0.07098388671875]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 12.0, 101.0, 337.0, 415.0, 128.0, 21.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.007397281937301159, -0.007265530992299318, -0.00713377958163619, -0.00700202863663435, -0.006870277225971222, -0.006738526280969381, -0.006606775335967541, -0.006475023925304413, -0.006343272980302572, -0.006211522035300732, -0.006079770624637604, -0.005948019679635763, -0.005816268734633923, -0.005684517323970795, -0.005552766378968954, -0.005421014968305826, -0.005289264023303986, -0.005157513078302145, -0.005025761667639017, -0.0048940107226371765, -0.004762259311974049, -0.004630508366972208, -0.004498757421970367, -0.0043670060113072395, -0.004235255066305399, -0.004103504121303558, -0.0039717527106404305, -0.00384000176563859, -0.0037082505878061056, -0.0035764994099736214, -0.0034447484649717808, -0.0033129972871392965, -0.0031812461093068123, -0.003049494931474328, -0.002917743753641844, -0.002785992808640003, -0.002654241630807519, -0.0025224904529750347, -0.002390739507973194, -0.00225898833014071, -0.0021272371523082256, -0.0019954859744757414, -0.001863734913058579, -0.0017319838516414165, -0.0016002326738089323, -0.001468481495976448, -0.0013367304345592856, -0.0012049793731421232, -0.0010732280788943172, -0.0009414769592694938, -0.0008097258396446705, -0.0006779747200198472, -0.0005462236003950238, -0.0004144724807702005, -0.00028272136114537716, -0.00015097024152055383, -1.9219121895730495e-05, 0.00011253199772909284, 0.00024428311735391617, 0.0003760342369787395, 0.0005077853566035628, 0.0006395364762283862, 0.0007712875958532095, 0.0009030387154780328, 0.0010347898351028562]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 7.0, 12.0, 10.0, 10.0, 15.0, 18.0, 21.0, 18.0, 23.0, 24.0, 32.0, 24.0, 37.0, 41.0, 52.0, 42.0, 56.0, 39.0, 32.0, 39.0, 47.0, 56.0, 45.0, 42.0, 43.0, 30.0, 26.0, 26.0, 27.0, 16.0, 20.0, 18.0, 11.0, 10.0, 9.0, 8.0, 7.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0015050172805786133, -0.0014540227130055428, -0.0014030281454324722, -0.0013520335778594017, -0.0013010390102863312, -0.0012500444427132607, -0.0011990498751401901, -0.0011480553075671196, -0.001097060739994049, -0.0010460661724209785, -0.000995071604847908, -0.0009440770372748375, -0.000893082469701767, -0.0008420879021286964, -0.0007910933345556259, -0.0007400987669825554, -0.0006891041994094849, -0.0006381096318364143, -0.0005871150642633438, -0.0005361204966902733, -0.00048512592911720276, -0.00043413136154413223, -0.0003831367939710617, -0.0003321422263979912, -0.00028114765882492065, -0.00023015309125185013, -0.0001791585236787796, -0.00012816395610570908, -7.716938853263855e-05, -2.6174820959568024e-05, 2.4819746613502502e-05, 7.581431418657303e-05, 0.00012680888175964355, 0.00017780344933271408, 0.0002287980169057846, 0.00027979258447885513, 0.00033078715205192566, 0.0003817817196249962, 0.0004327762871980667, 0.00048377085477113724, 0.0005347654223442078, 0.0005857599899172783, 0.0006367545574903488, 0.0006877491250634193, 0.0007387436926364899, 0.0007897382602095604, 0.0008407328277826309, 0.0008917273953557014, 0.000942721962928772, 0.0009937165305018425, 0.001044711098074913, 0.0010957056656479836, 0.001146700233221054, 0.0011976948007941246, 0.0012486893683671951, 0.0012996839359402657, 0.0013506785035133362, 0.0014016730710864067, 0.0014526676386594772, 0.0015036622062325478, 0.0015546567738056183, 0.0016056513413786888, 0.0016566459089517593, 0.0017076404765248299, 0.0017586350440979004]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 6.0, 12.0, 6.0, 8.0, 7.0, 13.0, 13.0, 17.0, 20.0, 15.0, 18.0, 35.0, 26.0, 33.0, 35.0, 37.0, 34.0, 31.0, 44.0, 45.0, 44.0, 47.0, 40.0, 35.0, 41.0, 40.0, 33.0, 33.0, 39.0, 32.0, 27.0, 23.0, 21.0, 18.0, 18.0, 11.0, 12.0, 6.0, 12.0, 5.0, 4.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.43359375, -5.26409912109375, -5.0946044921875, -4.92510986328125, -4.755615234375, -4.58612060546875, -4.4166259765625, -4.24713134765625, -4.07763671875, -3.90814208984375, -3.7386474609375, -3.56915283203125, -3.399658203125, -3.23016357421875, -3.0606689453125, -2.89117431640625, -2.7216796875, -2.55218505859375, -2.3826904296875, -2.21319580078125, -2.043701171875, -1.87420654296875, -1.7047119140625, -1.53521728515625, -1.36572265625, -1.19622802734375, -1.0267333984375, -0.85723876953125, -0.687744140625, -0.51824951171875, -0.3487548828125, -0.17926025390625, -0.009765625, 0.15972900390625, 0.3292236328125, 0.49871826171875, 0.668212890625, 0.83770751953125, 1.0072021484375, 1.17669677734375, 1.34619140625, 1.51568603515625, 1.6851806640625, 1.85467529296875, 2.024169921875, 2.19366455078125, 2.3631591796875, 2.53265380859375, 2.7021484375, 2.87164306640625, 3.0411376953125, 3.21063232421875, 3.380126953125, 3.54962158203125, 3.7191162109375, 3.88861083984375, 4.05810546875, 4.22760009765625, 4.3970947265625, 4.56658935546875, 4.736083984375, 4.90557861328125, 5.0750732421875, 5.24456787109375, 5.4140625]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 11.0, 11.0, 15.0, 17.0, 22.0, 37.0, 35.0, 65.0, 82.0, 150.0, 186.0, 357.0, 566.0, 961.0, 1647.0, 3308.0, 6061.0, 12236.0, 28610.0, 78188.0, 236134.0, 399082.0, 177667.0, 58761.0, 22811.0, 10108.0, 5059.0, 2700.0, 1462.0, 824.0, 493.0, 283.0, 184.0, 127.0, 81.0, 59.0, 43.0, 31.0, 27.0, 18.0, 14.0, 4.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.390625, -3.28253173828125, -3.1744384765625, -3.06634521484375, -2.958251953125, -2.85015869140625, -2.7420654296875, -2.63397216796875, -2.52587890625, -2.41778564453125, -2.3096923828125, -2.20159912109375, -2.093505859375, -1.98541259765625, -1.8773193359375, -1.76922607421875, -1.6611328125, -1.55303955078125, -1.4449462890625, -1.33685302734375, -1.228759765625, -1.12066650390625, -1.0125732421875, -0.90447998046875, -0.79638671875, -0.68829345703125, -0.5802001953125, -0.47210693359375, -0.364013671875, -0.25592041015625, -0.1478271484375, -0.03973388671875, 0.068359375, 0.17645263671875, 0.2845458984375, 0.39263916015625, 0.500732421875, 0.60882568359375, 0.7169189453125, 0.82501220703125, 0.93310546875, 1.04119873046875, 1.1492919921875, 1.25738525390625, 1.365478515625, 1.47357177734375, 1.5816650390625, 1.68975830078125, 1.7978515625, 1.90594482421875, 2.0140380859375, 2.12213134765625, 2.230224609375, 2.33831787109375, 2.4464111328125, 2.55450439453125, 2.66259765625, 2.77069091796875, 2.8787841796875, 2.98687744140625, 3.094970703125, 3.20306396484375, 3.3111572265625, 3.41925048828125, 3.52734375]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 4.0, 9.0, 7.0, 9.0, 13.0, 9.0, 16.0, 10.0, 23.0, 25.0, 25.0, 33.0, 26.0, 46.0, 31.0, 44.0, 62.0, 41.0, 154.0, 1788.0, 191.0, 61.0, 56.0, 37.0, 49.0, 37.0, 27.0, 35.0, 32.0, 26.0, 19.0, 23.0, 16.0, 14.0, 11.0, 14.0, 6.0, 8.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0], "bins": [-21.21875, -20.60498046875, -19.9912109375, -19.37744140625, -18.763671875, -18.14990234375, -17.5361328125, -16.92236328125, -16.30859375, -15.69482421875, -15.0810546875, -14.46728515625, -13.853515625, -13.23974609375, -12.6259765625, -12.01220703125, -11.3984375, -10.78466796875, -10.1708984375, -9.55712890625, -8.943359375, -8.32958984375, -7.7158203125, -7.10205078125, -6.48828125, -5.87451171875, -5.2607421875, -4.64697265625, -4.033203125, -3.41943359375, -2.8056640625, -2.19189453125, -1.578125, -0.96435546875, -0.3505859375, 0.26318359375, 0.876953125, 1.49072265625, 2.1044921875, 2.71826171875, 3.33203125, 3.94580078125, 4.5595703125, 5.17333984375, 5.787109375, 6.40087890625, 7.0146484375, 7.62841796875, 8.2421875, 8.85595703125, 9.4697265625, 10.08349609375, 10.697265625, 11.31103515625, 11.9248046875, 12.53857421875, 13.15234375, 13.76611328125, 14.3798828125, 14.99365234375, 15.607421875, 16.22119140625, 16.8349609375, 17.44873046875, 18.0625]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 8.0, 11.0, 10.0, 11.0, 20.0, 21.0, 21.0, 36.0, 31.0, 49.0, 68.0, 72.0, 98.0, 192.0, 285.0, 594.0, 3039.0, 470076.0, 2664414.0, 4984.0, 664.0, 319.0, 192.0, 114.0, 89.0, 57.0, 46.0, 26.0, 32.0, 30.0, 13.0, 13.0, 11.0, 11.0, 12.0, 3.0, 11.0, 5.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-29.0, -28.0029296875, -27.005859375, -26.0087890625, -25.01171875, -24.0146484375, -23.017578125, -22.0205078125, -21.0234375, -20.0263671875, -19.029296875, -18.0322265625, -17.03515625, -16.0380859375, -15.041015625, -14.0439453125, -13.046875, -12.0498046875, -11.052734375, -10.0556640625, -9.05859375, -8.0615234375, -7.064453125, -6.0673828125, -5.0703125, -4.0732421875, -3.076171875, -2.0791015625, -1.08203125, -0.0849609375, 0.912109375, 1.9091796875, 2.90625, 3.9033203125, 4.900390625, 5.8974609375, 6.89453125, 7.8916015625, 8.888671875, 9.8857421875, 10.8828125, 11.8798828125, 12.876953125, 13.8740234375, 14.87109375, 15.8681640625, 16.865234375, 17.8623046875, 18.859375, 19.8564453125, 20.853515625, 21.8505859375, 22.84765625, 23.8447265625, 24.841796875, 25.8388671875, 26.8359375, 27.8330078125, 28.830078125, 29.8271484375, 30.82421875, 31.8212890625, 32.818359375, 33.8154296875, 34.8125]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 584.0, 432.0], "bins": [-451.4989929199219, -444.3240051269531, -437.1490478515625, -429.97406005859375, -422.7991027832031, -415.6241149902344, -408.44915771484375, -401.274169921875, -394.09918212890625, -386.9241943359375, -379.7492370605469, -372.5742492675781, -365.3992919921875, -358.22430419921875, -351.0493469238281, -343.8743591308594, -336.69940185546875, -329.5244140625, -322.3494567871094, -315.1744689941406, -307.99951171875, -300.82452392578125, -293.6495666503906, -286.4745788574219, -279.29962158203125, -272.1246337890625, -264.9496765136719, -257.7746887207031, -250.5997314453125, -243.42474365234375, -236.24977111816406, -229.07479858398438, -221.89981079101562, -214.72483825683594, -207.54986572265625, -200.37489318847656, -193.19992065429688, -186.02493286132812, -178.84996032714844, -171.67498779296875, -164.50001525878906, -157.32504272460938, -150.1500701904297, -142.97509765625, -135.80010986328125, -128.62515258789062, -121.45016479492188, -114.27519226074219, -107.10022735595703, -99.92525482177734, -92.75027465820312, -85.57530212402344, -78.40032958984375, -71.22535705566406, -64.05038452148438, -56.875404357910156, -49.70043182373047, -42.52545928955078, -35.35048294067383, -28.175508499145508, -21.000534057617188, -13.8255615234375, -6.650585174560547, 0.5243911743164062, 7.699365615844727]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 6.0, 8.0, 8.0, 13.0, 9.0, 10.0, 13.0, 21.0, 14.0, 18.0, 28.0, 34.0, 18.0, 21.0, 29.0, 29.0, 34.0, 39.0, 42.0, 30.0, 38.0, 41.0, 30.0, 29.0, 31.0, 37.0, 30.0, 39.0, 37.0, 25.0, 25.0, 21.0, 23.0, 24.0, 23.0, 17.0, 22.0, 15.0, 9.0, 15.0, 12.0, 9.0, 5.0, 4.0, 3.0, 10.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-54.6042594909668, -52.94281005859375, -51.28135681152344, -49.61990737915039, -47.958457946777344, -46.29700469970703, -44.635555267333984, -42.97410583496094, -41.312652587890625, -39.65120315551758, -37.989749908447266, -36.32830047607422, -34.66685104370117, -33.005401611328125, -31.343948364257812, -29.682498931884766, -28.02104949951172, -26.35959815979004, -24.698148727416992, -23.036697387695312, -21.375247955322266, -19.713796615600586, -18.052345275878906, -16.39089584350586, -14.72944450378418, -13.067994117736816, -11.406543731689453, -9.745092391967773, -8.08364200592041, -6.422191619873047, -4.760740280151367, -3.099289894104004, -1.4378433227539062, 0.22360730171203613, 1.8850579261779785, 3.5465087890625, 5.207959175109863, 6.869409561157227, 8.530860900878906, 10.19231128692627, 11.853761672973633, 13.515212059020996, 15.17666244506836, 16.83811378479004, 18.49956512451172, 20.161014556884766, 21.822465896606445, 23.483917236328125, 25.145366668701172, 26.80681800842285, 28.4682674407959, 30.129718780517578, 31.791168212890625, 33.45262145996094, 35.114070892333984, 36.77552032470703, 38.436973571777344, 40.09842300415039, 41.7598762512207, 43.42132568359375, 45.0827751159668, 46.744224548339844, 48.405677795410156, 50.0671272277832, 51.72857666015625]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 8.0, 8.0, 7.0, 7.0, 14.0, 12.0, 12.0, 22.0, 18.0, 20.0, 22.0, 29.0, 27.0, 35.0, 39.0, 37.0, 33.0, 31.0, 47.0, 42.0, 46.0, 45.0, 34.0, 42.0, 43.0, 39.0, 27.0, 38.0, 26.0, 32.0, 33.0, 16.0, 20.0, 24.0, 12.0, 10.0, 16.0, 9.0, 4.0, 4.0, 3.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-5.578125, -5.40667724609375, -5.2352294921875, -5.06378173828125, -4.892333984375, -4.72088623046875, -4.5494384765625, -4.37799072265625, -4.20654296875, -4.03509521484375, -3.8636474609375, -3.69219970703125, -3.520751953125, -3.34930419921875, -3.1778564453125, -3.00640869140625, -2.8349609375, -2.66351318359375, -2.4920654296875, -2.32061767578125, -2.149169921875, -1.97772216796875, -1.8062744140625, -1.63482666015625, -1.46337890625, -1.29193115234375, -1.1204833984375, -0.94903564453125, -0.777587890625, -0.60614013671875, -0.4346923828125, -0.26324462890625, -0.091796875, 0.07965087890625, 0.2510986328125, 0.42254638671875, 0.593994140625, 0.76544189453125, 0.9368896484375, 1.10833740234375, 1.27978515625, 1.45123291015625, 1.6226806640625, 1.79412841796875, 1.965576171875, 2.13702392578125, 2.3084716796875, 2.47991943359375, 2.6513671875, 2.82281494140625, 2.9942626953125, 3.16571044921875, 3.337158203125, 3.50860595703125, 3.6800537109375, 3.85150146484375, 4.02294921875, 4.19439697265625, 4.3658447265625, 4.53729248046875, 4.708740234375, 4.88018798828125, 5.0516357421875, 5.22308349609375, 5.39453125]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 10.0, 6.0, 7.0, 10.0, 16.0, 13.0, 15.0, 16.0, 21.0, 26.0, 27.0, 48.0, 53.0, 77.0, 176.0, 419.0, 1912.0, 15116.0, 249428.0, 3062958.0, 822585.0, 36243.0, 3737.0, 699.0, 262.0, 111.0, 64.0, 32.0, 40.0, 35.0, 24.0, 23.0, 17.0, 14.0, 11.0, 9.0, 9.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-18.84375, -18.2841796875, -17.724609375, -17.1650390625, -16.60546875, -16.0458984375, -15.486328125, -14.9267578125, -14.3671875, -13.8076171875, -13.248046875, -12.6884765625, -12.12890625, -11.5693359375, -11.009765625, -10.4501953125, -9.890625, -9.3310546875, -8.771484375, -8.2119140625, -7.65234375, -7.0927734375, -6.533203125, -5.9736328125, -5.4140625, -4.8544921875, -4.294921875, -3.7353515625, -3.17578125, -2.6162109375, -2.056640625, -1.4970703125, -0.9375, -0.3779296875, 0.181640625, 0.7412109375, 1.30078125, 1.8603515625, 2.419921875, 2.9794921875, 3.5390625, 4.0986328125, 4.658203125, 5.2177734375, 5.77734375, 6.3369140625, 6.896484375, 7.4560546875, 8.015625, 8.5751953125, 9.134765625, 9.6943359375, 10.25390625, 10.8134765625, 11.373046875, 11.9326171875, 12.4921875, 13.0517578125, 13.611328125, 14.1708984375, 14.73046875, 15.2900390625, 15.849609375, 16.4091796875, 16.96875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 2.0, 7.0, 12.0, 15.0, 15.0, 27.0, 32.0, 36.0, 48.0, 71.0, 68.0, 90.0, 169.0, 194.0, 244.0, 365.0, 390.0, 474.0, 434.0, 296.0, 263.0, 226.0, 143.0, 102.0, 75.0, 77.0, 50.0, 39.0, 36.0, 23.0, 15.0, 12.0, 9.0, 8.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-18.71875, -18.2457275390625, -17.772705078125, -17.2996826171875, -16.82666015625, -16.3536376953125, -15.880615234375, -15.4075927734375, -14.9345703125, -14.4615478515625, -13.988525390625, -13.5155029296875, -13.04248046875, -12.5694580078125, -12.096435546875, -11.6234130859375, -11.150390625, -10.6773681640625, -10.204345703125, -9.7313232421875, -9.25830078125, -8.7852783203125, -8.312255859375, -7.8392333984375, -7.3662109375, -6.8931884765625, -6.420166015625, -5.9471435546875, -5.47412109375, -5.0010986328125, -4.528076171875, -4.0550537109375, -3.58203125, -3.1090087890625, -2.635986328125, -2.1629638671875, -1.68994140625, -1.2169189453125, -0.743896484375, -0.2708740234375, 0.2021484375, 0.6751708984375, 1.148193359375, 1.6212158203125, 2.09423828125, 2.5672607421875, 3.040283203125, 3.5133056640625, 3.986328125, 4.4593505859375, 4.932373046875, 5.4053955078125, 5.87841796875, 6.3514404296875, 6.824462890625, 7.2974853515625, 7.7705078125, 8.2435302734375, 8.716552734375, 9.1895751953125, 9.66259765625, 10.1356201171875, 10.608642578125, 11.0816650390625, 11.5546875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 7.0, 3.0, 5.0, 13.0, 12.0, 12.0, 11.0, 29.0, 37.0, 42.0, 49.0, 76.0, 98.0, 122.0, 190.0, 306.0, 489.0, 1721.0, 75695.0, 4047454.0, 64844.0, 1619.0, 503.0, 254.0, 183.0, 143.0, 86.0, 62.0, 38.0, 39.0, 37.0, 24.0, 23.0, 15.0, 8.0, 10.0, 6.0, 8.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.09375, -42.21630859375, -40.3388671875, -38.46142578125, -36.583984375, -34.70654296875, -32.8291015625, -30.95166015625, -29.07421875, -27.19677734375, -25.3193359375, -23.44189453125, -21.564453125, -19.68701171875, -17.8095703125, -15.93212890625, -14.0546875, -12.17724609375, -10.2998046875, -8.42236328125, -6.544921875, -4.66748046875, -2.7900390625, -0.91259765625, 0.96484375, 2.84228515625, 4.7197265625, 6.59716796875, 8.474609375, 10.35205078125, 12.2294921875, 14.10693359375, 15.984375, 17.86181640625, 19.7392578125, 21.61669921875, 23.494140625, 25.37158203125, 27.2490234375, 29.12646484375, 31.00390625, 32.88134765625, 34.7587890625, 36.63623046875, 38.513671875, 40.39111328125, 42.2685546875, 44.14599609375, 46.0234375, 47.90087890625, 49.7783203125, 51.65576171875, 53.533203125, 55.41064453125, 57.2880859375, 59.16552734375, 61.04296875, 62.92041015625, 64.7978515625, 66.67529296875, 68.552734375, 70.43017578125, 72.3076171875, 74.18505859375, 76.0625]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 19.0, 120.0, 306.0, 388.0, 154.0, 24.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-113.35067749023438, -106.73175811767578, -100.11283874511719, -93.4939193725586, -86.875, -80.25607299804688, -73.63716125488281, -67.01823425292969, -60.39931869506836, -53.780399322509766, -47.16147994995117, -40.54255676269531, -33.92363739013672, -27.304718017578125, -20.68579864501953, -14.066879272460938, -7.447959899902344, -0.8290400505065918, 5.78987979888916, 12.40880012512207, 19.027719497680664, 25.64664077758789, 32.265560150146484, 38.88447952270508, 45.50339889526367, 52.122318267822266, 58.74123764038086, 65.36016082763672, 71.97908020019531, 78.5979995727539, 85.2169189453125, 91.8358383178711, 98.45475769042969, 105.07367706298828, 111.69259643554688, 118.31151580810547, 124.93043518066406, 131.5493621826172, 138.16827392578125, 144.78720092773438, 151.40611267089844, 158.02503967285156, 164.64395141601562, 171.26287841796875, 177.8817901611328, 184.50071716308594, 191.11962890625, 197.73855590820312, 204.35748291015625, 210.97640991210938, 217.59532165527344, 224.21424865722656, 230.83316040039062, 237.45208740234375, 244.0709991455078, 250.68992614746094, 257.308837890625, 263.9277648925781, 270.54669189453125, 277.16558837890625, 283.7845153808594, 290.4034423828125, 297.0223693847656, 303.6412658691406, 310.26019287109375]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 1.0, 5.0, 3.0, 4.0, 9.0, 11.0, 8.0, 10.0, 13.0, 13.0, 17.0, 18.0, 23.0, 21.0, 30.0, 22.0, 27.0, 29.0, 35.0, 40.0, 48.0, 39.0, 48.0, 27.0, 43.0, 50.0, 47.0, 31.0, 46.0, 21.0, 32.0, 27.0, 18.0, 36.0, 28.0, 23.0, 10.0, 17.0, 11.0, 19.0, 6.0, 11.0, 3.0, 6.0, 2.0, 7.0, 2.0, 1.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-46.59754943847656, -45.07670974731445, -43.555870056152344, -42.035030364990234, -40.514190673828125, -38.993350982666016, -37.472511291503906, -35.9516716003418, -34.43083190917969, -32.90999221801758, -31.38915252685547, -29.86831283569336, -28.34747314453125, -26.82663345336914, -25.30579376220703, -23.784954071044922, -22.264114379882812, -20.743274688720703, -19.222434997558594, -17.701595306396484, -16.180755615234375, -14.659915924072266, -13.139076232910156, -11.618236541748047, -10.097396850585938, -8.576557159423828, -7.055717468261719, -5.534877777099609, -4.0140380859375, -2.4931983947753906, -0.9723587036132812, 0.5484809875488281, 2.0693206787109375, 3.590160369873047, 5.111000061035156, 6.631839752197266, 8.152679443359375, 9.673519134521484, 11.194358825683594, 12.715198516845703, 14.236038208007812, 15.756877899169922, 17.27771759033203, 18.79855728149414, 20.31939697265625, 21.84023666381836, 23.36107635498047, 24.881916046142578, 26.402755737304688, 27.923595428466797, 29.444435119628906, 30.965274810791016, 32.486114501953125, 34.006954193115234, 35.527793884277344, 37.04863357543945, 38.56947326660156, 40.09031295776367, 41.61115264892578, 43.13199234008789, 44.65283203125, 46.17367172241211, 47.69451141357422, 49.21535110473633, 50.73619079589844]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 3.0, 5.0, 8.0, 6.0, 6.0, 13.0, 17.0, 15.0, 16.0, 17.0, 21.0, 18.0, 24.0, 29.0, 21.0, 36.0, 37.0, 31.0, 40.0, 43.0, 40.0, 32.0, 49.0, 44.0, 44.0, 31.0, 38.0, 31.0, 35.0, 25.0, 29.0, 38.0, 32.0, 15.0, 19.0, 17.0, 18.0, 9.0, 10.0, 14.0, 8.0, 8.0, 5.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.60546875, -5.4368896484375, -5.268310546875, -5.0997314453125, -4.93115234375, -4.7625732421875, -4.593994140625, -4.4254150390625, -4.2568359375, -4.0882568359375, -3.919677734375, -3.7510986328125, -3.58251953125, -3.4139404296875, -3.245361328125, -3.0767822265625, -2.908203125, -2.7396240234375, -2.571044921875, -2.4024658203125, -2.23388671875, -2.0653076171875, -1.896728515625, -1.7281494140625, -1.5595703125, -1.3909912109375, -1.222412109375, -1.0538330078125, -0.88525390625, -0.7166748046875, -0.548095703125, -0.3795166015625, -0.2109375, -0.0423583984375, 0.126220703125, 0.2947998046875, 0.46337890625, 0.6319580078125, 0.800537109375, 0.9691162109375, 1.1376953125, 1.3062744140625, 1.474853515625, 1.6434326171875, 1.81201171875, 1.9805908203125, 2.149169921875, 2.3177490234375, 2.486328125, 2.6549072265625, 2.823486328125, 2.9920654296875, 3.16064453125, 3.3292236328125, 3.497802734375, 3.6663818359375, 3.8349609375, 4.0035400390625, 4.172119140625, 4.3406982421875, 4.50927734375, 4.6778564453125, 4.846435546875, 5.0150146484375, 5.18359375]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 2.0, 2.0, 4.0, 13.0, 8.0, 17.0, 35.0, 32.0, 49.0, 72.0, 109.0, 170.0, 221.0, 306.0, 524.0, 707.0, 1011.0, 1451.0, 2158.0, 3216.0, 4900.0, 7646.0, 11774.0, 17995.0, 27548.0, 43748.0, 68809.0, 110470.0, 177604.0, 202225.0, 134135.0, 83501.0, 52322.0, 33353.0, 21582.0, 13994.0, 8958.0, 5908.0, 3895.0, 2557.0, 1782.0, 1189.0, 822.0, 549.0, 382.0, 229.0, 202.0, 112.0, 85.0, 51.0, 42.0, 26.0, 20.0, 11.0, 10.0, 5.0, 8.0, 5.0, 3.0, 1.0, 2.0], "bins": [-0.57861328125, -0.5606460571289062, -0.5426788330078125, -0.5247116088867188, -0.506744384765625, -0.48877716064453125, -0.4708099365234375, -0.45284271240234375, -0.43487548828125, -0.41690826416015625, -0.3989410400390625, -0.38097381591796875, -0.363006591796875, -0.34503936767578125, -0.3270721435546875, -0.30910491943359375, -0.2911376953125, -0.27317047119140625, -0.2552032470703125, -0.23723602294921875, -0.219268798828125, -0.20130157470703125, -0.1833343505859375, -0.16536712646484375, -0.14739990234375, -0.12943267822265625, -0.1114654541015625, -0.09349822998046875, -0.075531005859375, -0.05756378173828125, -0.0395965576171875, -0.02162933349609375, -0.003662109375, 0.01430511474609375, 0.0322723388671875, 0.05023956298828125, 0.068206787109375, 0.08617401123046875, 0.1041412353515625, 0.12210845947265625, 0.14007568359375, 0.15804290771484375, 0.1760101318359375, 0.19397735595703125, 0.211944580078125, 0.22991180419921875, 0.2478790283203125, 0.26584625244140625, 0.2838134765625, 0.30178070068359375, 0.3197479248046875, 0.33771514892578125, 0.355682373046875, 0.37364959716796875, 0.3916168212890625, 0.40958404541015625, 0.42755126953125, 0.44551849365234375, 0.4634857177734375, 0.48145294189453125, 0.499420166015625, 0.5173873901367188, 0.5353546142578125, 0.5533218383789062, 0.5712890625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 4.0, 2.0, 7.0, 5.0, 7.0, 14.0, 12.0, 10.0, 15.0, 20.0, 16.0, 16.0, 27.0, 21.0, 31.0, 22.0, 32.0, 38.0, 37.0, 37.0, 30.0, 46.0, 38.0, 1063.0, 33.0, 51.0, 42.0, 34.0, 32.0, 31.0, 21.0, 28.0, 34.0, 16.0, 27.0, 24.0, 24.0, 15.0, 12.0, 9.0, 10.0, 7.0, 10.0, 5.0, 6.0, 4.0, 2.0, 5.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.19140625, -3.087066650390625, -2.98272705078125, -2.878387451171875, -2.7740478515625, -2.669708251953125, -2.56536865234375, -2.461029052734375, -2.356689453125, -2.252349853515625, -2.14801025390625, -2.043670654296875, -1.9393310546875, -1.834991455078125, -1.73065185546875, -1.626312255859375, -1.52197265625, -1.417633056640625, -1.31329345703125, -1.208953857421875, -1.1046142578125, -1.000274658203125, -0.89593505859375, -0.791595458984375, -0.687255859375, -0.582916259765625, -0.47857666015625, -0.374237060546875, -0.2698974609375, -0.165557861328125, -0.06121826171875, 0.043121337890625, 0.1474609375, 0.251800537109375, 0.35614013671875, 0.460479736328125, 0.5648193359375, 0.669158935546875, 0.77349853515625, 0.877838134765625, 0.982177734375, 1.086517333984375, 1.19085693359375, 1.295196533203125, 1.3995361328125, 1.503875732421875, 1.60821533203125, 1.712554931640625, 1.81689453125, 1.921234130859375, 2.02557373046875, 2.129913330078125, 2.2342529296875, 2.338592529296875, 2.44293212890625, 2.547271728515625, 2.651611328125, 2.755950927734375, 2.86029052734375, 2.964630126953125, 3.0689697265625, 3.173309326171875, 3.27764892578125, 3.381988525390625, 3.486328125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 4.0, 6.0, 9.0, 11.0, 12.0, 17.0, 28.0, 41.0, 80.0, 86.0, 135.0, 194.0, 297.0, 452.0, 654.0, 910.0, 1352.0, 1993.0, 3011.0, 4530.0, 6963.0, 10785.0, 16587.0, 25621.0, 39322.0, 62215.0, 100291.0, 163404.0, 1260541.0, 147553.0, 90318.0, 56662.0, 36104.0, 23377.0, 14760.0, 9669.0, 6233.0, 4241.0, 2832.0, 1858.0, 1250.0, 883.0, 588.0, 387.0, 291.0, 190.0, 115.0, 90.0, 62.0, 31.0, 45.0, 22.0, 15.0, 8.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.52978515625, -0.512908935546875, -0.49603271484375, -0.479156494140625, -0.4622802734375, -0.445404052734375, -0.42852783203125, -0.411651611328125, -0.394775390625, -0.377899169921875, -0.36102294921875, -0.344146728515625, -0.3272705078125, -0.310394287109375, -0.29351806640625, -0.276641845703125, -0.259765625, -0.242889404296875, -0.22601318359375, -0.209136962890625, -0.1922607421875, -0.175384521484375, -0.15850830078125, -0.141632080078125, -0.124755859375, -0.107879638671875, -0.09100341796875, -0.074127197265625, -0.0572509765625, -0.040374755859375, -0.02349853515625, -0.006622314453125, 0.01025390625, 0.027130126953125, 0.04400634765625, 0.060882568359375, 0.0777587890625, 0.094635009765625, 0.11151123046875, 0.128387451171875, 0.145263671875, 0.162139892578125, 0.17901611328125, 0.195892333984375, 0.2127685546875, 0.229644775390625, 0.24652099609375, 0.263397216796875, 0.2802734375, 0.297149658203125, 0.31402587890625, 0.330902099609375, 0.3477783203125, 0.364654541015625, 0.38153076171875, 0.398406982421875, 0.415283203125, 0.432159423828125, 0.44903564453125, 0.465911865234375, 0.4827880859375, 0.499664306640625, 0.51654052734375, 0.533416748046875, 0.55029296875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 7.0, 3.0, 3.0, 7.0, 9.0, 6.0, 9.0, 9.0, 12.0, 17.0, 21.0, 23.0, 43.0, 49.0, 51.0, 70.0, 69.0, 92.0, 86.0, 87.0, 84.0, 45.0, 43.0, 31.0, 33.0, 22.0, 17.0, 9.0, 10.0, 3.0, 10.0, 8.0, 5.0, 1.0, 1.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0027713775634765625, -0.00266873836517334, -0.002566099166870117, -0.0024634599685668945, -0.002360820770263672, -0.0022581815719604492, -0.0021555423736572266, -0.002052903175354004, -0.0019502639770507812, -0.0018476247787475586, -0.001744985580444336, -0.0016423463821411133, -0.0015397071838378906, -0.001437067985534668, -0.0013344287872314453, -0.0012317895889282227, -0.001129150390625, -0.0010265111923217773, -0.0009238719940185547, -0.000821232795715332, -0.0007185935974121094, -0.0006159543991088867, -0.0005133152008056641, -0.0004106760025024414, -0.00030803680419921875, -0.0002053976058959961, -0.00010275840759277344, -1.1920928955078125e-07, 0.00010251998901367188, 0.00020515918731689453, 0.0003077983856201172, 0.00041043758392333984, 0.0005130767822265625, 0.0006157159805297852, 0.0007183551788330078, 0.0008209943771362305, 0.0009236335754394531, 0.0010262727737426758, 0.0011289119720458984, 0.001231551170349121, 0.0013341903686523438, 0.0014368295669555664, 0.001539468765258789, 0.0016421079635620117, 0.0017447471618652344, 0.001847386360168457, 0.0019500255584716797, 0.0020526647567749023, 0.002155303955078125, 0.0022579431533813477, 0.0023605823516845703, 0.002463221549987793, 0.0025658607482910156, 0.0026684999465942383, 0.002771139144897461, 0.0028737783432006836, 0.0029764175415039062, 0.003079056739807129, 0.0031816959381103516, 0.0032843351364135742, 0.003386974334716797, 0.0034896135330200195, 0.003592252731323242, 0.003694891929626465, 0.0037975311279296875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 0.0, 4.0, 5.0, 7.0, 7.0, 8.0, 6.0, 12.0, 11.0, 17.0, 29.0, 59.0, 108.0, 211.0, 535.0, 14478.0, 1031547.0, 886.0, 280.0, 134.0, 61.0, 35.0, 31.0, 25.0, 4.0, 11.0, 12.0, 10.0, 5.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.1180419921875, -0.11495113372802734, -0.11186027526855469, -0.10876941680908203, -0.10567855834960938, -0.10258769989013672, -0.09949684143066406, -0.0964059829711914, -0.09331512451171875, -0.0902242660522461, -0.08713340759277344, -0.08404254913330078, -0.08095169067382812, -0.07786083221435547, -0.07476997375488281, -0.07167911529541016, -0.0685882568359375, -0.06549739837646484, -0.06240653991699219, -0.05931568145751953, -0.056224822998046875, -0.05313396453857422, -0.05004310607910156, -0.046952247619628906, -0.04386138916015625, -0.040770530700683594, -0.03767967224121094, -0.03458881378173828, -0.031497955322265625, -0.02840709686279297, -0.025316238403320312, -0.022225379943847656, -0.019134521484375, -0.016043663024902344, -0.012952804565429688, -0.009861946105957031, -0.006771087646484375, -0.0036802291870117188, -0.0005893707275390625, 0.0025014877319335938, 0.00559234619140625, 0.008683204650878906, 0.011774063110351562, 0.014864921569824219, 0.017955780029296875, 0.02104663848876953, 0.024137496948242188, 0.027228355407714844, 0.0303192138671875, 0.033410072326660156, 0.03650093078613281, 0.03959178924560547, 0.042682647705078125, 0.04577350616455078, 0.04886436462402344, 0.051955223083496094, 0.05504608154296875, 0.058136940002441406, 0.06122779846191406, 0.06431865692138672, 0.06740951538085938, 0.07050037384033203, 0.07359123229980469, 0.07668209075927734, 0.07977294921875]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 26.0, 408.0, 531.0, 47.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.011294923722743988, -0.011044549755752087, -0.010794175788760185, -0.010543801821768284, -0.010293427854776382, -0.010043052956461906, -0.009792678989470005, -0.009542305022478104, -0.009291931055486202, -0.0090415570884943, -0.0087911831215024, -0.008540809154510498, -0.008290434256196022, -0.00804006028920412, -0.007789686322212219, -0.007539312355220318, -0.0072889383882284164, -0.007038564421236515, -0.006788190454244614, -0.006537816021591425, -0.0062874420545995235, -0.006037068087607622, -0.0057866936549544334, -0.005536319687962532, -0.005285945720970631, -0.005035571753978729, -0.004785197786986828, -0.004534823354333639, -0.004284449387341738, -0.004034075420349836, -0.0037837012205272913, -0.0035333270207047462, -0.0032829521223902702, -0.003032578155398369, -0.002782203955575824, -0.0025318297557532787, -0.0022814557887613773, -0.002031081821769476, -0.0017807076219469309, -0.0015303335385397077, -0.0012799594551324844, -0.0010295853717252612, -0.000779211288318038, -0.0005288372049108148, -0.00027846312150359154, -2.8089038096368313e-05, 0.0002222850453108549, 0.00047265912871807814, 0.0007230332121253014, 0.0009734072955325246, 0.0012237813789397478, 0.001474155462346971, 0.0017245295457541943, 0.0019749035127460957, 0.0022252777125686407, 0.0024756519123911858, 0.002726025879383087, 0.0029763998463749886, 0.0032267740461975336, 0.0034771482460200787, 0.00372752221301198, 0.0039778961800038815, 0.00422827061265707, 0.0044786445796489716, 0.004729018546640873]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 6.0, 9.0, 4.0, 11.0, 11.0, 8.0, 12.0, 15.0, 22.0, 21.0, 19.0, 21.0, 25.0, 20.0, 32.0, 30.0, 34.0, 35.0, 47.0, 49.0, 52.0, 32.0, 49.0, 37.0, 33.0, 50.0, 36.0, 31.0, 39.0, 37.0, 31.0, 27.0, 25.0, 12.0, 19.0, 8.0, 8.0, 10.0, 10.0, 7.0, 2.0, 6.0, 5.0, 5.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0013399720191955566, -0.001294896937906742, -0.0012498218566179276, -0.001204746775329113, -0.0011596716940402985, -0.001114596612751484, -0.0010695215314626694, -0.0010244464501738548, -0.0009793713688850403, -0.0009342962875962257, -0.0008892212063074112, -0.0008441461250185966, -0.0007990710437297821, -0.0007539959624409676, -0.000708920881152153, -0.0006638457998633385, -0.0006187707185745239, -0.0005736956372857094, -0.0005286205559968948, -0.0004835454747080803, -0.00043847039341926575, -0.0003933953121304512, -0.00034832023084163666, -0.0003032451495528221, -0.00025817006826400757, -0.00021309498697519302, -0.00016801990568637848, -0.00012294482439756393, -7.786974310874939e-05, -3.2794661819934845e-05, 1.22804194688797e-05, 5.7355500757694244e-05, 0.00010243058204650879, 0.00014750566333532333, 0.00019258074462413788, 0.00023765582591295242, 0.00028273090720176697, 0.0003278059884905815, 0.00037288106977939606, 0.0004179561510682106, 0.00046303123235702515, 0.0005081063136458397, 0.0005531813949346542, 0.0005982564762234688, 0.0006433315575122833, 0.0006884066388010979, 0.0007334817200899124, 0.000778556801378727, 0.0008236318826675415, 0.000868706963956356, 0.0009137820452451706, 0.0009588571265339851, 0.0010039322078227997, 0.0010490072891116142, 0.0010940823704004288, 0.0011391574516892433, 0.0011842325329780579, 0.0012293076142668724, 0.001274382695555687, 0.0013194577768445015, 0.001364532858133316, 0.0014096079394221306, 0.0014546830207109451, 0.0014997581019997597, 0.0015448331832885742]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 3.0, 5.0, 8.0, 6.0, 6.0, 13.0, 17.0, 15.0, 16.0, 17.0, 21.0, 18.0, 24.0, 30.0, 20.0, 36.0, 37.0, 31.0, 40.0, 43.0, 40.0, 32.0, 49.0, 44.0, 44.0, 31.0, 38.0, 31.0, 35.0, 25.0, 29.0, 38.0, 32.0, 15.0, 19.0, 17.0, 18.0, 9.0, 10.0, 14.0, 8.0, 8.0, 5.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.60546875, -5.4368896484375, -5.268310546875, -5.0997314453125, -4.93115234375, -4.7625732421875, -4.593994140625, -4.4254150390625, -4.2568359375, -4.0882568359375, -3.919677734375, -3.7510986328125, -3.58251953125, -3.4139404296875, -3.245361328125, -3.0767822265625, -2.908203125, -2.7396240234375, -2.571044921875, -2.4024658203125, -2.23388671875, -2.0653076171875, -1.896728515625, -1.7281494140625, -1.5595703125, -1.3909912109375, -1.222412109375, -1.0538330078125, -0.88525390625, -0.7166748046875, -0.548095703125, -0.3795166015625, -0.2109375, -0.0423583984375, 0.126220703125, 0.2947998046875, 0.46337890625, 0.6319580078125, 0.800537109375, 0.9691162109375, 1.1376953125, 1.3062744140625, 1.474853515625, 1.6434326171875, 1.81201171875, 1.9805908203125, 2.149169921875, 2.3177490234375, 2.486328125, 2.6549072265625, 2.823486328125, 2.9920654296875, 3.16064453125, 3.3292236328125, 3.497802734375, 3.6663818359375, 3.8349609375, 4.0035400390625, 4.172119140625, 4.3406982421875, 4.50927734375, 4.6778564453125, 4.846435546875, 5.0150146484375, 5.18359375]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 6.0, 7.0, 9.0, 14.0, 19.0, 34.0, 33.0, 54.0, 60.0, 109.0, 170.0, 210.0, 277.0, 459.0, 654.0, 1002.0, 1414.0, 2237.0, 3244.0, 5062.0, 8722.0, 16086.0, 35651.0, 100269.0, 403159.0, 318928.0, 83384.0, 30891.0, 14501.0, 7879.0, 4673.0, 3046.0, 2027.0, 1310.0, 893.0, 631.0, 440.0, 259.0, 234.0, 173.0, 97.0, 67.0, 60.0, 27.0, 23.0, 17.0, 14.0, 10.0, 5.0, 7.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-4.76171875, -4.6170654296875, -4.472412109375, -4.3277587890625, -4.18310546875, -4.0384521484375, -3.893798828125, -3.7491455078125, -3.6044921875, -3.4598388671875, -3.315185546875, -3.1705322265625, -3.02587890625, -2.8812255859375, -2.736572265625, -2.5919189453125, -2.447265625, -2.3026123046875, -2.157958984375, -2.0133056640625, -1.86865234375, -1.7239990234375, -1.579345703125, -1.4346923828125, -1.2900390625, -1.1453857421875, -1.000732421875, -0.8560791015625, -0.71142578125, -0.5667724609375, -0.422119140625, -0.2774658203125, -0.1328125, 0.0118408203125, 0.156494140625, 0.3011474609375, 0.44580078125, 0.5904541015625, 0.735107421875, 0.8797607421875, 1.0244140625, 1.1690673828125, 1.313720703125, 1.4583740234375, 1.60302734375, 1.7476806640625, 1.892333984375, 2.0369873046875, 2.181640625, 2.3262939453125, 2.470947265625, 2.6156005859375, 2.76025390625, 2.9049072265625, 3.049560546875, 3.1942138671875, 3.3388671875, 3.4835205078125, 3.628173828125, 3.7728271484375, 3.91748046875, 4.0621337890625, 4.206787109375, 4.3514404296875, 4.49609375]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 5.0, 4.0, 3.0, 4.0, 9.0, 15.0, 14.0, 12.0, 14.0, 23.0, 18.0, 18.0, 36.0, 23.0, 32.0, 38.0, 40.0, 42.0, 47.0, 53.0, 74.0, 268.0, 1660.0, 120.0, 70.0, 56.0, 49.0, 41.0, 31.0, 28.0, 36.0, 33.0, 21.0, 19.0, 14.0, 14.0, 11.0, 14.0, 11.0, 6.0, 13.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.359375, -17.791015625, -17.22265625, -16.654296875, -16.0859375, -15.517578125, -14.94921875, -14.380859375, -13.8125, -13.244140625, -12.67578125, -12.107421875, -11.5390625, -10.970703125, -10.40234375, -9.833984375, -9.265625, -8.697265625, -8.12890625, -7.560546875, -6.9921875, -6.423828125, -5.85546875, -5.287109375, -4.71875, -4.150390625, -3.58203125, -3.013671875, -2.4453125, -1.876953125, -1.30859375, -0.740234375, -0.171875, 0.396484375, 0.96484375, 1.533203125, 2.1015625, 2.669921875, 3.23828125, 3.806640625, 4.375, 4.943359375, 5.51171875, 6.080078125, 6.6484375, 7.216796875, 7.78515625, 8.353515625, 8.921875, 9.490234375, 10.05859375, 10.626953125, 11.1953125, 11.763671875, 12.33203125, 12.900390625, 13.46875, 14.037109375, 14.60546875, 15.173828125, 15.7421875, 16.310546875, 16.87890625, 17.447265625, 18.015625]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 4.0, 8.0, 11.0, 11.0, 14.0, 23.0, 25.0, 29.0, 42.0, 63.0, 105.0, 145.0, 209.0, 350.0, 1094.0, 12275.0, 3052496.0, 74839.0, 2575.0, 491.0, 271.0, 183.0, 121.0, 70.0, 51.0, 46.0, 40.0, 24.0, 25.0, 20.0, 15.0, 8.0, 7.0, 6.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-42.96875, -41.61376953125, -40.2587890625, -38.90380859375, -37.548828125, -36.19384765625, -34.8388671875, -33.48388671875, -32.12890625, -30.77392578125, -29.4189453125, -28.06396484375, -26.708984375, -25.35400390625, -23.9990234375, -22.64404296875, -21.2890625, -19.93408203125, -18.5791015625, -17.22412109375, -15.869140625, -14.51416015625, -13.1591796875, -11.80419921875, -10.44921875, -9.09423828125, -7.7392578125, -6.38427734375, -5.029296875, -3.67431640625, -2.3193359375, -0.96435546875, 0.390625, 1.74560546875, 3.1005859375, 4.45556640625, 5.810546875, 7.16552734375, 8.5205078125, 9.87548828125, 11.23046875, 12.58544921875, 13.9404296875, 15.29541015625, 16.650390625, 18.00537109375, 19.3603515625, 20.71533203125, 22.0703125, 23.42529296875, 24.7802734375, 26.13525390625, 27.490234375, 28.84521484375, 30.2001953125, 31.55517578125, 32.91015625, 34.26513671875, 35.6201171875, 36.97509765625, 38.330078125, 39.68505859375, 41.0400390625, 42.39501953125, 43.75]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 10.0, 99.0, 377.0, 396.0, 113.0, 14.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.2614517211914, -86.91714477539062, -84.57283782958984, -82.22853088378906, -79.88422393798828, -77.5399169921875, -75.19561004638672, -72.85130310058594, -70.50699615478516, -68.16268920898438, -65.8183822631836, -63.47407531738281, -61.12976837158203, -58.78546142578125, -56.44115447998047, -54.09684753417969, -51.75254440307617, -49.40823745727539, -47.06393051147461, -44.71962356567383, -42.37531661987305, -40.031009674072266, -37.68670654296875, -35.34239959716797, -32.99809265136719, -30.653785705566406, -28.309478759765625, -25.965171813964844, -23.620864868164062, -21.27655792236328, -18.932252883911133, -16.58794593811035, -14.243633270263672, -11.89932632446289, -9.55501937866211, -7.2107133865356445, -4.866406440734863, -2.522099494934082, -0.1777935028076172, 2.166513442993164, 4.510820388793945, 6.855127334594727, 9.199434280395508, 11.543740272521973, 13.888047218322754, 16.23235321044922, 18.57666015625, 20.92096710205078, 23.265274047851562, 25.609580993652344, 27.953887939453125, 30.298194885253906, 32.64250183105469, 34.98680877685547, 37.33111572265625, 39.67542266845703, 42.01972961425781, 44.364036560058594, 46.708343505859375, 49.052650451660156, 51.39695739746094, 53.74126434326172, 56.0855712890625, 58.42987823486328, 60.7741813659668]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 7.0, 10.0, 8.0, 13.0, 15.0, 13.0, 15.0, 19.0, 19.0, 21.0, 29.0, 44.0, 23.0, 35.0, 37.0, 51.0, 24.0, 36.0, 43.0, 55.0, 46.0, 43.0, 33.0, 36.0, 41.0, 36.0, 28.0, 34.0, 17.0, 30.0, 20.0, 14.0, 16.0, 19.0, 13.0, 12.0, 7.0, 7.0, 8.0, 4.0, 7.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-53.17256164550781, -51.45109558105469, -49.72963333129883, -48.00817108154297, -46.286705017089844, -44.56523895263672, -42.84377670288086, -41.122314453125, -39.400848388671875, -37.67938232421875, -35.95792007446289, -34.23645782470703, -32.514991760253906, -30.793527603149414, -29.072063446044922, -27.35059928894043, -25.629135131835938, -23.907670974731445, -22.186206817626953, -20.46474266052246, -18.74327850341797, -17.021814346313477, -15.300350189208984, -13.578886032104492, -11.857421875, -10.135957717895508, -8.414493560791016, -6.693029403686523, -4.971565246582031, -3.250101089477539, -1.5286369323730469, 0.1928272247314453, 1.9142951965332031, 3.6357593536376953, 5.3572235107421875, 7.07868766784668, 8.800151824951172, 10.521615982055664, 12.243080139160156, 13.964544296264648, 15.68600845336914, 17.407472610473633, 19.128936767578125, 20.850400924682617, 22.57186508178711, 24.2933292388916, 26.014793395996094, 27.736257553100586, 29.457721710205078, 31.17918586730957, 32.90065002441406, 34.62211608886719, 36.34357833862305, 38.065040588378906, 39.78650665283203, 41.507972717285156, 43.229434967041016, 44.950897216796875, 46.67236328125, 48.393829345703125, 50.115291595458984, 51.836753845214844, 53.55821990966797, 55.279685974121094, 57.00114822387695]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 5.0, 12.0, 11.0, 15.0, 11.0, 18.0, 14.0, 19.0, 26.0, 21.0, 22.0, 29.0, 31.0, 32.0, 31.0, 35.0, 49.0, 45.0, 41.0, 39.0, 47.0, 46.0, 39.0, 33.0, 30.0, 30.0, 31.0, 31.0, 35.0, 34.0, 24.0, 16.0, 18.0, 14.0, 12.0, 13.0, 13.0, 5.0, 4.0, 7.0, 6.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.79296875, -5.6151123046875, -5.437255859375, -5.2593994140625, -5.08154296875, -4.9036865234375, -4.725830078125, -4.5479736328125, -4.3701171875, -4.1922607421875, -4.014404296875, -3.8365478515625, -3.65869140625, -3.4808349609375, -3.302978515625, -3.1251220703125, -2.947265625, -2.7694091796875, -2.591552734375, -2.4136962890625, -2.23583984375, -2.0579833984375, -1.880126953125, -1.7022705078125, -1.5244140625, -1.3465576171875, -1.168701171875, -0.9908447265625, -0.81298828125, -0.6351318359375, -0.457275390625, -0.2794189453125, -0.1015625, 0.0762939453125, 0.254150390625, 0.4320068359375, 0.60986328125, 0.7877197265625, 0.965576171875, 1.1434326171875, 1.3212890625, 1.4991455078125, 1.677001953125, 1.8548583984375, 2.03271484375, 2.2105712890625, 2.388427734375, 2.5662841796875, 2.744140625, 2.9219970703125, 3.099853515625, 3.2777099609375, 3.45556640625, 3.6334228515625, 3.811279296875, 3.9891357421875, 4.1669921875, 4.3448486328125, 4.522705078125, 4.7005615234375, 4.87841796875, 5.0562744140625, 5.234130859375, 5.4119873046875, 5.58984375]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 7.0, 9.0, 13.0, 12.0, 32.0, 45.0, 60.0, 72.0, 110.0, 168.0, 314.0, 502.0, 1008.0, 2052.0, 4714.0, 11818.0, 33125.0, 111937.0, 423356.0, 1185686.0, 1461432.0, 682535.0, 192155.0, 53069.0, 17589.0, 6623.0, 2800.0, 1334.0, 703.0, 346.0, 222.0, 144.0, 88.0, 59.0, 45.0, 26.0, 23.0, 22.0, 9.0, 5.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-7.1953125, -6.98492431640625, -6.7745361328125, -6.56414794921875, -6.353759765625, -6.14337158203125, -5.9329833984375, -5.72259521484375, -5.51220703125, -5.30181884765625, -5.0914306640625, -4.88104248046875, -4.670654296875, -4.46026611328125, -4.2498779296875, -4.03948974609375, -3.8291015625, -3.61871337890625, -3.4083251953125, -3.19793701171875, -2.987548828125, -2.77716064453125, -2.5667724609375, -2.35638427734375, -2.14599609375, -1.93560791015625, -1.7252197265625, -1.51483154296875, -1.304443359375, -1.09405517578125, -0.8836669921875, -0.67327880859375, -0.462890625, -0.25250244140625, -0.0421142578125, 0.16827392578125, 0.378662109375, 0.58905029296875, 0.7994384765625, 1.00982666015625, 1.22021484375, 1.43060302734375, 1.6409912109375, 1.85137939453125, 2.061767578125, 2.27215576171875, 2.4825439453125, 2.69293212890625, 2.9033203125, 3.11370849609375, 3.3240966796875, 3.53448486328125, 3.744873046875, 3.95526123046875, 4.1656494140625, 4.37603759765625, 4.58642578125, 4.79681396484375, 5.0072021484375, 5.21759033203125, 5.427978515625, 5.63836669921875, 5.8487548828125, 6.05914306640625, 6.26953125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 8.0, 4.0, 14.0, 17.0, 21.0, 40.0, 50.0, 51.0, 63.0, 99.0, 140.0, 207.0, 231.0, 344.0, 407.0, 434.0, 397.0, 378.0, 282.0, 235.0, 178.0, 122.0, 98.0, 71.0, 57.0, 33.0, 22.0, 25.0, 16.0, 7.0, 7.0, 6.0, 9.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.234375, -14.768310546875, -14.30224609375, -13.836181640625, -13.3701171875, -12.904052734375, -12.43798828125, -11.971923828125, -11.505859375, -11.039794921875, -10.57373046875, -10.107666015625, -9.6416015625, -9.175537109375, -8.70947265625, -8.243408203125, -7.77734375, -7.311279296875, -6.84521484375, -6.379150390625, -5.9130859375, -5.447021484375, -4.98095703125, -4.514892578125, -4.048828125, -3.582763671875, -3.11669921875, -2.650634765625, -2.1845703125, -1.718505859375, -1.25244140625, -0.786376953125, -0.3203125, 0.145751953125, 0.61181640625, 1.077880859375, 1.5439453125, 2.010009765625, 2.47607421875, 2.942138671875, 3.408203125, 3.874267578125, 4.34033203125, 4.806396484375, 5.2724609375, 5.738525390625, 6.20458984375, 6.670654296875, 7.13671875, 7.602783203125, 8.06884765625, 8.534912109375, 9.0009765625, 9.467041015625, 9.93310546875, 10.399169921875, 10.865234375, 11.331298828125, 11.79736328125, 12.263427734375, 12.7294921875, 13.195556640625, 13.66162109375, 14.127685546875, 14.59375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 3.0, 4.0, 2.0, 1.0, 7.0, 6.0, 12.0, 9.0, 16.0, 20.0, 36.0, 39.0, 51.0, 62.0, 92.0, 113.0, 194.0, 322.0, 620.0, 4998.0, 2483996.0, 1698086.0, 4170.0, 562.0, 289.0, 168.0, 107.0, 73.0, 62.0, 46.0, 38.0, 25.0, 17.0, 13.0, 12.0, 9.0, 8.0, 5.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.125, -43.0712890625, -41.017578125, -38.9638671875, -36.91015625, -34.8564453125, -32.802734375, -30.7490234375, -28.6953125, -26.6416015625, -24.587890625, -22.5341796875, -20.48046875, -18.4267578125, -16.373046875, -14.3193359375, -12.265625, -10.2119140625, -8.158203125, -6.1044921875, -4.05078125, -1.9970703125, 0.056640625, 2.1103515625, 4.1640625, 6.2177734375, 8.271484375, 10.3251953125, 12.37890625, 14.4326171875, 16.486328125, 18.5400390625, 20.59375, 22.6474609375, 24.701171875, 26.7548828125, 28.80859375, 30.8623046875, 32.916015625, 34.9697265625, 37.0234375, 39.0771484375, 41.130859375, 43.1845703125, 45.23828125, 47.2919921875, 49.345703125, 51.3994140625, 53.453125, 55.5068359375, 57.560546875, 59.6142578125, 61.66796875, 63.7216796875, 65.775390625, 67.8291015625, 69.8828125, 71.9365234375, 73.990234375, 76.0439453125, 78.09765625, 80.1513671875, 82.205078125, 84.2587890625, 86.3125]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 10.0, 25.0, 68.0, 139.0, 225.0, 228.0, 157.0, 81.0, 47.0, 22.0, 5.0, 3.0, 1.0, 0.0, 1.0], "bins": [-191.09642028808594, -187.56163024902344, -184.02684020996094, -180.49205017089844, -176.95726013183594, -173.42247009277344, -169.88768005371094, -166.35289001464844, -162.81809997558594, -159.28330993652344, -155.74851989746094, -152.21372985839844, -148.67893981933594, -145.14414978027344, -141.60935974121094, -138.07456970214844, -134.53976440429688, -131.00497436523438, -127.47018432617188, -123.93539428710938, -120.40060424804688, -116.86581420898438, -113.33102416992188, -109.79623413085938, -106.26144409179688, -102.72665405273438, -99.19186401367188, -95.65707397460938, -92.12228393554688, -88.58749389648438, -85.05270385742188, -81.51791381835938, -77.98312377929688, -74.44833374023438, -70.91354370117188, -67.37875366210938, -63.843963623046875, -60.309173583984375, -56.77437973022461, -53.23958969116211, -49.70479965209961, -46.17000961303711, -42.63521957397461, -39.100425720214844, -35.565635681152344, -32.030845642089844, -28.496055603027344, -24.961265563964844, -21.426475524902344, -17.891685485839844, -14.356894493103027, -10.822103500366211, -7.287313461303711, -3.752523422241211, -0.21773147583007812, 3.317058563232422, 6.851848602294922, 10.386638641357422, 13.921429634094238, 17.456220626831055, 20.991010665893555, 24.525800704956055, 28.060592651367188, 31.595382690429688, 35.13017272949219]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 3.0, 8.0, 6.0, 6.0, 2.0, 8.0, 16.0, 12.0, 16.0, 16.0, 15.0, 22.0, 25.0, 19.0, 11.0, 24.0, 32.0, 21.0, 30.0, 35.0, 29.0, 32.0, 41.0, 50.0, 23.0, 29.0, 41.0, 35.0, 30.0, 35.0, 30.0, 33.0, 25.0, 29.0, 23.0, 43.0, 19.0, 20.0, 12.0, 10.0, 17.0, 21.0, 13.0, 7.0, 6.0, 3.0, 4.0, 4.0, 6.0, 1.0, 1.0, 4.0, 3.0, 1.0, 3.0], "bins": [-44.93877410888672, -43.59572219848633, -42.25267028808594, -40.90961456298828, -39.56656265258789, -38.2235107421875, -36.88045883178711, -35.53740692138672, -34.19435119628906, -32.85129928588867, -31.50824546813965, -30.165193557739258, -28.822139739990234, -27.479087829589844, -26.136035919189453, -24.79298210144043, -23.44993019104004, -22.10687828063965, -20.763824462890625, -19.420772552490234, -18.07771873474121, -16.73466682434082, -15.391613960266113, -14.048561096191406, -12.7055082321167, -11.362455368041992, -10.019402503967285, -8.676349639892578, -7.333297252655029, -5.990244388580322, -4.647192001342773, -3.3041391372680664, -1.9610862731933594, -0.6180335283279419, 0.7250192165374756, 2.0680718421936035, 3.4111247062683105, 4.754177570343018, 6.097229957580566, 7.440282821655273, 8.78333568572998, 10.126388549804688, 11.469441413879395, 12.812494277954102, 14.155546188354492, 15.498600006103516, 16.841651916503906, 18.184703826904297, 19.52775764465332, 20.87080955505371, 22.213863372802734, 23.556915283203125, 24.89996910095215, 26.24302101135254, 27.586074829101562, 28.929126739501953, 30.272178649902344, 31.615230560302734, 32.958282470703125, 34.30133819580078, 35.64439010620117, 36.98744201660156, 38.33049392700195, 39.673545837402344, 41.0166015625]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 9.0, 6.0, 9.0, 8.0, 11.0, 18.0, 18.0, 14.0, 24.0, 22.0, 19.0, 27.0, 24.0, 22.0, 31.0, 33.0, 34.0, 41.0, 47.0, 44.0, 55.0, 35.0, 28.0, 39.0, 47.0, 33.0, 25.0, 28.0, 36.0, 39.0, 28.0, 25.0, 19.0, 16.0, 18.0, 16.0, 9.0, 9.0, 2.0, 9.0, 7.0, 3.0, 6.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.765625, -5.5888671875, -5.412109375, -5.2353515625, -5.05859375, -4.8818359375, -4.705078125, -4.5283203125, -4.3515625, -4.1748046875, -3.998046875, -3.8212890625, -3.64453125, -3.4677734375, -3.291015625, -3.1142578125, -2.9375, -2.7607421875, -2.583984375, -2.4072265625, -2.23046875, -2.0537109375, -1.876953125, -1.7001953125, -1.5234375, -1.3466796875, -1.169921875, -0.9931640625, -0.81640625, -0.6396484375, -0.462890625, -0.2861328125, -0.109375, 0.0673828125, 0.244140625, 0.4208984375, 0.59765625, 0.7744140625, 0.951171875, 1.1279296875, 1.3046875, 1.4814453125, 1.658203125, 1.8349609375, 2.01171875, 2.1884765625, 2.365234375, 2.5419921875, 2.71875, 2.8955078125, 3.072265625, 3.2490234375, 3.42578125, 3.6025390625, 3.779296875, 3.9560546875, 4.1328125, 4.3095703125, 4.486328125, 4.6630859375, 4.83984375, 5.0166015625, 5.193359375, 5.3701171875, 5.546875]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 7.0, 1.0, 13.0, 9.0, 14.0, 27.0, 34.0, 67.0, 76.0, 125.0, 165.0, 248.0, 397.0, 566.0, 812.0, 1167.0, 1751.0, 2648.0, 3916.0, 5678.0, 8594.0, 13083.0, 19572.0, 29165.0, 43655.0, 66550.0, 102812.0, 164665.0, 198976.0, 133818.0, 84007.0, 55301.0, 36493.0, 24498.0, 16311.0, 11074.0, 7307.0, 4873.0, 3316.0, 2157.0, 1474.0, 990.0, 693.0, 491.0, 301.0, 211.0, 159.0, 102.0, 62.0, 40.0, 28.0, 29.0, 14.0, 13.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.57373046875, -0.555389404296875, -0.53704833984375, -0.518707275390625, -0.5003662109375, -0.482025146484375, -0.46368408203125, -0.445343017578125, -0.427001953125, -0.408660888671875, -0.39031982421875, -0.371978759765625, -0.3536376953125, -0.335296630859375, -0.31695556640625, -0.298614501953125, -0.2802734375, -0.261932373046875, -0.24359130859375, -0.225250244140625, -0.2069091796875, -0.188568115234375, -0.17022705078125, -0.151885986328125, -0.133544921875, -0.115203857421875, -0.09686279296875, -0.078521728515625, -0.0601806640625, -0.041839599609375, -0.02349853515625, -0.005157470703125, 0.01318359375, 0.031524658203125, 0.04986572265625, 0.068206787109375, 0.0865478515625, 0.104888916015625, 0.12322998046875, 0.141571044921875, 0.159912109375, 0.178253173828125, 0.19659423828125, 0.214935302734375, 0.2332763671875, 0.251617431640625, 0.26995849609375, 0.288299560546875, 0.306640625, 0.324981689453125, 0.34332275390625, 0.361663818359375, 0.3800048828125, 0.398345947265625, 0.41668701171875, 0.435028076171875, 0.453369140625, 0.471710205078125, 0.49005126953125, 0.508392333984375, 0.5267333984375, 0.545074462890625, 0.56341552734375, 0.581756591796875, 0.60009765625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 4.0, 4.0, 11.0, 3.0, 14.0, 8.0, 7.0, 13.0, 19.0, 21.0, 18.0, 25.0, 33.0, 29.0, 26.0, 36.0, 31.0, 41.0, 56.0, 30.0, 37.0, 1070.0, 35.0, 35.0, 47.0, 40.0, 39.0, 27.0, 44.0, 31.0, 26.0, 18.0, 31.0, 20.0, 24.0, 11.0, 16.0, 8.0, 4.0, 7.0, 11.0, 3.0, 7.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-3.916015625, -3.804107666015625, -3.69219970703125, -3.580291748046875, -3.4683837890625, -3.356475830078125, -3.24456787109375, -3.132659912109375, -3.020751953125, -2.908843994140625, -2.79693603515625, -2.685028076171875, -2.5731201171875, -2.461212158203125, -2.34930419921875, -2.237396240234375, -2.12548828125, -2.013580322265625, -1.90167236328125, -1.789764404296875, -1.6778564453125, -1.565948486328125, -1.45404052734375, -1.342132568359375, -1.230224609375, -1.118316650390625, -1.00640869140625, -0.894500732421875, -0.7825927734375, -0.670684814453125, -0.55877685546875, -0.446868896484375, -0.3349609375, -0.223052978515625, -0.11114501953125, 0.000762939453125, 0.1126708984375, 0.224578857421875, 0.33648681640625, 0.448394775390625, 0.560302734375, 0.672210693359375, 0.78411865234375, 0.896026611328125, 1.0079345703125, 1.119842529296875, 1.23175048828125, 1.343658447265625, 1.45556640625, 1.567474365234375, 1.67938232421875, 1.791290283203125, 1.9031982421875, 2.015106201171875, 2.12701416015625, 2.238922119140625, 2.350830078125, 2.462738037109375, 2.57464599609375, 2.686553955078125, 2.7984619140625, 2.910369873046875, 3.02227783203125, 3.134185791015625, 3.24609375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 8.0, 6.0, 12.0, 18.0, 28.0, 31.0, 65.0, 68.0, 114.0, 167.0, 256.0, 351.0, 484.0, 681.0, 1081.0, 1464.0, 2310.0, 3398.0, 5082.0, 7739.0, 11684.0, 18144.0, 28230.0, 43871.0, 69274.0, 108651.0, 170646.0, 1247247.0, 135884.0, 85635.0, 54498.0, 34764.0, 22432.0, 14348.0, 9477.0, 6228.0, 4113.0, 2685.0, 1897.0, 1299.0, 885.0, 599.0, 403.0, 260.0, 199.0, 135.0, 95.0, 76.0, 46.0, 26.0, 14.0, 11.0, 6.0, 7.0, 8.0, 1.0, 2.0, 3.0], "bins": [-0.56982421875, -0.5526809692382812, -0.5355377197265625, -0.5183944702148438, -0.501251220703125, -0.48410797119140625, -0.4669647216796875, -0.44982147216796875, -0.43267822265625, -0.41553497314453125, -0.3983917236328125, -0.38124847412109375, -0.364105224609375, -0.34696197509765625, -0.3298187255859375, -0.31267547607421875, -0.2955322265625, -0.27838897705078125, -0.2612457275390625, -0.24410247802734375, -0.226959228515625, -0.20981597900390625, -0.1926727294921875, -0.17552947998046875, -0.15838623046875, -0.14124298095703125, -0.1240997314453125, -0.10695648193359375, -0.089813232421875, -0.07266998291015625, -0.0555267333984375, -0.03838348388671875, -0.021240234375, -0.00409698486328125, 0.0130462646484375, 0.03018951416015625, 0.047332763671875, 0.06447601318359375, 0.0816192626953125, 0.09876251220703125, 0.11590576171875, 0.13304901123046875, 0.1501922607421875, 0.16733551025390625, 0.184478759765625, 0.20162200927734375, 0.2187652587890625, 0.23590850830078125, 0.2530517578125, 0.27019500732421875, 0.2873382568359375, 0.30448150634765625, 0.321624755859375, 0.33876800537109375, 0.3559112548828125, 0.37305450439453125, 0.39019775390625, 0.40734100341796875, 0.4244842529296875, 0.44162750244140625, 0.458770751953125, 0.47591400146484375, 0.4930572509765625, 0.5102005004882812, 0.52734375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 8.0, 4.0, 3.0, 2.0, 12.0, 13.0, 15.0, 14.0, 27.0, 22.0, 34.0, 29.0, 42.0, 48.0, 54.0, 53.0, 57.0, 76.0, 73.0, 58.0, 63.0, 58.0, 55.0, 28.0, 30.0, 22.0, 22.0, 18.0, 12.0, 12.0, 8.0, 10.0, 2.0, 5.0, 3.0, 0.0, 2.0, 5.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0], "bins": [-0.002445220947265625, -0.0023785382509231567, -0.0023118555545806885, -0.00224517285823822, -0.002178490161895752, -0.0021118074655532837, -0.0020451247692108154, -0.001978442072868347, -0.001911759376525879, -0.0018450766801834106, -0.0017783939838409424, -0.0017117112874984741, -0.0016450285911560059, -0.0015783458948135376, -0.0015116631984710693, -0.001444980502128601, -0.0013782978057861328, -0.0013116151094436646, -0.0012449324131011963, -0.001178249716758728, -0.0011115670204162598, -0.0010448843240737915, -0.0009782016277313232, -0.000911518931388855, -0.0008448362350463867, -0.0007781535387039185, -0.0007114708423614502, -0.0006447881460189819, -0.0005781054496765137, -0.0005114227533340454, -0.00044474005699157715, -0.0003780573606491089, -0.0003113746643066406, -0.00024469196796417236, -0.0001780092716217041, -0.00011132657527923584, -4.464387893676758e-05, 2.2038817405700684e-05, 8.872151374816895e-05, 0.0001554042100906372, 0.00022208690643310547, 0.00028876960277557373, 0.000355452299118042, 0.00042213499546051025, 0.0004888176918029785, 0.0005555003881454468, 0.000622183084487915, 0.0006888657808303833, 0.0007555484771728516, 0.0008222311735153198, 0.0008889138698577881, 0.0009555965662002563, 0.0010222792625427246, 0.0010889619588851929, 0.0011556446552276611, 0.0012223273515701294, 0.0012890100479125977, 0.001355692744255066, 0.0014223754405975342, 0.0014890581369400024, 0.0015557408332824707, 0.001622423529624939, 0.0016891062259674072, 0.0017557889223098755, 0.0018224716186523438]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 4.0, 2.0, 3.0, 1.0, 5.0, 4.0, 3.0, 5.0, 5.0, 9.0, 6.0, 13.0, 10.0, 20.0, 25.0, 38.0, 40.0, 77.0, 110.0, 211.0, 373.0, 1352.0, 998993.0, 45743.0, 783.0, 288.0, 133.0, 85.0, 56.0, 36.0, 28.0, 28.0, 16.0, 17.0, 10.0, 9.0, 6.0, 6.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04583740234375, -0.044060707092285156, -0.04228401184082031, -0.04050731658935547, -0.038730621337890625, -0.03695392608642578, -0.03517723083496094, -0.033400535583496094, -0.03162384033203125, -0.029847145080566406, -0.028070449829101562, -0.02629375457763672, -0.024517059326171875, -0.02274036407470703, -0.020963668823242188, -0.019186973571777344, -0.0174102783203125, -0.015633583068847656, -0.013856887817382812, -0.012080192565917969, -0.010303497314453125, -0.008526802062988281, -0.0067501068115234375, -0.004973411560058594, -0.00319671630859375, -0.0014200210571289062, 0.0003566741943359375, 0.0021333694458007812, 0.003910064697265625, 0.005686759948730469, 0.0074634552001953125, 0.009240150451660156, 0.011016845703125, 0.012793540954589844, 0.014570236206054688, 0.01634693145751953, 0.018123626708984375, 0.01990032196044922, 0.021677017211914062, 0.023453712463378906, 0.02523040771484375, 0.027007102966308594, 0.028783798217773438, 0.03056049346923828, 0.032337188720703125, 0.03411388397216797, 0.03589057922363281, 0.037667274475097656, 0.0394439697265625, 0.041220664978027344, 0.04299736022949219, 0.04477405548095703, 0.046550750732421875, 0.04832744598388672, 0.05010414123535156, 0.051880836486816406, 0.05365753173828125, 0.055434226989746094, 0.05721092224121094, 0.05898761749267578, 0.060764312744140625, 0.06254100799560547, 0.06431770324707031, 0.06609439849853516, 0.06787109375]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 52.0, 470.0, 457.0, 31.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.013056381605565548, -0.012818903662264347, -0.01258142665028572, -0.01234394870698452, -0.012106470763683319, -0.011868992820382118, -0.011631515808403492, -0.011394037865102291, -0.011156560853123665, -0.010919082909822464, -0.010681605897843838, -0.010444127954542637, -0.010206650011241436, -0.00996917299926281, -0.009731695055961609, -0.009494217112660408, -0.009256739169359207, -0.009019261226058006, -0.00878178421407938, -0.00854430627077818, -0.008306828327476978, -0.008069351315498352, -0.007831873372197151, -0.00759439542889595, -0.007356917951256037, -0.007119440473616123, -0.006881962530314922, -0.006644485052675009, -0.006407007575035095, -0.006169529631733894, -0.005932052154093981, -0.005694574676454067, -0.005457096733152866, -0.005219619255512953, -0.004982141312211752, -0.004744663834571838, -0.0045071858912706375, -0.004269708413630724, -0.00403223093599081, -0.003794753225520253, -0.003557275515049696, -0.0033197978045791388, -0.0030823200941085815, -0.002844842616468668, -0.0026073649059981108, -0.0023698871955275536, -0.00213240971788764, -0.0018949320074170828, -0.0016574542969465256, -0.0014199765864759684, -0.001182498992420733, -0.0009450213401578367, -0.0007075436878949404, -0.00047006597742438316, -0.00023258838336914778, 4.889210686087608e-06, 0.00024236692115664482, 0.0004798445734195411, 0.0007173222256824374, 0.0009547998779453337, 0.00119227753020823, 0.0014297552406787872, 0.0016672328347340226, 0.001904710428789258, 0.002142188139259815]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 1.0, 9.0, 11.0, 7.0, 15.0, 12.0, 14.0, 11.0, 17.0, 17.0, 26.0, 34.0, 26.0, 33.0, 28.0, 37.0, 32.0, 39.0, 42.0, 29.0, 40.0, 45.0, 41.0, 53.0, 40.0, 39.0, 53.0, 35.0, 33.0, 29.0, 26.0, 15.0, 21.0, 18.0, 15.0, 14.0, 13.0, 8.0, 4.0, 6.0, 7.0, 2.0, 5.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0012217164039611816, -0.0011874651536345482, -0.0011532139033079147, -0.0011189626529812813, -0.0010847114026546478, -0.0010504601523280144, -0.001016208902001381, -0.0009819576516747475, -0.000947706401348114, -0.0009134551510214806, -0.0008792039006948471, -0.0008449526503682137, -0.0008107014000415802, -0.0007764501497149467, -0.0007421988993883133, -0.0007079476490616798, -0.0006736963987350464, -0.0006394451484084129, -0.0006051938980817795, -0.000570942647755146, -0.0005366913974285126, -0.0005024401471018791, -0.00046818889677524567, -0.0004339376464486122, -0.00039968639612197876, -0.0003654351457953453, -0.00033118389546871185, -0.0002969326451420784, -0.00026268139481544495, -0.0002284301444888115, -0.00019417889416217804, -0.00015992764383554459, -0.00012567639350891113, -9.142514318227768e-05, -5.7173892855644226e-05, -2.2922642529010773e-05, 1.132860779762268e-05, 4.5579858124256134e-05, 7.983110845088959e-05, 0.00011408235877752304, 0.0001483336091041565, 0.00018258485943078995, 0.0002168361097574234, 0.00025108736008405685, 0.0002853386104106903, 0.00031958986073732376, 0.0003538411110639572, 0.00038809236139059067, 0.0004223436117172241, 0.0004565948620438576, 0.000490846112370491, 0.0005250973626971245, 0.0005593486130237579, 0.0005935998633503914, 0.0006278511136770248, 0.0006621023640036583, 0.0006963536143302917, 0.0007306048646569252, 0.0007648561149835587, 0.0007991073653101921, 0.0008333586156368256, 0.000867609865963459, 0.0009018611162900925, 0.0009361123666167259, 0.0009703636169433594]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 9.0, 6.0, 9.0, 8.0, 11.0, 18.0, 18.0, 14.0, 24.0, 22.0, 19.0, 27.0, 24.0, 22.0, 31.0, 33.0, 34.0, 41.0, 47.0, 44.0, 55.0, 35.0, 28.0, 39.0, 47.0, 33.0, 25.0, 28.0, 36.0, 39.0, 28.0, 25.0, 19.0, 16.0, 18.0, 16.0, 9.0, 9.0, 2.0, 9.0, 7.0, 3.0, 6.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.765625, -5.5888671875, -5.412109375, -5.2353515625, -5.05859375, -4.8818359375, -4.705078125, -4.5283203125, -4.3515625, -4.1748046875, -3.998046875, -3.8212890625, -3.64453125, -3.4677734375, -3.291015625, -3.1142578125, -2.9375, -2.7607421875, -2.583984375, -2.4072265625, -2.23046875, -2.0537109375, -1.876953125, -1.7001953125, -1.5234375, -1.3466796875, -1.169921875, -0.9931640625, -0.81640625, -0.6396484375, -0.462890625, -0.2861328125, -0.109375, 0.0673828125, 0.244140625, 0.4208984375, 0.59765625, 0.7744140625, 0.951171875, 1.1279296875, 1.3046875, 1.4814453125, 1.658203125, 1.8349609375, 2.01171875, 2.1884765625, 2.365234375, 2.5419921875, 2.71875, 2.8955078125, 3.072265625, 3.2490234375, 3.42578125, 3.6025390625, 3.779296875, 3.9560546875, 4.1328125, 4.3095703125, 4.486328125, 4.6630859375, 4.83984375, 5.0166015625, 5.193359375, 5.3701171875, 5.546875]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 3.0, 4.0, 11.0, 10.0, 9.0, 18.0, 20.0, 22.0, 38.0, 57.0, 70.0, 113.0, 159.0, 246.0, 305.0, 538.0, 972.0, 1750.0, 3811.0, 8698.0, 22259.0, 66102.0, 228276.0, 460623.0, 171502.0, 50918.0, 17777.0, 7114.0, 3264.0, 1496.0, 825.0, 530.0, 304.0, 211.0, 135.0, 102.0, 74.0, 47.0, 45.0, 25.0, 18.0, 14.0, 14.0, 14.0, 9.0, 2.0, 0.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.76953125, -4.60723876953125, -4.4449462890625, -4.28265380859375, -4.120361328125, -3.95806884765625, -3.7957763671875, -3.63348388671875, -3.47119140625, -3.30889892578125, -3.1466064453125, -2.98431396484375, -2.822021484375, -2.65972900390625, -2.4974365234375, -2.33514404296875, -2.1728515625, -2.01055908203125, -1.8482666015625, -1.68597412109375, -1.523681640625, -1.36138916015625, -1.1990966796875, -1.03680419921875, -0.87451171875, -0.71221923828125, -0.5499267578125, -0.38763427734375, -0.225341796875, -0.06304931640625, 0.0992431640625, 0.26153564453125, 0.423828125, 0.58612060546875, 0.7484130859375, 0.91070556640625, 1.072998046875, 1.23529052734375, 1.3975830078125, 1.55987548828125, 1.72216796875, 1.88446044921875, 2.0467529296875, 2.20904541015625, 2.371337890625, 2.53363037109375, 2.6959228515625, 2.85821533203125, 3.0205078125, 3.18280029296875, 3.3450927734375, 3.50738525390625, 3.669677734375, 3.83197021484375, 3.9942626953125, 4.15655517578125, 4.31884765625, 4.48114013671875, 4.6434326171875, 4.80572509765625, 4.968017578125, 5.13031005859375, 5.2926025390625, 5.45489501953125, 5.6171875]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 3.0, 5.0, 11.0, 5.0, 8.0, 7.0, 14.0, 24.0, 17.0, 22.0, 29.0, 24.0, 33.0, 37.0, 42.0, 45.0, 43.0, 50.0, 90.0, 174.0, 1649.0, 229.0, 83.0, 50.0, 47.0, 37.0, 42.0, 28.0, 32.0, 30.0, 23.0, 22.0, 25.0, 10.0, 10.0, 12.0, 10.0, 7.0, 4.0, 3.0, 3.0, 1.0, 5.0, 3.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.171875, -20.521484375, -19.87109375, -19.220703125, -18.5703125, -17.919921875, -17.26953125, -16.619140625, -15.96875, -15.318359375, -14.66796875, -14.017578125, -13.3671875, -12.716796875, -12.06640625, -11.416015625, -10.765625, -10.115234375, -9.46484375, -8.814453125, -8.1640625, -7.513671875, -6.86328125, -6.212890625, -5.5625, -4.912109375, -4.26171875, -3.611328125, -2.9609375, -2.310546875, -1.66015625, -1.009765625, -0.359375, 0.291015625, 0.94140625, 1.591796875, 2.2421875, 2.892578125, 3.54296875, 4.193359375, 4.84375, 5.494140625, 6.14453125, 6.794921875, 7.4453125, 8.095703125, 8.74609375, 9.396484375, 10.046875, 10.697265625, 11.34765625, 11.998046875, 12.6484375, 13.298828125, 13.94921875, 14.599609375, 15.25, 15.900390625, 16.55078125, 17.201171875, 17.8515625, 18.501953125, 19.15234375, 19.802734375, 20.453125]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 5.0, 2.0, 3.0, 4.0, 6.0, 7.0, 11.0, 13.0, 10.0, 18.0, 17.0, 31.0, 47.0, 64.0, 67.0, 70.0, 134.0, 167.0, 270.0, 437.0, 1407.0, 23209.0, 3087066.0, 29599.0, 1538.0, 485.0, 271.0, 183.0, 149.0, 97.0, 72.0, 39.0, 36.0, 34.0, 27.0, 22.0, 20.0, 14.0, 6.0, 13.0, 13.0, 11.0, 3.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-41.4375, -40.123046875, -38.80859375, -37.494140625, -36.1796875, -34.865234375, -33.55078125, -32.236328125, -30.921875, -29.607421875, -28.29296875, -26.978515625, -25.6640625, -24.349609375, -23.03515625, -21.720703125, -20.40625, -19.091796875, -17.77734375, -16.462890625, -15.1484375, -13.833984375, -12.51953125, -11.205078125, -9.890625, -8.576171875, -7.26171875, -5.947265625, -4.6328125, -3.318359375, -2.00390625, -0.689453125, 0.625, 1.939453125, 3.25390625, 4.568359375, 5.8828125, 7.197265625, 8.51171875, 9.826171875, 11.140625, 12.455078125, 13.76953125, 15.083984375, 16.3984375, 17.712890625, 19.02734375, 20.341796875, 21.65625, 22.970703125, 24.28515625, 25.599609375, 26.9140625, 28.228515625, 29.54296875, 30.857421875, 32.171875, 33.486328125, 34.80078125, 36.115234375, 37.4296875, 38.744140625, 40.05859375, 41.373046875, 42.6875]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 55.0, 563.0, 376.0, 20.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-207.1810760498047, -203.26205444335938, -199.34303283691406, -195.42401123046875, -191.50498962402344, -187.58596801757812, -183.6669464111328, -179.7479248046875, -175.8289031982422, -171.90988159179688, -167.99085998535156, -164.07183837890625, -160.15281677246094, -156.23379516601562, -152.3147735595703, -148.395751953125, -144.4767303466797, -140.55770874023438, -136.63868713378906, -132.71966552734375, -128.80064392089844, -124.88162231445312, -120.96260070800781, -117.0435791015625, -113.12455749511719, -109.20553588867188, -105.28651428222656, -101.36749267578125, -97.44847106933594, -93.52944946289062, -89.61042785644531, -85.69140625, -81.77239227294922, -77.8533706665039, -73.9343490600586, -70.01532745361328, -66.09630584716797, -62.177284240722656, -58.258262634277344, -54.33924102783203, -50.42021942138672, -46.501197814941406, -42.582176208496094, -38.66315460205078, -34.74413299560547, -30.825111389160156, -26.906089782714844, -22.98706817626953, -19.06804656982422, -15.149024963378906, -11.230003356933594, -7.310981750488281, -3.3919601440429688, 0.5270614624023438, 4.446083068847656, 8.365104675292969, 12.284126281738281, 16.203147888183594, 20.122169494628906, 24.04119110107422, 27.96021270751953, 31.879234313964844, 35.798255920410156, 39.71727752685547, 43.63629913330078]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 12.0, 7.0, 11.0, 9.0, 13.0, 13.0, 21.0, 25.0, 28.0, 25.0, 30.0, 25.0, 38.0, 32.0, 42.0, 40.0, 37.0, 34.0, 46.0, 45.0, 34.0, 36.0, 35.0, 48.0, 32.0, 32.0, 30.0, 27.0, 30.0, 24.0, 19.0, 21.0, 17.0, 16.0, 5.0, 14.0, 4.0, 9.0, 8.0, 5.0, 6.0, 7.0, 3.0, 1.0, 4.0, 2.0], "bins": [-59.74174880981445, -58.1429557800293, -56.544166564941406, -54.94537353515625, -53.34658432006836, -51.7477912902832, -50.14900207519531, -48.550209045410156, -46.951419830322266, -45.35262680053711, -43.75383758544922, -42.15504455566406, -40.55625534057617, -38.957462310791016, -37.358673095703125, -35.75988006591797, -34.16108703613281, -32.562294006347656, -30.963504791259766, -29.364713668823242, -27.76592254638672, -26.167131423950195, -24.568340301513672, -22.969547271728516, -21.370758056640625, -19.7719669342041, -18.173175811767578, -16.574384689331055, -14.975593566894531, -13.376802444458008, -11.778010368347168, -10.179219245910645, -8.580429077148438, -6.981637954711914, -5.382846832275391, -3.784055233001709, -2.1852641105651855, -0.5864729881286621, 1.0123186111450195, 2.611109733581543, 4.209900856018066, 5.80869197845459, 7.407483100891113, 9.006275177001953, 10.605066299438477, 12.203857421875, 13.802648544311523, 15.401439666748047, 17.00023078918457, 18.599021911621094, 20.197813034057617, 21.79660415649414, 23.395395278930664, 24.994186401367188, 26.592979431152344, 28.191768646240234, 29.79056167602539, 31.389352798461914, 32.98814392089844, 34.586936950683594, 36.185726165771484, 37.78451919555664, 39.38330841064453, 40.98210144042969, 42.58089065551758]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 8.0, 7.0, 4.0, 8.0, 9.0, 14.0, 19.0, 16.0, 12.0, 17.0, 25.0, 19.0, 29.0, 18.0, 25.0, 25.0, 34.0, 35.0, 43.0, 44.0, 46.0, 44.0, 42.0, 32.0, 34.0, 32.0, 40.0, 31.0, 30.0, 34.0, 36.0, 32.0, 28.0, 21.0, 15.0, 18.0, 16.0, 13.0, 9.0, 9.0, 9.0, 3.0, 3.0, 5.0, 7.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.921875, -5.74285888671875, -5.5638427734375, -5.38482666015625, -5.205810546875, -5.02679443359375, -4.8477783203125, -4.66876220703125, -4.48974609375, -4.31072998046875, -4.1317138671875, -3.95269775390625, -3.773681640625, -3.59466552734375, -3.4156494140625, -3.23663330078125, -3.0576171875, -2.87860107421875, -2.6995849609375, -2.52056884765625, -2.341552734375, -2.16253662109375, -1.9835205078125, -1.80450439453125, -1.62548828125, -1.44647216796875, -1.2674560546875, -1.08843994140625, -0.909423828125, -0.73040771484375, -0.5513916015625, -0.37237548828125, -0.193359375, -0.01434326171875, 0.1646728515625, 0.34368896484375, 0.522705078125, 0.70172119140625, 0.8807373046875, 1.05975341796875, 1.23876953125, 1.41778564453125, 1.5968017578125, 1.77581787109375, 1.954833984375, 2.13385009765625, 2.3128662109375, 2.49188232421875, 2.6708984375, 2.84991455078125, 3.0289306640625, 3.20794677734375, 3.386962890625, 3.56597900390625, 3.7449951171875, 3.92401123046875, 4.10302734375, 4.28204345703125, 4.4610595703125, 4.64007568359375, 4.819091796875, 4.99810791015625, 5.1771240234375, 5.35614013671875, 5.53515625]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 4.0, 12.0, 9.0, 10.0, 11.0, 13.0, 14.0, 14.0, 24.0, 18.0, 20.0, 20.0, 31.0, 44.0, 38.0, 57.0, 81.0, 192.0, 408.0, 2166.0, 41539.0, 3203336.0, 933488.0, 10927.0, 1003.0, 275.0, 110.0, 75.0, 56.0, 48.0, 41.0, 25.0, 25.0, 35.0, 16.0, 24.0, 8.0, 14.0, 9.0, 10.0, 8.0, 7.0, 4.0, 3.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0], "bins": [-32.25, -31.296142578125, -30.34228515625, -29.388427734375, -28.4345703125, -27.480712890625, -26.52685546875, -25.572998046875, -24.619140625, -23.665283203125, -22.71142578125, -21.757568359375, -20.8037109375, -19.849853515625, -18.89599609375, -17.942138671875, -16.98828125, -16.034423828125, -15.08056640625, -14.126708984375, -13.1728515625, -12.218994140625, -11.26513671875, -10.311279296875, -9.357421875, -8.403564453125, -7.44970703125, -6.495849609375, -5.5419921875, -4.588134765625, -3.63427734375, -2.680419921875, -1.7265625, -0.772705078125, 0.18115234375, 1.135009765625, 2.0888671875, 3.042724609375, 3.99658203125, 4.950439453125, 5.904296875, 6.858154296875, 7.81201171875, 8.765869140625, 9.7197265625, 10.673583984375, 11.62744140625, 12.581298828125, 13.53515625, 14.489013671875, 15.44287109375, 16.396728515625, 17.3505859375, 18.304443359375, 19.25830078125, 20.212158203125, 21.166015625, 22.119873046875, 23.07373046875, 24.027587890625, 24.9814453125, 25.935302734375, 26.88916015625, 27.843017578125, 28.796875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 6.0, 11.0, 10.0, 10.0, 23.0, 35.0, 40.0, 54.0, 66.0, 93.0, 116.0, 168.0, 215.0, 332.0, 397.0, 450.0, 464.0, 418.0, 332.0, 234.0, 168.0, 113.0, 85.0, 56.0, 50.0, 36.0, 26.0, 15.0, 14.0, 9.0, 8.0, 7.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.984375, -14.515625, -14.046875, -13.578125, -13.109375, -12.640625, -12.171875, -11.703125, -11.234375, -10.765625, -10.296875, -9.828125, -9.359375, -8.890625, -8.421875, -7.953125, -7.484375, -7.015625, -6.546875, -6.078125, -5.609375, -5.140625, -4.671875, -4.203125, -3.734375, -3.265625, -2.796875, -2.328125, -1.859375, -1.390625, -0.921875, -0.453125, 0.015625, 0.484375, 0.953125, 1.421875, 1.890625, 2.359375, 2.828125, 3.296875, 3.765625, 4.234375, 4.703125, 5.171875, 5.640625, 6.109375, 6.578125, 7.046875, 7.515625, 7.984375, 8.453125, 8.921875, 9.390625, 9.859375, 10.328125, 10.796875, 11.265625, 11.734375, 12.203125, 12.671875, 13.140625, 13.609375, 14.078125, 14.546875, 15.015625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 7.0, 6.0, 8.0, 10.0, 11.0, 14.0, 17.0, 20.0, 18.0, 20.0, 31.0, 47.0, 60.0, 68.0, 101.0, 127.0, 168.0, 243.0, 353.0, 766.0, 3252.0, 120652.0, 3974194.0, 89153.0, 2837.0, 738.0, 355.0, 254.0, 165.0, 135.0, 89.0, 68.0, 72.0, 58.0, 35.0, 27.0, 32.0, 22.0, 12.0, 3.0, 9.0, 6.0, 4.0, 5.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-47.53125, -45.91845703125, -44.3056640625, -42.69287109375, -41.080078125, -39.46728515625, -37.8544921875, -36.24169921875, -34.62890625, -33.01611328125, -31.4033203125, -29.79052734375, -28.177734375, -26.56494140625, -24.9521484375, -23.33935546875, -21.7265625, -20.11376953125, -18.5009765625, -16.88818359375, -15.275390625, -13.66259765625, -12.0498046875, -10.43701171875, -8.82421875, -7.21142578125, -5.5986328125, -3.98583984375, -2.373046875, -0.76025390625, 0.8525390625, 2.46533203125, 4.078125, 5.69091796875, 7.3037109375, 8.91650390625, 10.529296875, 12.14208984375, 13.7548828125, 15.36767578125, 16.98046875, 18.59326171875, 20.2060546875, 21.81884765625, 23.431640625, 25.04443359375, 26.6572265625, 28.27001953125, 29.8828125, 31.49560546875, 33.1083984375, 34.72119140625, 36.333984375, 37.94677734375, 39.5595703125, 41.17236328125, 42.78515625, 44.39794921875, 46.0107421875, 47.62353515625, 49.236328125, 50.84912109375, 52.4619140625, 54.07470703125, 55.6875]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 18.0, 27.0, 56.0, 97.0, 176.0, 167.0, 172.0, 115.0, 93.0, 42.0, 27.0, 6.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.478450775146484, -47.65727615356445, -44.83610153198242, -42.014930725097656, -39.193756103515625, -36.372581481933594, -33.55140686035156, -30.73023223876953, -27.9090576171875, -25.08788299560547, -22.266708374023438, -19.44553565979004, -16.624361038208008, -13.803186416625977, -10.982013702392578, -8.160839080810547, -5.339664459228516, -2.5184903144836426, 0.30268383026123047, 3.1238574981689453, 5.945032119750977, 8.766206741333008, 11.587379455566406, 14.408554077148438, 17.22972869873047, 20.0509033203125, 22.87207794189453, 25.69325065612793, 28.51442527770996, 31.335599899291992, 34.15677261352539, 36.97794723510742, 39.79911804199219, 42.62029266357422, 45.44146728515625, 48.26264190673828, 51.08381652832031, 53.904991149902344, 56.72616195678711, 59.54733657836914, 62.36851119995117, 65.18968200683594, 68.01085662841797, 70.83203125, 73.65320587158203, 76.47438049316406, 79.2955551147461, 82.11672973632812, 84.93790435791016, 87.75907897949219, 90.58025360107422, 93.40142822265625, 96.22260284423828, 99.04377746582031, 101.86494445800781, 104.68612670898438, 107.50729370117188, 110.3284683227539, 113.14964294433594, 115.97081756591797, 118.7919921875, 121.61316680908203, 124.43434143066406, 127.25550842285156, 130.07669067382812]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 9.0, 9.0, 16.0, 10.0, 12.0, 23.0, 17.0, 23.0, 22.0, 28.0, 26.0, 29.0, 32.0, 30.0, 33.0, 33.0, 30.0, 39.0, 41.0, 43.0, 30.0, 34.0, 45.0, 35.0, 34.0, 28.0, 40.0, 31.0, 31.0, 21.0, 19.0, 16.0, 17.0, 18.0, 15.0, 10.0, 9.0, 11.0, 8.0, 8.0, 5.0, 3.0, 6.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0], "bins": [-44.51927185058594, -43.101348876953125, -41.68342208862305, -40.265499114990234, -38.847572326660156, -37.429649353027344, -36.01172637939453, -34.59379959106445, -33.175872802734375, -31.75794792175293, -30.340023040771484, -28.922100067138672, -27.504173278808594, -26.08625030517578, -24.668325424194336, -23.25040054321289, -21.832477569580078, -20.414552688598633, -18.996627807617188, -17.578704833984375, -16.160778045654297, -14.742854118347168, -13.324930191040039, -11.907005310058594, -10.489080429077148, -9.071155548095703, -7.653231143951416, -6.235306739807129, -4.817381858825684, -3.3994569778442383, -1.9815330505371094, -0.5636081695556641, 0.8543167114257812, 2.2722413539886475, 3.6901659965515137, 5.108090400695801, 6.526015281677246, 7.943940162658691, 9.36186408996582, 10.779788970947266, 12.197713851928711, 13.615638732910156, 15.033563613891602, 16.451488494873047, 17.86941146850586, 19.287338256835938, 20.70526123046875, 22.123186111450195, 23.54111099243164, 24.959035873413086, 26.37696075439453, 27.794883728027344, 29.212810516357422, 30.630733489990234, 32.04866027832031, 33.466583251953125, 34.88450622558594, 36.30242919921875, 37.72035598754883, 39.13827896118164, 40.55620574951172, 41.97412872314453, 43.392051696777344, 44.80997848510742, 46.2279052734375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 8.0, 3.0, 6.0, 7.0, 11.0, 13.0, 6.0, 14.0, 16.0, 15.0, 15.0, 25.0, 28.0, 29.0, 30.0, 22.0, 30.0, 34.0, 27.0, 42.0, 39.0, 33.0, 36.0, 50.0, 37.0, 31.0, 42.0, 33.0, 36.0, 31.0, 35.0, 25.0, 25.0, 26.0, 20.0, 26.0, 18.0, 12.0, 14.0, 16.0, 7.0, 7.0, 4.0, 6.0, 5.0, 3.0, 1.0, 2.0, 5.0, 1.0, 1.0, 0.0, 2.0], "bins": [-6.0703125, -5.89111328125, -5.7119140625, -5.53271484375, -5.353515625, -5.17431640625, -4.9951171875, -4.81591796875, -4.63671875, -4.45751953125, -4.2783203125, -4.09912109375, -3.919921875, -3.74072265625, -3.5615234375, -3.38232421875, -3.203125, -3.02392578125, -2.8447265625, -2.66552734375, -2.486328125, -2.30712890625, -2.1279296875, -1.94873046875, -1.76953125, -1.59033203125, -1.4111328125, -1.23193359375, -1.052734375, -0.87353515625, -0.6943359375, -0.51513671875, -0.3359375, -0.15673828125, 0.0224609375, 0.20166015625, 0.380859375, 0.56005859375, 0.7392578125, 0.91845703125, 1.09765625, 1.27685546875, 1.4560546875, 1.63525390625, 1.814453125, 1.99365234375, 2.1728515625, 2.35205078125, 2.53125, 2.71044921875, 2.8896484375, 3.06884765625, 3.248046875, 3.42724609375, 3.6064453125, 3.78564453125, 3.96484375, 4.14404296875, 4.3232421875, 4.50244140625, 4.681640625, 4.86083984375, 5.0400390625, 5.21923828125, 5.3984375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 9.0, 9.0, 11.0, 21.0, 26.0, 27.0, 54.0, 76.0, 119.0, 154.0, 239.0, 298.0, 458.0, 645.0, 873.0, 1305.0, 1881.0, 2875.0, 4163.0, 6042.0, 9055.0, 13088.0, 19936.0, 29820.0, 45269.0, 69005.0, 106051.0, 162897.0, 189330.0, 131996.0, 85786.0, 55736.0, 36568.0, 24262.0, 16343.0, 10895.0, 7251.0, 4941.0, 3458.0, 2297.0, 1600.0, 1103.0, 812.0, 523.0, 371.0, 256.0, 189.0, 130.0, 105.0, 61.0, 38.0, 36.0, 19.0, 21.0, 11.0, 14.0, 5.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.58984375, -0.5709686279296875, -0.552093505859375, -0.5332183837890625, -0.51434326171875, -0.4954681396484375, -0.476593017578125, -0.4577178955078125, -0.4388427734375, -0.4199676513671875, -0.401092529296875, -0.3822174072265625, -0.36334228515625, -0.3444671630859375, -0.325592041015625, -0.3067169189453125, -0.287841796875, -0.2689666748046875, -0.250091552734375, -0.2312164306640625, -0.21234130859375, -0.1934661865234375, -0.174591064453125, -0.1557159423828125, -0.1368408203125, -0.1179656982421875, -0.099090576171875, -0.0802154541015625, -0.06134033203125, -0.0424652099609375, -0.023590087890625, -0.0047149658203125, 0.01416015625, 0.0330352783203125, 0.051910400390625, 0.0707855224609375, 0.08966064453125, 0.1085357666015625, 0.127410888671875, 0.1462860107421875, 0.1651611328125, 0.1840362548828125, 0.202911376953125, 0.2217864990234375, 0.24066162109375, 0.2595367431640625, 0.278411865234375, 0.2972869873046875, 0.316162109375, 0.3350372314453125, 0.353912353515625, 0.3727874755859375, 0.39166259765625, 0.4105377197265625, 0.429412841796875, 0.4482879638671875, 0.4671630859375, 0.4860382080078125, 0.504913330078125, 0.5237884521484375, 0.54266357421875, 0.5615386962890625, 0.580413818359375, 0.5992889404296875, 0.6181640625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 7.0, 9.0, 8.0, 10.0, 9.0, 11.0, 18.0, 14.0, 19.0, 32.0, 24.0, 30.0, 31.0, 34.0, 29.0, 42.0, 31.0, 48.0, 43.0, 37.0, 1062.0, 30.0, 37.0, 45.0, 34.0, 37.0, 26.0, 39.0, 23.0, 27.0, 27.0, 25.0, 21.0, 19.0, 16.0, 12.0, 16.0, 11.0, 7.0, 7.0, 8.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-4.22265625, -4.097320556640625, -3.97198486328125, -3.846649169921875, -3.7213134765625, -3.595977783203125, -3.47064208984375, -3.345306396484375, -3.219970703125, -3.094635009765625, -2.96929931640625, -2.843963623046875, -2.7186279296875, -2.593292236328125, -2.46795654296875, -2.342620849609375, -2.21728515625, -2.091949462890625, -1.96661376953125, -1.841278076171875, -1.7159423828125, -1.590606689453125, -1.46527099609375, -1.339935302734375, -1.214599609375, -1.089263916015625, -0.96392822265625, -0.838592529296875, -0.7132568359375, -0.587921142578125, -0.46258544921875, -0.337249755859375, -0.2119140625, -0.086578369140625, 0.03875732421875, 0.164093017578125, 0.2894287109375, 0.414764404296875, 0.54010009765625, 0.665435791015625, 0.790771484375, 0.916107177734375, 1.04144287109375, 1.166778564453125, 1.2921142578125, 1.417449951171875, 1.54278564453125, 1.668121337890625, 1.79345703125, 1.918792724609375, 2.04412841796875, 2.169464111328125, 2.2947998046875, 2.420135498046875, 2.54547119140625, 2.670806884765625, 2.796142578125, 2.921478271484375, 3.04681396484375, 3.172149658203125, 3.2974853515625, 3.422821044921875, 3.54815673828125, 3.673492431640625, 3.798828125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 10.0, 7.0, 11.0, 14.0, 22.0, 25.0, 41.0, 62.0, 87.0, 133.0, 194.0, 270.0, 405.0, 600.0, 910.0, 1267.0, 2044.0, 2977.0, 4595.0, 6991.0, 10577.0, 16380.0, 25688.0, 40766.0, 64371.0, 102459.0, 166775.0, 1257319.0, 145767.0, 89729.0, 55991.0, 35673.0, 22854.0, 14459.0, 9350.0, 6096.0, 4042.0, 2665.0, 1787.0, 1243.0, 776.0, 531.0, 390.0, 273.0, 166.0, 95.0, 85.0, 46.0, 57.0, 17.0, 15.0, 12.0, 10.0, 7.0, 4.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.64013671875, -0.6203536987304688, -0.6005706787109375, -0.5807876586914062, -0.561004638671875, -0.5412216186523438, -0.5214385986328125, -0.5016555786132812, -0.48187255859375, -0.46208953857421875, -0.4423065185546875, -0.42252349853515625, -0.402740478515625, -0.38295745849609375, -0.3631744384765625, -0.34339141845703125, -0.3236083984375, -0.30382537841796875, -0.2840423583984375, -0.26425933837890625, -0.244476318359375, -0.22469329833984375, -0.2049102783203125, -0.18512725830078125, -0.16534423828125, -0.14556121826171875, -0.1257781982421875, -0.10599517822265625, -0.086212158203125, -0.06642913818359375, -0.0466461181640625, -0.02686309814453125, -0.007080078125, 0.01270294189453125, 0.0324859619140625, 0.05226898193359375, 0.072052001953125, 0.09183502197265625, 0.1116180419921875, 0.13140106201171875, 0.15118408203125, 0.17096710205078125, 0.1907501220703125, 0.21053314208984375, 0.230316162109375, 0.25009918212890625, 0.2698822021484375, 0.28966522216796875, 0.3094482421875, 0.32923126220703125, 0.3490142822265625, 0.36879730224609375, 0.388580322265625, 0.40836334228515625, 0.4281463623046875, 0.44792938232421875, 0.46771240234375, 0.48749542236328125, 0.5072784423828125, 0.5270614624023438, 0.546844482421875, 0.5666275024414062, 0.5864105224609375, 0.6061935424804688, 0.6259765625]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 2.0, 0.0, 5.0, 2.0, 6.0, 3.0, 6.0, 14.0, 14.0, 15.0, 9.0, 22.0, 23.0, 32.0, 37.0, 39.0, 54.0, 47.0, 70.0, 59.0, 55.0, 71.0, 66.0, 61.0, 45.0, 41.0, 46.0, 36.0, 22.0, 13.0, 17.0, 18.0, 15.0, 7.0, 9.0, 4.0, 6.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0025463104248046875, -0.002461731433868408, -0.002377152442932129, -0.0022925734519958496, -0.0022079944610595703, -0.002123415470123291, -0.0020388364791870117, -0.0019542574882507324, -0.0018696784973144531, -0.0017850995063781738, -0.0017005205154418945, -0.0016159415245056152, -0.001531362533569336, -0.0014467835426330566, -0.0013622045516967773, -0.001277625560760498, -0.0011930465698242188, -0.0011084675788879395, -0.0010238885879516602, -0.0009393095970153809, -0.0008547306060791016, -0.0007701516151428223, -0.000685572624206543, -0.0006009936332702637, -0.0005164146423339844, -0.0004318356513977051, -0.0003472566604614258, -0.0002626776695251465, -0.0001780986785888672, -9.351968765258789e-05, -8.940696716308594e-06, 7.56382942199707e-05, 0.00016021728515625, 0.0002447962760925293, 0.0003293752670288086, 0.0004139542579650879, 0.0004985332489013672, 0.0005831122398376465, 0.0006676912307739258, 0.0007522702217102051, 0.0008368492126464844, 0.0009214282035827637, 0.001006007194519043, 0.0010905861854553223, 0.0011751651763916016, 0.0012597441673278809, 0.0013443231582641602, 0.0014289021492004395, 0.0015134811401367188, 0.001598060131072998, 0.0016826391220092773, 0.0017672181129455566, 0.001851797103881836, 0.0019363760948181152, 0.0020209550857543945, 0.002105534076690674, 0.002190113067626953, 0.0022746920585632324, 0.0023592710494995117, 0.002443850040435791, 0.0025284290313720703, 0.0026130080223083496, 0.002697587013244629, 0.002782166004180908, 0.0028667449951171875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 5.0, 2.0, 3.0, 2.0, 10.0, 7.0, 12.0, 15.0, 15.0, 19.0, 21.0, 28.0, 53.0, 49.0, 77.0, 154.0, 332.0, 848.0, 175033.0, 869951.0, 1059.0, 383.0, 154.0, 93.0, 68.0, 32.0, 29.0, 22.0, 16.0, 17.0, 8.0, 7.0, 5.0, 3.0, 6.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0740966796875, -0.07178688049316406, -0.06947708129882812, -0.06716728210449219, -0.06485748291015625, -0.06254768371582031, -0.060237884521484375, -0.05792808532714844, -0.0556182861328125, -0.05330848693847656, -0.050998687744140625, -0.04868888854980469, -0.04637908935546875, -0.04406929016113281, -0.041759490966796875, -0.03944969177246094, -0.037139892578125, -0.03483009338378906, -0.032520294189453125, -0.030210494995117188, -0.02790069580078125, -0.025590896606445312, -0.023281097412109375, -0.020971298217773438, -0.0186614990234375, -0.016351699829101562, -0.014041900634765625, -0.011732101440429688, -0.00942230224609375, -0.0071125030517578125, -0.004802703857421875, -0.0024929046630859375, -0.00018310546875, 0.0021266937255859375, 0.004436492919921875, 0.0067462921142578125, 0.00905609130859375, 0.011365890502929688, 0.013675689697265625, 0.015985488891601562, 0.0182952880859375, 0.020605087280273438, 0.022914886474609375, 0.025224685668945312, 0.02753448486328125, 0.029844284057617188, 0.032154083251953125, 0.03446388244628906, 0.036773681640625, 0.03908348083496094, 0.041393280029296875, 0.04370307922363281, 0.04601287841796875, 0.04832267761230469, 0.050632476806640625, 0.05294227600097656, 0.0552520751953125, 0.05756187438964844, 0.059871673583984375, 0.06218147277832031, 0.06449127197265625, 0.06680107116699219, 0.06911087036132812, 0.07142066955566406, 0.07373046875]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 87.0, 517.0, 361.0, 41.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.008776150643825531, -0.008561138063669205, -0.008346124552190304, -0.008131111040711403, -0.007916098460555077, -0.007701085414737463, -0.007486072368919849, -0.007271059323102236, -0.007056046277284622, -0.006841033231467009, -0.006626020185649395, -0.006411007139831781, -0.006195994094014168, -0.005980981048196554, -0.005765968002378941, -0.005550954956561327, -0.005335941910743713, -0.0051209288649261, -0.004905915819108486, -0.004690902773290873, -0.004475889727473259, -0.004260876681655645, -0.004045863635838032, -0.003830850590020418, -0.0036158375442028046, -0.003400824498385191, -0.0031858114525675774, -0.0029707984067499638, -0.00275578536093235, -0.0025407723151147366, -0.002325759269297123, -0.0021107462234795094, -0.001895733643323183, -0.0016807205975055695, -0.0014657075516879559, -0.0012506945058703423, -0.0010356814600527287, -0.000820668414235115, -0.0006056553684175014, -0.00039064232259988785, -0.00017562927678227425, 3.9383769035339355e-05, 0.00025439681485295296, 0.00046940986067056656, 0.0006844229064881802, 0.0008994359523057938, 0.0011144489981234074, 0.001329462043941021, 0.0015444750897586346, 0.0017594881355762482, 0.0019745011813938618, 0.0021895142272114754, 0.002404527273029089, 0.0026195403188467026, 0.002834553364664316, 0.0030495664104819298, 0.0032645794562995434, 0.003479592502117157, 0.0036946055479347706, 0.003909618593752384, 0.004124631639569998, 0.004339644685387611, 0.004554657731205225, 0.004769670777022839, 0.004984683822840452]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 6.0, 6.0, 13.0, 12.0, 10.0, 12.0, 19.0, 11.0, 21.0, 23.0, 28.0, 18.0, 25.0, 21.0, 36.0, 33.0, 28.0, 50.0, 34.0, 45.0, 41.0, 37.0, 45.0, 40.0, 37.0, 30.0, 27.0, 35.0, 38.0, 37.0, 24.0, 27.0, 25.0, 17.0, 16.0, 7.0, 14.0, 9.0, 13.0, 4.0, 9.0, 9.0, 5.0, 1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011767148971557617, -0.0011347737163305283, -0.0010928325355052948, -0.0010508913546800613, -0.0010089501738548279, -0.0009670089930295944, -0.000925067812204361, -0.0008831266313791275, -0.000841185450553894, -0.0007992442697286606, -0.0007573030889034271, -0.0007153619080781937, -0.0006734207272529602, -0.0006314795464277267, -0.0005895383656024933, -0.0005475971847772598, -0.0005056560039520264, -0.0004637148231267929, -0.00042177364230155945, -0.000379832461476326, -0.00033789128065109253, -0.00029595009982585907, -0.0002540089190006256, -0.00021206773817539215, -0.0001701265573501587, -0.00012818537652492523, -8.624419569969177e-05, -4.430301487445831e-05, -2.3618340492248535e-06, 3.9579346776008606e-05, 8.152052760124207e-05, 0.00012346170842647552, 0.00016540288925170898, 0.00020734407007694244, 0.0002492852509021759, 0.00029122643172740936, 0.0003331676125526428, 0.0003751087933778763, 0.00041704997420310974, 0.0004589911550283432, 0.0005009323358535767, 0.0005428735166788101, 0.0005848146975040436, 0.000626755878329277, 0.0006686970591545105, 0.000710638239979744, 0.0007525794208049774, 0.0007945206016302109, 0.0008364617824554443, 0.0008784029632806778, 0.0009203441441059113, 0.0009622853249311447, 0.0010042265057563782, 0.0010461676865816116, 0.001088108867406845, 0.0011300500482320786, 0.001171991229057312, 0.0012139324098825455, 0.001255873590707779, 0.0012978147715330124, 0.0013397559523582458, 0.0013816971331834793, 0.0014236383140087128, 0.0014655794948339462, 0.0015075206756591797]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 8.0, 3.0, 6.0, 7.0, 11.0, 13.0, 6.0, 14.0, 16.0, 15.0, 15.0, 25.0, 28.0, 29.0, 30.0, 22.0, 30.0, 34.0, 27.0, 42.0, 39.0, 33.0, 36.0, 50.0, 37.0, 31.0, 42.0, 33.0, 36.0, 31.0, 35.0, 25.0, 25.0, 26.0, 20.0, 26.0, 18.0, 12.0, 14.0, 16.0, 7.0, 7.0, 4.0, 6.0, 5.0, 3.0, 1.0, 2.0, 5.0, 1.0, 1.0, 0.0, 2.0], "bins": [-6.0703125, -5.89111328125, -5.7119140625, -5.53271484375, -5.353515625, -5.17431640625, -4.9951171875, -4.81591796875, -4.63671875, -4.45751953125, -4.2783203125, -4.09912109375, -3.919921875, -3.74072265625, -3.5615234375, -3.38232421875, -3.203125, -3.02392578125, -2.8447265625, -2.66552734375, -2.486328125, -2.30712890625, -2.1279296875, -1.94873046875, -1.76953125, -1.59033203125, -1.4111328125, -1.23193359375, -1.052734375, -0.87353515625, -0.6943359375, -0.51513671875, -0.3359375, -0.15673828125, 0.0224609375, 0.20166015625, 0.380859375, 0.56005859375, 0.7392578125, 0.91845703125, 1.09765625, 1.27685546875, 1.4560546875, 1.63525390625, 1.814453125, 1.99365234375, 2.1728515625, 2.35205078125, 2.53125, 2.71044921875, 2.8896484375, 3.06884765625, 3.248046875, 3.42724609375, 3.6064453125, 3.78564453125, 3.96484375, 4.14404296875, 4.3232421875, 4.50244140625, 4.681640625, 4.86083984375, 5.0400390625, 5.21923828125, 5.3984375]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 4.0, 6.0, 13.0, 5.0, 11.0, 18.0, 26.0, 43.0, 64.0, 118.0, 166.0, 264.0, 440.0, 707.0, 1178.0, 1743.0, 2875.0, 4623.0, 8159.0, 14945.0, 29765.0, 63281.0, 144577.0, 334404.0, 243990.0, 101511.0, 45491.0, 22214.0, 11565.0, 6451.0, 3700.0, 2338.0, 1433.0, 859.0, 586.0, 349.0, 228.0, 136.0, 74.0, 67.0, 37.0, 28.0, 19.0, 15.0, 10.0, 8.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.6875, -3.571502685546875, -3.45550537109375, -3.339508056640625, -3.2235107421875, -3.107513427734375, -2.99151611328125, -2.875518798828125, -2.759521484375, -2.643524169921875, -2.52752685546875, -2.411529541015625, -2.2955322265625, -2.179534912109375, -2.06353759765625, -1.947540283203125, -1.83154296875, -1.715545654296875, -1.59954833984375, -1.483551025390625, -1.3675537109375, -1.251556396484375, -1.13555908203125, -1.019561767578125, -0.903564453125, -0.787567138671875, -0.67156982421875, -0.555572509765625, -0.4395751953125, -0.323577880859375, -0.20758056640625, -0.091583251953125, 0.0244140625, 0.140411376953125, 0.25640869140625, 0.372406005859375, 0.4884033203125, 0.604400634765625, 0.72039794921875, 0.836395263671875, 0.952392578125, 1.068389892578125, 1.18438720703125, 1.300384521484375, 1.4163818359375, 1.532379150390625, 1.64837646484375, 1.764373779296875, 1.88037109375, 1.996368408203125, 2.11236572265625, 2.228363037109375, 2.3443603515625, 2.460357666015625, 2.57635498046875, 2.692352294921875, 2.808349609375, 2.924346923828125, 3.04034423828125, 3.156341552734375, 3.2723388671875, 3.388336181640625, 3.50433349609375, 3.620330810546875, 3.736328125]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 5.0, 7.0, 8.0, 17.0, 12.0, 18.0, 21.0, 21.0, 32.0, 28.0, 27.0, 41.0, 37.0, 44.0, 74.0, 73.0, 136.0, 1562.0, 323.0, 106.0, 65.0, 45.0, 47.0, 43.0, 36.0, 39.0, 32.0, 18.0, 25.0, 20.0, 19.0, 8.0, 15.0, 10.0, 8.0, 7.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-23.953125, -23.224609375, -22.49609375, -21.767578125, -21.0390625, -20.310546875, -19.58203125, -18.853515625, -18.125, -17.396484375, -16.66796875, -15.939453125, -15.2109375, -14.482421875, -13.75390625, -13.025390625, -12.296875, -11.568359375, -10.83984375, -10.111328125, -9.3828125, -8.654296875, -7.92578125, -7.197265625, -6.46875, -5.740234375, -5.01171875, -4.283203125, -3.5546875, -2.826171875, -2.09765625, -1.369140625, -0.640625, 0.087890625, 0.81640625, 1.544921875, 2.2734375, 3.001953125, 3.73046875, 4.458984375, 5.1875, 5.916015625, 6.64453125, 7.373046875, 8.1015625, 8.830078125, 9.55859375, 10.287109375, 11.015625, 11.744140625, 12.47265625, 13.201171875, 13.9296875, 14.658203125, 15.38671875, 16.115234375, 16.84375, 17.572265625, 18.30078125, 19.029296875, 19.7578125, 20.486328125, 21.21484375, 21.943359375, 22.671875]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 8.0, 10.0, 11.0, 19.0, 27.0, 35.0, 50.0, 73.0, 101.0, 193.0, 275.0, 506.0, 2250.0, 2843919.0, 295527.0, 1521.0, 465.0, 243.0, 134.0, 92.0, 63.0, 54.0, 38.0, 21.0, 9.0, 13.0, 12.0, 7.0, 4.0, 6.0, 5.0, 4.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.8125, -67.478515625, -65.14453125, -62.810546875, -60.4765625, -58.142578125, -55.80859375, -53.474609375, -51.140625, -48.806640625, -46.47265625, -44.138671875, -41.8046875, -39.470703125, -37.13671875, -34.802734375, -32.46875, -30.134765625, -27.80078125, -25.466796875, -23.1328125, -20.798828125, -18.46484375, -16.130859375, -13.796875, -11.462890625, -9.12890625, -6.794921875, -4.4609375, -2.126953125, 0.20703125, 2.541015625, 4.875, 7.208984375, 9.54296875, 11.876953125, 14.2109375, 16.544921875, 18.87890625, 21.212890625, 23.546875, 25.880859375, 28.21484375, 30.548828125, 32.8828125, 35.216796875, 37.55078125, 39.884765625, 42.21875, 44.552734375, 46.88671875, 49.220703125, 51.5546875, 53.888671875, 56.22265625, 58.556640625, 60.890625, 63.224609375, 65.55859375, 67.892578125, 70.2265625, 72.560546875, 74.89453125, 77.228515625, 79.5625]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 10.0, 30.0, 90.0, 234.0, 333.0, 212.0, 80.0, 17.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.545326232910156, -54.41698455810547, -52.28864288330078, -50.160301208496094, -48.031959533691406, -45.90361785888672, -43.7752799987793, -41.64693832397461, -39.51859664916992, -37.390254974365234, -35.26191329956055, -33.13357162475586, -31.005231857299805, -28.876890182495117, -26.748550415039062, -24.620208740234375, -22.491867065429688, -20.363525390625, -18.235183715820312, -16.106843948364258, -13.97850227355957, -11.850160598754883, -9.721819877624512, -7.593479156494141, -5.465137481689453, -3.336796283721924, -1.2084550857543945, 0.9198861122131348, 3.048227310180664, 5.176568984985352, 7.304909706115723, 9.433250427246094, 11.561599731445312, 13.68994140625, 15.818282127380371, 17.946622848510742, 20.07496452331543, 22.203306198120117, 24.331645965576172, 26.45998764038086, 28.588329315185547, 30.716670989990234, 32.84501266479492, 34.97335433959961, 37.10169219970703, 39.23003387451172, 41.358375549316406, 43.486717224121094, 45.61505889892578, 47.74340057373047, 49.871742248535156, 52.000083923339844, 54.12842559814453, 56.25676727294922, 58.38510513305664, 60.51344680786133, 62.641788482666016, 64.77012634277344, 66.89846801757812, 69.02680969238281, 71.1551513671875, 73.28349304199219, 75.41183471679688, 77.54017639160156, 79.66851806640625]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 5.0, 7.0, 9.0, 8.0, 17.0, 17.0, 22.0, 16.0, 19.0, 23.0, 37.0, 30.0, 42.0, 61.0, 44.0, 51.0, 45.0, 47.0, 52.0, 58.0, 57.0, 44.0, 38.0, 37.0, 27.0, 25.0, 23.0, 29.0, 18.0, 34.0, 14.0, 14.0, 14.0, 6.0, 6.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-87.09019470214844, -84.74664306640625, -82.40308380126953, -80.05953216552734, -77.71597290039062, -75.37242126464844, -73.02886199951172, -70.68531036376953, -68.34175109863281, -65.99819946289062, -63.654640197753906, -61.31108474731445, -58.967529296875, -56.62397384643555, -54.280418395996094, -51.936866760253906, -49.59331130981445, -47.249755859375, -44.90620040893555, -42.562644958496094, -40.21908950805664, -37.87553405761719, -35.531982421875, -33.18842315673828, -30.84486961364746, -28.501314163208008, -26.157758712768555, -23.814205169677734, -21.47064971923828, -19.127094268798828, -16.783538818359375, -14.439983367919922, -12.096424102783203, -9.75286865234375, -7.409313678741455, -5.06575870513916, -2.722203254699707, -0.3786478042602539, 1.9649066925048828, 4.308462142944336, 6.652017593383789, 8.995573043823242, 11.339128494262695, 13.682682991027832, 16.02623748779297, 18.369792938232422, 20.713348388671875, 23.056903839111328, 25.40045928955078, 27.744014739990234, 30.087570190429688, 32.43112564086914, 34.774681091308594, 37.11823654174805, 39.4617919921875, 41.80534362792969, 44.148902893066406, 46.49245834350586, 48.83601379394531, 51.179569244384766, 53.52312469482422, 55.86668014526367, 58.210235595703125, 60.55378723144531, 62.897342681884766]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 6.0, 5.0, 7.0, 7.0, 9.0, 19.0, 7.0, 9.0, 13.0, 14.0, 21.0, 31.0, 24.0, 28.0, 40.0, 29.0, 28.0, 34.0, 35.0, 41.0, 38.0, 45.0, 46.0, 47.0, 37.0, 38.0, 29.0, 30.0, 34.0, 25.0, 35.0, 28.0, 24.0, 22.0, 23.0, 21.0, 12.0, 17.0, 6.0, 14.0, 9.0, 6.0, 5.0, 1.0, 0.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.79296875, -6.593505859375, -6.39404296875, -6.194580078125, -5.9951171875, -5.795654296875, -5.59619140625, -5.396728515625, -5.197265625, -4.997802734375, -4.79833984375, -4.598876953125, -4.3994140625, -4.199951171875, -4.00048828125, -3.801025390625, -3.6015625, -3.402099609375, -3.20263671875, -3.003173828125, -2.8037109375, -2.604248046875, -2.40478515625, -2.205322265625, -2.005859375, -1.806396484375, -1.60693359375, -1.407470703125, -1.2080078125, -1.008544921875, -0.80908203125, -0.609619140625, -0.41015625, -0.210693359375, -0.01123046875, 0.188232421875, 0.3876953125, 0.587158203125, 0.78662109375, 0.986083984375, 1.185546875, 1.385009765625, 1.58447265625, 1.783935546875, 1.9833984375, 2.182861328125, 2.38232421875, 2.581787109375, 2.78125, 2.980712890625, 3.18017578125, 3.379638671875, 3.5791015625, 3.778564453125, 3.97802734375, 4.177490234375, 4.376953125, 4.576416015625, 4.77587890625, 4.975341796875, 5.1748046875, 5.374267578125, 5.57373046875, 5.773193359375, 5.97265625]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 8.0, 7.0, 12.0, 12.0, 26.0, 28.0, 41.0, 55.0, 71.0, 73.0, 146.0, 200.0, 295.0, 557.0, 1001.0, 2211.0, 6333.0, 22343.0, 112595.0, 672401.0, 1867328.0, 1201513.0, 247749.0, 42765.0, 10220.0, 3194.0, 1309.0, 646.0, 356.0, 233.0, 147.0, 100.0, 95.0, 52.0, 38.0, 30.0, 22.0, 17.0, 15.0, 10.0, 10.0, 7.0, 5.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-10.75, -10.4403076171875, -10.130615234375, -9.8209228515625, -9.51123046875, -9.2015380859375, -8.891845703125, -8.5821533203125, -8.2724609375, -7.9627685546875, -7.653076171875, -7.3433837890625, -7.03369140625, -6.7239990234375, -6.414306640625, -6.1046142578125, -5.794921875, -5.4852294921875, -5.175537109375, -4.8658447265625, -4.55615234375, -4.2464599609375, -3.936767578125, -3.6270751953125, -3.3173828125, -3.0076904296875, -2.697998046875, -2.3883056640625, -2.07861328125, -1.7689208984375, -1.459228515625, -1.1495361328125, -0.83984375, -0.5301513671875, -0.220458984375, 0.0892333984375, 0.39892578125, 0.7086181640625, 1.018310546875, 1.3280029296875, 1.6376953125, 1.9473876953125, 2.257080078125, 2.5667724609375, 2.87646484375, 3.1861572265625, 3.495849609375, 3.8055419921875, 4.115234375, 4.4249267578125, 4.734619140625, 5.0443115234375, 5.35400390625, 5.6636962890625, 5.973388671875, 6.2830810546875, 6.5927734375, 6.9024658203125, 7.212158203125, 7.5218505859375, 7.83154296875, 8.1412353515625, 8.450927734375, 8.7606201171875, 9.0703125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 7.0, 3.0, 11.0, 9.0, 19.0, 30.0, 47.0, 63.0, 92.0, 105.0, 167.0, 267.0, 399.0, 490.0, 606.0, 497.0, 386.0, 278.0, 200.0, 121.0, 89.0, 76.0, 40.0, 22.0, 24.0, 10.0, 6.0, 5.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.875, -20.28564453125, -19.6962890625, -19.10693359375, -18.517578125, -17.92822265625, -17.3388671875, -16.74951171875, -16.16015625, -15.57080078125, -14.9814453125, -14.39208984375, -13.802734375, -13.21337890625, -12.6240234375, -12.03466796875, -11.4453125, -10.85595703125, -10.2666015625, -9.67724609375, -9.087890625, -8.49853515625, -7.9091796875, -7.31982421875, -6.73046875, -6.14111328125, -5.5517578125, -4.96240234375, -4.373046875, -3.78369140625, -3.1943359375, -2.60498046875, -2.015625, -1.42626953125, -0.8369140625, -0.24755859375, 0.341796875, 0.93115234375, 1.5205078125, 2.10986328125, 2.69921875, 3.28857421875, 3.8779296875, 4.46728515625, 5.056640625, 5.64599609375, 6.2353515625, 6.82470703125, 7.4140625, 8.00341796875, 8.5927734375, 9.18212890625, 9.771484375, 10.36083984375, 10.9501953125, 11.53955078125, 12.12890625, 12.71826171875, 13.3076171875, 13.89697265625, 14.486328125, 15.07568359375, 15.6650390625, 16.25439453125, 16.84375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 7.0, 13.0, 7.0, 10.0, 18.0, 22.0, 20.0, 39.0, 52.0, 48.0, 71.0, 118.0, 151.0, 273.0, 452.0, 1194.0, 22406.0, 4055822.0, 110575.0, 1663.0, 467.0, 253.0, 154.0, 109.0, 81.0, 52.0, 48.0, 36.0, 28.0, 22.0, 20.0, 12.0, 9.0, 3.0, 5.0, 6.0, 6.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.0, -59.9072265625, -57.814453125, -55.7216796875, -53.62890625, -51.5361328125, -49.443359375, -47.3505859375, -45.2578125, -43.1650390625, -41.072265625, -38.9794921875, -36.88671875, -34.7939453125, -32.701171875, -30.6083984375, -28.515625, -26.4228515625, -24.330078125, -22.2373046875, -20.14453125, -18.0517578125, -15.958984375, -13.8662109375, -11.7734375, -9.6806640625, -7.587890625, -5.4951171875, -3.40234375, -1.3095703125, 0.783203125, 2.8759765625, 4.96875, 7.0615234375, 9.154296875, 11.2470703125, 13.33984375, 15.4326171875, 17.525390625, 19.6181640625, 21.7109375, 23.8037109375, 25.896484375, 27.9892578125, 30.08203125, 32.1748046875, 34.267578125, 36.3603515625, 38.453125, 40.5458984375, 42.638671875, 44.7314453125, 46.82421875, 48.9169921875, 51.009765625, 53.1025390625, 55.1953125, 57.2880859375, 59.380859375, 61.4736328125, 63.56640625, 65.6591796875, 67.751953125, 69.8447265625, 71.9375]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 19.0, 36.0, 73.0, 143.0, 214.0, 218.0, 161.0, 86.0, 38.0, 19.0, 6.0, 1.0, 1.0, 1.0, 1.0], "bins": [-197.10147094726562, -193.4561767578125, -189.81089782714844, -186.1656036376953, -182.52032470703125, -178.87503051757812, -175.22975158691406, -171.58445739746094, -167.93917846679688, -164.29388427734375, -160.6486053466797, -157.00331115722656, -153.3580322265625, -149.71273803710938, -146.0674591064453, -142.4221649169922, -138.77688598632812, -135.131591796875, -131.48631286621094, -127.84102630615234, -124.19573974609375, -120.55045318603516, -116.90516662597656, -113.25987243652344, -109.61457824707031, -105.96929168701172, -102.32400512695312, -98.67871856689453, -95.03343200683594, -91.38814544677734, -87.74285888671875, -84.09756469726562, -80.45228576660156, -76.80699920654297, -73.16171264648438, -69.51642608642578, -65.87113952636719, -62.225852966308594, -58.580562591552734, -54.93527603149414, -51.28999328613281, -47.64470672607422, -43.999420166015625, -40.35413360595703, -36.70884704589844, -33.063560485839844, -29.418270111083984, -25.77298355102539, -22.127696990966797, -18.482410430908203, -14.837122917175293, -11.191835403442383, -7.546548843383789, -3.9012622833251953, -0.25597381591796875, 3.389312744140625, 7.034599304199219, 10.679885864257812, 14.325173377990723, 17.970460891723633, 21.615747451782227, 25.26103401184082, 28.906322479248047, 32.55160903930664, 36.196895599365234]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0, 3.0, 3.0, 5.0, 11.0, 6.0, 4.0, 1.0, 13.0, 14.0, 10.0, 15.0, 18.0, 24.0, 25.0, 25.0, 33.0, 42.0, 50.0, 30.0, 22.0, 42.0, 40.0, 39.0, 46.0, 38.0, 41.0, 34.0, 34.0, 31.0, 30.0, 33.0, 28.0, 20.0, 30.0, 21.0, 22.0, 14.0, 22.0, 11.0, 13.0, 14.0, 11.0, 11.0, 7.0, 5.0, 7.0, 2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0], "bins": [-49.736572265625, -48.22053146362305, -46.70449447631836, -45.188453674316406, -43.67241287231445, -42.1563720703125, -40.64033508300781, -39.12429428100586, -37.608253479003906, -36.09221267700195, -34.576175689697266, -33.06013488769531, -31.54409408569336, -30.02805519104004, -28.51201629638672, -26.995975494384766, -25.479936599731445, -23.963897705078125, -22.447856903076172, -20.93181800842285, -19.4157772064209, -17.899738311767578, -16.383697509765625, -14.867658615112305, -13.351618766784668, -11.835578918457031, -10.319539070129395, -8.803499221801758, -7.287459850311279, -5.771420001983643, -4.255380630493164, -2.7393407821655273, -1.2233009338378906, 0.29273879528045654, 1.8087785243988037, 3.3248181343078613, 4.840857982635498, 6.356897830963135, 7.872937202453613, 9.38897705078125, 10.905016899108887, 12.421056747436523, 13.93709659576416, 15.453136444091797, 16.969175338745117, 18.48521614074707, 20.00125503540039, 21.517295837402344, 23.033334732055664, 24.549373626708984, 26.065414428710938, 27.581453323364258, 29.09749412536621, 30.61353302001953, 32.129573822021484, 33.64561462402344, 35.161651611328125, 36.67769241333008, 38.193729400634766, 39.70977020263672, 41.22581100463867, 42.741851806640625, 44.25788879394531, 45.773929595947266, 47.28997039794922]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 2.0, 2.0, 5.0, 4.0, 3.0, 2.0, 4.0, 10.0, 6.0, 14.0, 12.0, 19.0, 23.0, 21.0, 23.0, 27.0, 18.0, 30.0, 36.0, 38.0, 42.0, 37.0, 29.0, 41.0, 46.0, 55.0, 38.0, 35.0, 36.0, 37.0, 38.0, 31.0, 38.0, 19.0, 35.0, 22.0, 24.0, 18.0, 11.0, 17.0, 12.0, 10.0, 7.0, 8.0, 5.0, 6.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0], "bins": [-7.28125, -7.07867431640625, -6.8760986328125, -6.67352294921875, -6.470947265625, -6.26837158203125, -6.0657958984375, -5.86322021484375, -5.66064453125, -5.45806884765625, -5.2554931640625, -5.05291748046875, -4.850341796875, -4.64776611328125, -4.4451904296875, -4.24261474609375, -4.0400390625, -3.83746337890625, -3.6348876953125, -3.43231201171875, -3.229736328125, -3.02716064453125, -2.8245849609375, -2.62200927734375, -2.41943359375, -2.21685791015625, -2.0142822265625, -1.81170654296875, -1.609130859375, -1.40655517578125, -1.2039794921875, -1.00140380859375, -0.798828125, -0.59625244140625, -0.3936767578125, -0.19110107421875, 0.011474609375, 0.21405029296875, 0.4166259765625, 0.61920166015625, 0.82177734375, 1.02435302734375, 1.2269287109375, 1.42950439453125, 1.632080078125, 1.83465576171875, 2.0372314453125, 2.23980712890625, 2.4423828125, 2.64495849609375, 2.8475341796875, 3.05010986328125, 3.252685546875, 3.45526123046875, 3.6578369140625, 3.86041259765625, 4.06298828125, 4.26556396484375, 4.4681396484375, 4.67071533203125, 4.873291015625, 5.07586669921875, 5.2784423828125, 5.48101806640625, 5.68359375]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 11.0, 8.0, 30.0, 26.0, 52.0, 48.0, 101.0, 171.0, 260.0, 335.0, 489.0, 731.0, 954.0, 1607.0, 2317.0, 3660.0, 5475.0, 8474.0, 13008.0, 20253.0, 31856.0, 50386.0, 80891.0, 130833.0, 205850.0, 183747.0, 113583.0, 70488.0, 44074.0, 27592.0, 17897.0, 11515.0, 7449.0, 4793.0, 3253.0, 2027.0, 1492.0, 978.0, 610.0, 401.0, 296.0, 178.0, 128.0, 72.0, 49.0, 47.0, 20.0, 15.0, 12.0, 8.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.76220703125, -0.7390060424804688, -0.7158050537109375, -0.6926040649414062, -0.669403076171875, -0.6462020874023438, -0.6230010986328125, -0.5998001098632812, -0.57659912109375, -0.5533981323242188, -0.5301971435546875, -0.5069961547851562, -0.483795166015625, -0.46059417724609375, -0.4373931884765625, -0.41419219970703125, -0.3909912109375, -0.36779022216796875, -0.3445892333984375, -0.32138824462890625, -0.298187255859375, -0.27498626708984375, -0.2517852783203125, -0.22858428955078125, -0.20538330078125, -0.18218231201171875, -0.1589813232421875, -0.13578033447265625, -0.112579345703125, -0.08937835693359375, -0.0661773681640625, -0.04297637939453125, -0.019775390625, 0.00342559814453125, 0.0266265869140625, 0.04982757568359375, 0.073028564453125, 0.09622955322265625, 0.1194305419921875, 0.14263153076171875, 0.16583251953125, 0.18903350830078125, 0.2122344970703125, 0.23543548583984375, 0.258636474609375, 0.28183746337890625, 0.3050384521484375, 0.32823944091796875, 0.3514404296875, 0.37464141845703125, 0.3978424072265625, 0.42104339599609375, 0.444244384765625, 0.46744537353515625, 0.4906463623046875, 0.5138473510742188, 0.53704833984375, 0.5602493286132812, 0.5834503173828125, 0.6066513061523438, 0.629852294921875, 0.6530532836914062, 0.6762542724609375, 0.6994552612304688, 0.72265625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 3.0, 10.0, 6.0, 7.0, 8.0, 7.0, 11.0, 14.0, 15.0, 13.0, 20.0, 28.0, 44.0, 24.0, 34.0, 29.0, 26.0, 33.0, 41.0, 34.0, 45.0, 41.0, 1053.0, 44.0, 36.0, 38.0, 31.0, 50.0, 33.0, 23.0, 28.0, 37.0, 14.0, 20.0, 22.0, 14.0, 18.0, 18.0, 9.0, 10.0, 11.0, 5.0, 2.0, 4.0, 4.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.515625, -3.392333984375, -3.26904296875, -3.145751953125, -3.0224609375, -2.899169921875, -2.77587890625, -2.652587890625, -2.529296875, -2.406005859375, -2.28271484375, -2.159423828125, -2.0361328125, -1.912841796875, -1.78955078125, -1.666259765625, -1.54296875, -1.419677734375, -1.29638671875, -1.173095703125, -1.0498046875, -0.926513671875, -0.80322265625, -0.679931640625, -0.556640625, -0.433349609375, -0.31005859375, -0.186767578125, -0.0634765625, 0.059814453125, 0.18310546875, 0.306396484375, 0.4296875, 0.552978515625, 0.67626953125, 0.799560546875, 0.9228515625, 1.046142578125, 1.16943359375, 1.292724609375, 1.416015625, 1.539306640625, 1.66259765625, 1.785888671875, 1.9091796875, 2.032470703125, 2.15576171875, 2.279052734375, 2.40234375, 2.525634765625, 2.64892578125, 2.772216796875, 2.8955078125, 3.018798828125, 3.14208984375, 3.265380859375, 3.388671875, 3.511962890625, 3.63525390625, 3.758544921875, 3.8818359375, 4.005126953125, 4.12841796875, 4.251708984375, 4.375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 5.0, 14.0, 15.0, 24.0, 23.0, 37.0, 60.0, 89.0, 103.0, 149.0, 198.0, 345.0, 464.0, 686.0, 961.0, 1493.0, 2140.0, 3311.0, 4708.0, 7284.0, 11142.0, 17272.0, 27486.0, 42240.0, 66187.0, 105239.0, 168327.0, 1252917.0, 140489.0, 87171.0, 55050.0, 35482.0, 22875.0, 14682.0, 9517.0, 6296.0, 4091.0, 2630.0, 1859.0, 1249.0, 888.0, 628.0, 412.0, 283.0, 207.0, 132.0, 91.0, 65.0, 46.0, 25.0, 15.0, 12.0, 12.0, 5.0, 6.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.5810546875, -0.5612258911132812, -0.5413970947265625, -0.5215682983398438, -0.501739501953125, -0.48191070556640625, -0.4620819091796875, -0.44225311279296875, -0.42242431640625, -0.40259552001953125, -0.3827667236328125, -0.36293792724609375, -0.343109130859375, -0.32328033447265625, -0.3034515380859375, -0.28362274169921875, -0.2637939453125, -0.24396514892578125, -0.2241363525390625, -0.20430755615234375, -0.184478759765625, -0.16464996337890625, -0.1448211669921875, -0.12499237060546875, -0.10516357421875, -0.08533477783203125, -0.0655059814453125, -0.04567718505859375, -0.025848388671875, -0.00601959228515625, 0.0138092041015625, 0.03363800048828125, 0.053466796875, 0.07329559326171875, 0.0931243896484375, 0.11295318603515625, 0.132781982421875, 0.15261077880859375, 0.1724395751953125, 0.19226837158203125, 0.21209716796875, 0.23192596435546875, 0.2517547607421875, 0.27158355712890625, 0.291412353515625, 0.31124114990234375, 0.3310699462890625, 0.35089874267578125, 0.3707275390625, 0.39055633544921875, 0.4103851318359375, 0.43021392822265625, 0.450042724609375, 0.46987152099609375, 0.4897003173828125, 0.5095291137695312, 0.52935791015625, 0.5491867065429688, 0.5690155029296875, 0.5888442993164062, 0.608673095703125, 0.6285018920898438, 0.6483306884765625, 0.6681594848632812, 0.68798828125]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 5.0, 2.0, 6.0, 3.0, 5.0, 8.0, 8.0, 10.0, 9.0, 15.0, 10.0, 12.0, 17.0, 23.0, 15.0, 41.0, 32.0, 42.0, 40.0, 53.0, 47.0, 71.0, 70.0, 71.0, 63.0, 65.0, 39.0, 38.0, 38.0, 23.0, 19.0, 23.0, 17.0, 19.0, 12.0, 5.0, 6.0, 7.0, 8.0, 6.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.002613067626953125, -0.002532660961151123, -0.002452254295349121, -0.002371847629547119, -0.002291440963745117, -0.0022110342979431152, -0.0021306276321411133, -0.0020502209663391113, -0.0019698143005371094, -0.0018894076347351074, -0.0018090009689331055, -0.0017285943031311035, -0.0016481876373291016, -0.0015677809715270996, -0.0014873743057250977, -0.0014069676399230957, -0.0013265609741210938, -0.0012461543083190918, -0.0011657476425170898, -0.0010853409767150879, -0.001004934310913086, -0.000924527645111084, -0.000844120979309082, -0.0007637143135070801, -0.0006833076477050781, -0.0006029009819030762, -0.0005224943161010742, -0.00044208765029907227, -0.0003616809844970703, -0.00028127431869506836, -0.0002008676528930664, -0.00012046098709106445, -4.00543212890625e-05, 4.035234451293945e-05, 0.0001207590103149414, 0.00020116567611694336, 0.0002815723419189453, 0.00036197900772094727, 0.0004423856735229492, 0.0005227923393249512, 0.0006031990051269531, 0.0006836056709289551, 0.000764012336730957, 0.000844419002532959, 0.0009248256683349609, 0.0010052323341369629, 0.0010856389999389648, 0.0011660456657409668, 0.0012464523315429688, 0.0013268589973449707, 0.0014072656631469727, 0.0014876723289489746, 0.0015680789947509766, 0.0016484856605529785, 0.0017288923263549805, 0.0018092989921569824, 0.0018897056579589844, 0.0019701123237609863, 0.0020505189895629883, 0.0021309256553649902, 0.002211332321166992, 0.002291738986968994, 0.002372145652770996, 0.002452552318572998, 0.002532958984375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 6.0, 3.0, 6.0, 3.0, 8.0, 6.0, 8.0, 16.0, 19.0, 18.0, 22.0, 29.0, 55.0, 95.0, 159.0, 320.0, 851.0, 48069.0, 996317.0, 1551.0, 448.0, 164.0, 105.0, 68.0, 42.0, 33.0, 25.0, 19.0, 15.0, 9.0, 12.0, 8.0, 8.0, 15.0, 5.0, 8.0, 4.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.07171630859375, -0.06955623626708984, -0.06739616394042969, -0.06523609161376953, -0.06307601928710938, -0.06091594696044922, -0.05875587463378906, -0.056595802307128906, -0.05443572998046875, -0.052275657653808594, -0.05011558532714844, -0.04795551300048828, -0.045795440673828125, -0.04363536834716797, -0.04147529602050781, -0.039315223693847656, -0.0371551513671875, -0.034995079040527344, -0.03283500671386719, -0.03067493438720703, -0.028514862060546875, -0.02635478973388672, -0.024194717407226562, -0.022034645080566406, -0.01987457275390625, -0.017714500427246094, -0.015554428100585938, -0.013394355773925781, -0.011234283447265625, -0.009074211120605469, -0.0069141387939453125, -0.004754066467285156, -0.002593994140625, -0.00043392181396484375, 0.0017261505126953125, 0.0038862228393554688, 0.006046295166015625, 0.008206367492675781, 0.010366439819335938, 0.012526512145996094, 0.01468658447265625, 0.016846656799316406, 0.019006729125976562, 0.02116680145263672, 0.023326873779296875, 0.02548694610595703, 0.027647018432617188, 0.029807090759277344, 0.0319671630859375, 0.034127235412597656, 0.03628730773925781, 0.03844738006591797, 0.040607452392578125, 0.04276752471923828, 0.04492759704589844, 0.047087669372558594, 0.04924774169921875, 0.051407814025878906, 0.05356788635253906, 0.05572795867919922, 0.057888031005859375, 0.06004810333251953, 0.06220817565917969, 0.06436824798583984, 0.0665283203125]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 6.0, 18.0, 59.0, 149.0, 261.0, 268.0, 153.0, 69.0, 20.0, 8.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00555547745898366, -0.005450621247291565, -0.005345764569938183, -0.005240908358246088, -0.005136052146553993, -0.005031195469200611, -0.004926339257508516, -0.0048214830458164215, -0.004716626368463039, -0.004611770156770945, -0.0045069134794175625, -0.004402057267725468, -0.004297201056033373, -0.004192344378679991, -0.004087488166987896, -0.003982631955295801, -0.0038777755107730627, -0.0037729190662503242, -0.0036680628545582294, -0.003563206410035491, -0.0034583499655127525, -0.0033534937538206577, -0.0032486373092979193, -0.003143780864775181, -0.003038924653083086, -0.0029340682085603476, -0.0028292119968682528, -0.0027243555523455143, -0.002619499107822776, -0.0025146426633000374, -0.0024097864516079426, -0.002304930007085204, -0.0022000735625624657, -0.002095217118039727, -0.0019903609063476324, -0.001885504461824894, -0.0017806480173021555, -0.0016757916891947389, -0.0015709353610873222, -0.0014660789165645838, -0.0013612224720418453, -0.0012563661439344287, -0.0011515096994116902, -0.0010466533713042736, -0.0009417969849891961, -0.0008369405986741185, -0.0007320842705667019, -0.0006272278842516243, -0.0005223714979365468, -0.00041751511162146926, -0.00031265875441022217, -0.00020780239719897509, -0.00010294601088389754, 1.9103754311800003e-06, 0.00010676670353859663, 0.00021162308985367417, 0.0003164794761687517, 0.00042133586248382926, 0.0005261922487989068, 0.0006310485769063234, 0.000735904963221401, 0.0008407613495364785, 0.0009456176776438951, 0.0010504741221666336, 0.0011553304502740502]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 1.0, 1.0, 3.0, 5.0, 5.0, 6.0, 6.0, 3.0, 8.0, 10.0, 15.0, 17.0, 10.0, 23.0, 14.0, 31.0, 31.0, 35.0, 35.0, 29.0, 32.0, 39.0, 27.0, 35.0, 39.0, 31.0, 42.0, 42.0, 32.0, 26.0, 31.0, 40.0, 34.0, 27.0, 27.0, 29.0, 17.0, 20.0, 23.0, 17.0, 14.0, 12.0, 23.0, 12.0, 9.0, 6.0, 7.0, 6.0, 6.0, 2.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 5.0], "bins": [-0.0012511610984802246, -0.0012137191370129585, -0.0011762771755456924, -0.0011388352140784264, -0.0011013932526111603, -0.0010639512911438942, -0.0010265093296766281, -0.000989067368209362, -0.000951625406742096, -0.0009141834452748299, -0.0008767414838075638, -0.0008392995223402977, -0.0008018575608730316, -0.0007644155994057655, -0.0007269736379384995, -0.0006895316764712334, -0.0006520897150039673, -0.0006146477535367012, -0.0005772057920694351, -0.000539763830602169, -0.000502321869134903, -0.00046487990766763687, -0.0004274379462003708, -0.0003899959847331047, -0.0003525540232658386, -0.00031511206179857254, -0.00027767010033130646, -0.00024022813886404037, -0.0002027861773967743, -0.0001653442159295082, -0.00012790225446224213, -9.046029299497604e-05, -5.301833152770996e-05, -1.5576370060443878e-05, 2.1865591406822205e-05, 5.930755287408829e-05, 9.674951434135437e-05, 0.00013419147580862045, 0.00017163343727588654, 0.00020907539874315262, 0.0002465173602104187, 0.0002839593216776848, 0.00032140128314495087, 0.00035884324461221695, 0.00039628520607948303, 0.0004337271675467491, 0.0004711691290140152, 0.0005086110904812813, 0.0005460530519485474, 0.0005834950134158134, 0.0006209369748830795, 0.0006583789363503456, 0.0006958208978176117, 0.0007332628592848778, 0.0007707048207521439, 0.0008081467822194099, 0.000845588743686676, 0.0008830307051539421, 0.0009204726666212082, 0.0009579146280884743, 0.0009953565895557404, 0.0010327985510230064, 0.0010702405124902725, 0.0011076824739575386, 0.0011451244354248047]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 2.0, 2.0, 5.0, 4.0, 3.0, 2.0, 4.0, 10.0, 6.0, 14.0, 12.0, 19.0, 23.0, 21.0, 23.0, 27.0, 18.0, 30.0, 36.0, 38.0, 42.0, 37.0, 29.0, 41.0, 46.0, 55.0, 38.0, 35.0, 36.0, 37.0, 38.0, 31.0, 38.0, 19.0, 35.0, 22.0, 24.0, 18.0, 11.0, 17.0, 12.0, 10.0, 7.0, 8.0, 5.0, 6.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0], "bins": [-7.28125, -7.07867431640625, -6.8760986328125, -6.67352294921875, -6.470947265625, -6.26837158203125, -6.0657958984375, -5.86322021484375, -5.66064453125, -5.45806884765625, -5.2554931640625, -5.05291748046875, -4.850341796875, -4.64776611328125, -4.4451904296875, -4.24261474609375, -4.0400390625, -3.83746337890625, -3.6348876953125, -3.43231201171875, -3.229736328125, -3.02716064453125, -2.8245849609375, -2.62200927734375, -2.41943359375, -2.21685791015625, -2.0142822265625, -1.81170654296875, -1.609130859375, -1.40655517578125, -1.2039794921875, -1.00140380859375, -0.798828125, -0.59625244140625, -0.3936767578125, -0.19110107421875, 0.011474609375, 0.21405029296875, 0.4166259765625, 0.61920166015625, 0.82177734375, 1.02435302734375, 1.2269287109375, 1.42950439453125, 1.632080078125, 1.83465576171875, 2.0372314453125, 2.23980712890625, 2.4423828125, 2.64495849609375, 2.8475341796875, 3.05010986328125, 3.252685546875, 3.45526123046875, 3.6578369140625, 3.86041259765625, 4.06298828125, 4.26556396484375, 4.4681396484375, 4.67071533203125, 4.873291015625, 5.07586669921875, 5.2784423828125, 5.48101806640625, 5.68359375]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 12.0, 8.0, 8.0, 7.0, 29.0, 35.0, 40.0, 53.0, 84.0, 121.0, 176.0, 261.0, 389.0, 605.0, 937.0, 1478.0, 2481.0, 4562.0, 8008.0, 14247.0, 25768.0, 48378.0, 94505.0, 193248.0, 290780.0, 176573.0, 86313.0, 44708.0, 23843.0, 13109.0, 7167.0, 4151.0, 2409.0, 1424.0, 906.0, 577.0, 344.0, 246.0, 193.0, 116.0, 72.0, 60.0, 26.0, 28.0, 19.0, 20.0, 12.0, 3.0, 12.0, 4.0, 2.0, 4.0, 2.0], "bins": [-4.3828125, -4.259124755859375, -4.13543701171875, -4.011749267578125, -3.8880615234375, -3.764373779296875, -3.64068603515625, -3.516998291015625, -3.393310546875, -3.269622802734375, -3.14593505859375, -3.022247314453125, -2.8985595703125, -2.774871826171875, -2.65118408203125, -2.527496337890625, -2.40380859375, -2.280120849609375, -2.15643310546875, -2.032745361328125, -1.9090576171875, -1.785369873046875, -1.66168212890625, -1.537994384765625, -1.414306640625, -1.290618896484375, -1.16693115234375, -1.043243408203125, -0.9195556640625, -0.795867919921875, -0.67218017578125, -0.548492431640625, -0.4248046875, -0.301116943359375, -0.17742919921875, -0.053741455078125, 0.0699462890625, 0.193634033203125, 0.31732177734375, 0.441009521484375, 0.564697265625, 0.688385009765625, 0.81207275390625, 0.935760498046875, 1.0594482421875, 1.183135986328125, 1.30682373046875, 1.430511474609375, 1.55419921875, 1.677886962890625, 1.80157470703125, 1.925262451171875, 2.0489501953125, 2.172637939453125, 2.29632568359375, 2.420013427734375, 2.543701171875, 2.667388916015625, 2.79107666015625, 2.914764404296875, 3.0384521484375, 3.162139892578125, 3.28582763671875, 3.409515380859375, 3.533203125]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 3.0, 5.0, 10.0, 9.0, 8.0, 12.0, 19.0, 22.0, 30.0, 32.0, 28.0, 43.0, 40.0, 41.0, 44.0, 58.0, 103.0, 236.0, 1641.0, 177.0, 88.0, 58.0, 48.0, 40.0, 28.0, 46.0, 26.0, 27.0, 23.0, 18.0, 15.0, 15.0, 13.0, 7.0, 6.0, 4.0, 6.0, 6.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.28125, -24.477294921875, -23.67333984375, -22.869384765625, -22.0654296875, -21.261474609375, -20.45751953125, -19.653564453125, -18.849609375, -18.045654296875, -17.24169921875, -16.437744140625, -15.6337890625, -14.829833984375, -14.02587890625, -13.221923828125, -12.41796875, -11.614013671875, -10.81005859375, -10.006103515625, -9.2021484375, -8.398193359375, -7.59423828125, -6.790283203125, -5.986328125, -5.182373046875, -4.37841796875, -3.574462890625, -2.7705078125, -1.966552734375, -1.16259765625, -0.358642578125, 0.4453125, 1.249267578125, 2.05322265625, 2.857177734375, 3.6611328125, 4.465087890625, 5.26904296875, 6.072998046875, 6.876953125, 7.680908203125, 8.48486328125, 9.288818359375, 10.0927734375, 10.896728515625, 11.70068359375, 12.504638671875, 13.30859375, 14.112548828125, 14.91650390625, 15.720458984375, 16.5244140625, 17.328369140625, 18.13232421875, 18.936279296875, 19.740234375, 20.544189453125, 21.34814453125, 22.152099609375, 22.9560546875, 23.760009765625, 24.56396484375, 25.367919921875, 26.171875]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 3.0, 7.0, 10.0, 11.0, 12.0, 15.0, 23.0, 24.0, 33.0, 51.0, 48.0, 63.0, 96.0, 105.0, 181.0, 234.0, 352.0, 895.0, 6210.0, 2902215.0, 230535.0, 2800.0, 584.0, 313.0, 200.0, 176.0, 115.0, 81.0, 79.0, 46.0, 39.0, 35.0, 25.0, 22.0, 16.0, 13.0, 7.0, 6.0, 4.0, 5.0, 7.0, 2.0, 3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-58.28125, -56.50634765625, -54.7314453125, -52.95654296875, -51.181640625, -49.40673828125, -47.6318359375, -45.85693359375, -44.08203125, -42.30712890625, -40.5322265625, -38.75732421875, -36.982421875, -35.20751953125, -33.4326171875, -31.65771484375, -29.8828125, -28.10791015625, -26.3330078125, -24.55810546875, -22.783203125, -21.00830078125, -19.2333984375, -17.45849609375, -15.68359375, -13.90869140625, -12.1337890625, -10.35888671875, -8.583984375, -6.80908203125, -5.0341796875, -3.25927734375, -1.484375, 0.29052734375, 2.0654296875, 3.84033203125, 5.615234375, 7.39013671875, 9.1650390625, 10.93994140625, 12.71484375, 14.48974609375, 16.2646484375, 18.03955078125, 19.814453125, 21.58935546875, 23.3642578125, 25.13916015625, 26.9140625, 28.68896484375, 30.4638671875, 32.23876953125, 34.013671875, 35.78857421875, 37.5634765625, 39.33837890625, 41.11328125, 42.88818359375, 44.6630859375, 46.43798828125, 48.212890625, 49.98779296875, 51.7626953125, 53.53759765625, 55.3125]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 6.0, 339.0, 658.0, 15.0, 1.0], "bins": [-474.718017578125, -466.95147705078125, -459.1849060058594, -451.4183654785156, -443.65179443359375, -435.88525390625, -428.11871337890625, -420.3521423339844, -412.5856018066406, -404.8190612792969, -397.052490234375, -389.28594970703125, -381.5193786621094, -373.7528381347656, -365.9862976074219, -358.2197265625, -350.45318603515625, -342.6866455078125, -334.9200744628906, -327.1535339355469, -319.386962890625, -311.62042236328125, -303.8538818359375, -296.0873107910156, -288.3207702636719, -280.5542297363281, -272.78765869140625, -265.0211181640625, -257.2545471191406, -249.48800659179688, -241.72145080566406, -233.95489501953125, -226.18832397460938, -218.42176818847656, -210.65521240234375, -202.888671875, -195.1221160888672, -187.35556030273438, -179.58900451660156, -171.82244873046875, -164.055908203125, -156.2893524169922, -148.52279663085938, -140.75625610351562, -132.9897003173828, -125.22314453125, -117.45658874511719, -109.6900405883789, -101.92349243164062, -94.15693664550781, -86.39038848876953, -78.62383270263672, -70.85728454589844, -63.090728759765625, -55.32417678833008, -47.55762481689453, -39.79106903076172, -32.02451705932617, -24.257965087890625, -16.491411209106445, -8.724859237670898, -0.9583053588867188, 6.808246612548828, 14.574798583984375, 22.34134864807129]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 4.0, 4.0, 13.0, 15.0, 19.0, 23.0, 26.0, 12.0, 22.0, 15.0, 16.0, 26.0, 22.0, 28.0, 29.0, 22.0, 44.0, 32.0, 45.0, 40.0, 38.0, 34.0, 29.0, 46.0, 35.0, 26.0, 31.0, 18.0, 30.0, 35.0, 26.0, 31.0, 18.0, 12.0, 24.0, 21.0, 12.0, 11.0, 11.0, 7.0, 10.0, 9.0, 7.0, 4.0, 6.0, 3.0, 1.0, 4.0, 1.0, 1.0, 4.0, 2.0], "bins": [-52.793060302734375, -51.22348403930664, -49.653907775878906, -48.08433151245117, -46.51475524902344, -44.9451789855957, -43.37560272216797, -41.806026458740234, -40.2364501953125, -38.666873931884766, -37.09729766845703, -35.5277214050293, -33.95814514160156, -32.38856887817383, -30.818992614746094, -29.24941635131836, -27.679840087890625, -26.11026382446289, -24.540687561035156, -22.971111297607422, -21.401535034179688, -19.831958770751953, -18.26238250732422, -16.692806243896484, -15.12322998046875, -13.553653717041016, -11.984077453613281, -10.414501190185547, -8.844924926757812, -7.275348663330078, -5.705772399902344, -4.136196136474609, -2.566619873046875, -0.9970436096191406, 0.5725326538085938, 2.142108917236328, 3.7116851806640625, 5.281261444091797, 6.850837707519531, 8.420413970947266, 9.989990234375, 11.559566497802734, 13.129142761230469, 14.698719024658203, 16.268295288085938, 17.837871551513672, 19.407447814941406, 20.97702407836914, 22.546600341796875, 24.11617660522461, 25.685752868652344, 27.255329132080078, 28.824905395507812, 30.394481658935547, 31.96405792236328, 33.533634185791016, 35.10321044921875, 36.672786712646484, 38.24236297607422, 39.81193923950195, 41.38151550292969, 42.95109176635742, 44.520668029785156, 46.09024429321289, 47.659820556640625]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 1.0, 7.0, 2.0, 6.0, 7.0, 11.0, 10.0, 11.0, 13.0, 18.0, 18.0, 24.0, 24.0, 34.0, 30.0, 27.0, 30.0, 37.0, 52.0, 35.0, 40.0, 40.0, 47.0, 50.0, 39.0, 38.0, 37.0, 31.0, 34.0, 32.0, 31.0, 32.0, 20.0, 20.0, 19.0, 14.0, 18.0, 16.0, 10.0, 5.0, 9.0, 6.0, 9.0, 1.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.49609375, -7.2833251953125, -7.070556640625, -6.8577880859375, -6.64501953125, -6.4322509765625, -6.219482421875, -6.0067138671875, -5.7939453125, -5.5811767578125, -5.368408203125, -5.1556396484375, -4.94287109375, -4.7301025390625, -4.517333984375, -4.3045654296875, -4.091796875, -3.8790283203125, -3.666259765625, -3.4534912109375, -3.24072265625, -3.0279541015625, -2.815185546875, -2.6024169921875, -2.3896484375, -2.1768798828125, -1.964111328125, -1.7513427734375, -1.53857421875, -1.3258056640625, -1.113037109375, -0.9002685546875, -0.6875, -0.4747314453125, -0.261962890625, -0.0491943359375, 0.16357421875, 0.3763427734375, 0.589111328125, 0.8018798828125, 1.0146484375, 1.2274169921875, 1.440185546875, 1.6529541015625, 1.86572265625, 2.0784912109375, 2.291259765625, 2.5040283203125, 2.716796875, 2.9295654296875, 3.142333984375, 3.3551025390625, 3.56787109375, 3.7806396484375, 3.993408203125, 4.2061767578125, 4.4189453125, 4.6317138671875, 4.844482421875, 5.0572509765625, 5.27001953125, 5.4827880859375, 5.695556640625, 5.9083251953125, 6.12109375]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 5.0, 4.0, 6.0, 7.0, 5.0, 10.0, 10.0, 6.0, 15.0, 19.0, 15.0, 21.0, 24.0, 38.0, 35.0, 35.0, 59.0, 94.0, 375.0, 1756.0, 19866.0, 1577238.0, 2555290.0, 36308.0, 2197.0, 413.0, 117.0, 54.0, 40.0, 36.0, 26.0, 20.0, 28.0, 26.0, 19.0, 18.0, 12.0, 13.0, 7.0, 7.0, 6.0, 2.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.71875, -30.814697265625, -29.91064453125, -29.006591796875, -28.1025390625, -27.198486328125, -26.29443359375, -25.390380859375, -24.486328125, -23.582275390625, -22.67822265625, -21.774169921875, -20.8701171875, -19.966064453125, -19.06201171875, -18.157958984375, -17.25390625, -16.349853515625, -15.44580078125, -14.541748046875, -13.6376953125, -12.733642578125, -11.82958984375, -10.925537109375, -10.021484375, -9.117431640625, -8.21337890625, -7.309326171875, -6.4052734375, -5.501220703125, -4.59716796875, -3.693115234375, -2.7890625, -1.885009765625, -0.98095703125, -0.076904296875, 0.8271484375, 1.731201171875, 2.63525390625, 3.539306640625, 4.443359375, 5.347412109375, 6.25146484375, 7.155517578125, 8.0595703125, 8.963623046875, 9.86767578125, 10.771728515625, 11.67578125, 12.579833984375, 13.48388671875, 14.387939453125, 15.2919921875, 16.196044921875, 17.10009765625, 18.004150390625, 18.908203125, 19.812255859375, 20.71630859375, 21.620361328125, 22.5244140625, 23.428466796875, 24.33251953125, 25.236572265625, 26.140625]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 3.0, 5.0, 9.0, 11.0, 19.0, 28.0, 38.0, 49.0, 68.0, 83.0, 114.0, 154.0, 214.0, 286.0, 360.0, 404.0, 449.0, 416.0, 359.0, 258.0, 210.0, 144.0, 109.0, 81.0, 56.0, 36.0, 28.0, 16.0, 20.0, 15.0, 10.0, 4.0, 8.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-15.875, -15.4124755859375, -14.949951171875, -14.4874267578125, -14.02490234375, -13.5623779296875, -13.099853515625, -12.6373291015625, -12.1748046875, -11.7122802734375, -11.249755859375, -10.7872314453125, -10.32470703125, -9.8621826171875, -9.399658203125, -8.9371337890625, -8.474609375, -8.0120849609375, -7.549560546875, -7.0870361328125, -6.62451171875, -6.1619873046875, -5.699462890625, -5.2369384765625, -4.7744140625, -4.3118896484375, -3.849365234375, -3.3868408203125, -2.92431640625, -2.4617919921875, -1.999267578125, -1.5367431640625, -1.07421875, -0.6116943359375, -0.149169921875, 0.3133544921875, 0.77587890625, 1.2384033203125, 1.700927734375, 2.1634521484375, 2.6259765625, 3.0885009765625, 3.551025390625, 4.0135498046875, 4.47607421875, 4.9385986328125, 5.401123046875, 5.8636474609375, 6.326171875, 6.7886962890625, 7.251220703125, 7.7137451171875, 8.17626953125, 8.6387939453125, 9.101318359375, 9.5638427734375, 10.0263671875, 10.4888916015625, 10.951416015625, 11.4139404296875, 11.87646484375, 12.3389892578125, 12.801513671875, 13.2640380859375, 13.7265625]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 7.0, 4.0, 2.0, 5.0, 6.0, 16.0, 24.0, 25.0, 33.0, 51.0, 68.0, 99.0, 170.0, 317.0, 702.0, 5737.0, 4071134.0, 113593.0, 1208.0, 389.0, 242.0, 136.0, 107.0, 51.0, 52.0, 42.0, 23.0, 14.0, 10.0, 4.0, 7.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-106.4375, -103.6884765625, -100.939453125, -98.1904296875, -95.44140625, -92.6923828125, -89.943359375, -87.1943359375, -84.4453125, -81.6962890625, -78.947265625, -76.1982421875, -73.44921875, -70.7001953125, -67.951171875, -65.2021484375, -62.453125, -59.7041015625, -56.955078125, -54.2060546875, -51.45703125, -48.7080078125, -45.958984375, -43.2099609375, -40.4609375, -37.7119140625, -34.962890625, -32.2138671875, -29.46484375, -26.7158203125, -23.966796875, -21.2177734375, -18.46875, -15.7197265625, -12.970703125, -10.2216796875, -7.47265625, -4.7236328125, -1.974609375, 0.7744140625, 3.5234375, 6.2724609375, 9.021484375, 11.7705078125, 14.51953125, 17.2685546875, 20.017578125, 22.7666015625, 25.515625, 28.2646484375, 31.013671875, 33.7626953125, 36.51171875, 39.2607421875, 42.009765625, 44.7587890625, 47.5078125, 50.2568359375, 53.005859375, 55.7548828125, 58.50390625, 61.2529296875, 64.001953125, 66.7509765625, 69.5]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [9.0, 77.0, 344.0, 413.0, 157.0, 20.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.650272369384766, -16.953258514404297, -9.256246566772461, -1.559234619140625, 6.137779235839844, 13.834793090820312, 21.531803131103516, 29.228816986083984, 36.92583084106445, 44.62284469604492, 52.319854736328125, 60.016868591308594, 67.71388244628906, 75.41089630126953, 83.10791015625, 90.80491638183594, 98.50193786621094, 106.1989517211914, 113.89596557617188, 121.59297180175781, 129.2899932861328, 136.98699951171875, 144.68402099609375, 152.3810272216797, 160.07803344726562, 167.77503967285156, 175.47206115722656, 183.1690673828125, 190.8660888671875, 198.56309509277344, 206.26010131835938, 213.95712280273438, 221.65414428710938, 229.3511505126953, 237.0481719970703, 244.74517822265625, 252.44219970703125, 260.13922119140625, 267.8362121582031, 275.5332336425781, 283.2302551269531, 290.9272766113281, 298.624267578125, 306.3212890625, 314.018310546875, 321.71533203125, 329.4123229980469, 337.1093444824219, 344.80633544921875, 352.50335693359375, 360.2003479003906, 367.8973693847656, 375.5943908691406, 383.2914123535156, 390.9884033203125, 398.6854248046875, 406.3824462890625, 414.0794677734375, 421.7764587402344, 429.4734802246094, 437.1705017089844, 444.8675231933594, 452.56451416015625, 460.26153564453125, 467.95855712890625]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 0.0, 2.0, 1.0, 5.0, 6.0, 6.0, 12.0, 10.0, 17.0, 14.0, 22.0, 22.0, 30.0, 20.0, 26.0, 29.0, 38.0, 38.0, 30.0, 39.0, 41.0, 36.0, 34.0, 39.0, 45.0, 45.0, 40.0, 42.0, 31.0, 35.0, 38.0, 29.0, 28.0, 22.0, 25.0, 22.0, 11.0, 11.0, 13.0, 13.0, 6.0, 7.0, 7.0, 4.0, 6.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-50.4613037109375, -48.953128814697266, -47.44495391845703, -45.9367790222168, -44.42860412597656, -42.92042922973633, -41.412254333496094, -39.90407943725586, -38.395904541015625, -36.88772964477539, -35.379554748535156, -33.87137985229492, -32.36320495605469, -30.855030059814453, -29.34685516357422, -27.838680267333984, -26.33050537109375, -24.822330474853516, -23.31415557861328, -21.805980682373047, -20.297805786132812, -18.789630889892578, -17.281455993652344, -15.77328109741211, -14.265106201171875, -12.75693130493164, -11.248756408691406, -9.740581512451172, -8.232406616210938, -6.724231719970703, -5.216056823730469, -3.7078819274902344, -2.19970703125, -0.6915321350097656, 0.8166427612304688, 2.324817657470703, 3.8329925537109375, 5.341167449951172, 6.849342346191406, 8.35751724243164, 9.865692138671875, 11.37386703491211, 12.882041931152344, 14.390216827392578, 15.898391723632812, 17.406566619873047, 18.91474151611328, 20.422916412353516, 21.93109130859375, 23.439266204833984, 24.94744110107422, 26.455615997314453, 27.963790893554688, 29.471965789794922, 30.980140686035156, 32.48831558227539, 33.996490478515625, 35.50466537475586, 37.012840270996094, 38.52101516723633, 40.02919006347656, 41.5373649597168, 43.04553985595703, 44.553714752197266, 46.0618896484375]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 4.0, 4.0, 4.0, 4.0, 5.0, 7.0, 11.0, 10.0, 11.0, 13.0, 12.0, 26.0, 20.0, 31.0, 30.0, 32.0, 23.0, 35.0, 34.0, 38.0, 42.0, 42.0, 35.0, 52.0, 47.0, 51.0, 33.0, 35.0, 34.0, 35.0, 39.0, 21.0, 20.0, 18.0, 16.0, 27.0, 17.0, 15.0, 10.0, 9.0, 9.0, 13.0, 6.0, 6.0, 4.0, 3.0, 2.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.47265625, -6.2723388671875, -6.072021484375, -5.8717041015625, -5.67138671875, -5.4710693359375, -5.270751953125, -5.0704345703125, -4.8701171875, -4.6697998046875, -4.469482421875, -4.2691650390625, -4.06884765625, -3.8685302734375, -3.668212890625, -3.4678955078125, -3.267578125, -3.0672607421875, -2.866943359375, -2.6666259765625, -2.46630859375, -2.2659912109375, -2.065673828125, -1.8653564453125, -1.6650390625, -1.4647216796875, -1.264404296875, -1.0640869140625, -0.86376953125, -0.6634521484375, -0.463134765625, -0.2628173828125, -0.0625, 0.1378173828125, 0.338134765625, 0.5384521484375, 0.73876953125, 0.9390869140625, 1.139404296875, 1.3397216796875, 1.5400390625, 1.7403564453125, 1.940673828125, 2.1409912109375, 2.34130859375, 2.5416259765625, 2.741943359375, 2.9422607421875, 3.142578125, 3.3428955078125, 3.543212890625, 3.7435302734375, 3.94384765625, 4.1441650390625, 4.344482421875, 4.5447998046875, 4.7451171875, 4.9454345703125, 5.145751953125, 5.3460693359375, 5.54638671875, 5.7467041015625, 5.947021484375, 6.1473388671875, 6.34765625]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 13.0, 16.0, 35.0, 53.0, 84.0, 107.0, 168.0, 263.0, 393.0, 598.0, 922.0, 1365.0, 2033.0, 3034.0, 4558.0, 6706.0, 10392.0, 15897.0, 24101.0, 37027.0, 58043.0, 92676.0, 149605.0, 207003.0, 159159.0, 98061.0, 61779.0, 39533.0, 25776.0, 16665.0, 11009.0, 7095.0, 4850.0, 3192.0, 2184.0, 1386.0, 911.0, 669.0, 422.0, 274.0, 176.0, 134.0, 71.0, 42.0, 28.0, 15.0, 14.0, 7.0, 8.0, 1.0, 2.0, 4.0, 2.0, 1.0], "bins": [-0.73779296875, -0.7158126831054688, -0.6938323974609375, -0.6718521118164062, -0.649871826171875, -0.6278915405273438, -0.6059112548828125, -0.5839309692382812, -0.56195068359375, -0.5399703979492188, -0.5179901123046875, -0.49600982666015625, -0.474029541015625, -0.45204925537109375, -0.4300689697265625, -0.40808868408203125, -0.3861083984375, -0.36412811279296875, -0.3421478271484375, -0.32016754150390625, -0.298187255859375, -0.27620697021484375, -0.2542266845703125, -0.23224639892578125, -0.21026611328125, -0.18828582763671875, -0.1663055419921875, -0.14432525634765625, -0.122344970703125, -0.10036468505859375, -0.0783843994140625, -0.05640411376953125, -0.034423828125, -0.01244354248046875, 0.0095367431640625, 0.03151702880859375, 0.053497314453125, 0.07547760009765625, 0.0974578857421875, 0.11943817138671875, 0.14141845703125, 0.16339874267578125, 0.1853790283203125, 0.20735931396484375, 0.229339599609375, 0.25131988525390625, 0.2733001708984375, 0.29528045654296875, 0.3172607421875, 0.33924102783203125, 0.3612213134765625, 0.38320159912109375, 0.405181884765625, 0.42716217041015625, 0.4491424560546875, 0.47112274169921875, 0.49310302734375, 0.5150833129882812, 0.5370635986328125, 0.5590438842773438, 0.581024169921875, 0.6030044555664062, 0.6249847412109375, 0.6469650268554688, 0.6689453125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 1.0, 4.0, 3.0, 6.0, 8.0, 9.0, 15.0, 10.0, 9.0, 11.0, 15.0, 20.0, 19.0, 8.0, 30.0, 22.0, 22.0, 21.0, 30.0, 26.0, 43.0, 29.0, 53.0, 37.0, 31.0, 1063.0, 40.0, 42.0, 36.0, 34.0, 33.0, 38.0, 24.0, 28.0, 26.0, 29.0, 22.0, 18.0, 16.0, 16.0, 19.0, 16.0, 8.0, 2.0, 7.0, 7.0, 3.0, 4.0, 6.0, 7.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.955078125, -3.8316650390625, -3.708251953125, -3.5848388671875, -3.46142578125, -3.3380126953125, -3.214599609375, -3.0911865234375, -2.9677734375, -2.8443603515625, -2.720947265625, -2.5975341796875, -2.47412109375, -2.3507080078125, -2.227294921875, -2.1038818359375, -1.98046875, -1.8570556640625, -1.733642578125, -1.6102294921875, -1.48681640625, -1.3634033203125, -1.239990234375, -1.1165771484375, -0.9931640625, -0.8697509765625, -0.746337890625, -0.6229248046875, -0.49951171875, -0.3760986328125, -0.252685546875, -0.1292724609375, -0.005859375, 0.1175537109375, 0.240966796875, 0.3643798828125, 0.48779296875, 0.6112060546875, 0.734619140625, 0.8580322265625, 0.9814453125, 1.1048583984375, 1.228271484375, 1.3516845703125, 1.47509765625, 1.5985107421875, 1.721923828125, 1.8453369140625, 1.96875, 2.0921630859375, 2.215576171875, 2.3389892578125, 2.46240234375, 2.5858154296875, 2.709228515625, 2.8326416015625, 2.9560546875, 3.0794677734375, 3.202880859375, 3.3262939453125, 3.44970703125, 3.5731201171875, 3.696533203125, 3.8199462890625, 3.943359375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 4.0, 1.0, 9.0, 15.0, 23.0, 26.0, 38.0, 50.0, 77.0, 130.0, 159.0, 247.0, 338.0, 471.0, 664.0, 1003.0, 1462.0, 2079.0, 2994.0, 4319.0, 6527.0, 9440.0, 14062.0, 21109.0, 32195.0, 49283.0, 76655.0, 120753.0, 939335.0, 473089.0, 119265.0, 76048.0, 48673.0, 31942.0, 21116.0, 13888.0, 9288.0, 6261.0, 4339.0, 2999.0, 2059.0, 1327.0, 1042.0, 740.0, 497.0, 337.0, 210.0, 185.0, 126.0, 90.0, 55.0, 34.0, 20.0, 20.0, 13.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.63232421875, -0.6125564575195312, -0.5927886962890625, -0.5730209350585938, -0.553253173828125, -0.5334854125976562, -0.5137176513671875, -0.49394989013671875, -0.47418212890625, -0.45441436767578125, -0.4346466064453125, -0.41487884521484375, -0.395111083984375, -0.37534332275390625, -0.3555755615234375, -0.33580780029296875, -0.3160400390625, -0.29627227783203125, -0.2765045166015625, -0.25673675537109375, -0.236968994140625, -0.21720123291015625, -0.1974334716796875, -0.17766571044921875, -0.15789794921875, -0.13813018798828125, -0.1183624267578125, -0.09859466552734375, -0.078826904296875, -0.05905914306640625, -0.0392913818359375, -0.01952362060546875, 0.000244140625, 0.02001190185546875, 0.0397796630859375, 0.05954742431640625, 0.079315185546875, 0.09908294677734375, 0.1188507080078125, 0.13861846923828125, 0.15838623046875, 0.17815399169921875, 0.1979217529296875, 0.21768951416015625, 0.237457275390625, 0.25722503662109375, 0.2769927978515625, 0.29676055908203125, 0.3165283203125, 0.33629608154296875, 0.3560638427734375, 0.37583160400390625, 0.395599365234375, 0.41536712646484375, 0.4351348876953125, 0.45490264892578125, 0.47467041015625, 0.49443817138671875, 0.5142059326171875, 0.5339736938476562, 0.553741455078125, 0.5735092163085938, 0.5932769775390625, 0.6130447387695312, 0.6328125]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 4.0, 7.0, 9.0, 9.0, 8.0, 17.0, 23.0, 34.0, 39.0, 46.0, 54.0, 53.0, 69.0, 82.0, 78.0, 72.0, 64.0, 62.0, 54.0, 44.0, 38.0, 35.0, 22.0, 13.0, 16.0, 15.0, 8.0, 9.0, 2.0, 2.0, 6.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0028514862060546875, -0.0027438104152679443, -0.002636134624481201, -0.002528458833694458, -0.002420783042907715, -0.0023131072521209717, -0.0022054314613342285, -0.0020977556705474854, -0.001990079879760742, -0.001882404088973999, -0.0017747282981872559, -0.0016670525074005127, -0.0015593767166137695, -0.0014517009258270264, -0.0013440251350402832, -0.00123634934425354, -0.0011286735534667969, -0.0010209977626800537, -0.0009133219718933105, -0.0008056461811065674, -0.0006979703903198242, -0.0005902945995330811, -0.0004826188087463379, -0.0003749430179595947, -0.00026726722717285156, -0.0001595914363861084, -5.1915645599365234e-05, 5.576014518737793e-05, 0.0001634359359741211, 0.00027111172676086426, 0.0003787875175476074, 0.0004864633083343506, 0.0005941390991210938, 0.0007018148899078369, 0.0008094906806945801, 0.0009171664714813232, 0.0010248422622680664, 0.0011325180530548096, 0.0012401938438415527, 0.001347869634628296, 0.001455545425415039, 0.0015632212162017822, 0.0016708970069885254, 0.0017785727977752686, 0.0018862485885620117, 0.001993924379348755, 0.002101600170135498, 0.002209275960922241, 0.0023169517517089844, 0.0024246275424957275, 0.0025323033332824707, 0.002639979124069214, 0.002747654914855957, 0.0028553307056427, 0.0029630064964294434, 0.0030706822872161865, 0.0031783580780029297, 0.003286033868789673, 0.003393709659576416, 0.003501385450363159, 0.0036090612411499023, 0.0037167370319366455, 0.0038244128227233887, 0.003932088613510132, 0.004039764404296875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 6.0, 4.0, 10.0, 15.0, 16.0, 17.0, 28.0, 33.0, 45.0, 64.0, 118.0, 155.0, 682.0, 224084.0, 821902.0, 798.0, 196.0, 94.0, 87.0, 45.0, 26.0, 35.0, 23.0, 12.0, 8.0, 14.0, 10.0, 7.0, 2.0, 0.0, 3.0, 6.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1036376953125, -0.10076332092285156, -0.09788894653320312, -0.09501457214355469, -0.09214019775390625, -0.08926582336425781, -0.08639144897460938, -0.08351707458496094, -0.0806427001953125, -0.07776832580566406, -0.07489395141601562, -0.07201957702636719, -0.06914520263671875, -0.06627082824707031, -0.06339645385742188, -0.06052207946777344, -0.057647705078125, -0.05477333068847656, -0.051898956298828125, -0.04902458190917969, -0.04615020751953125, -0.04327583312988281, -0.040401458740234375, -0.03752708435058594, -0.0346527099609375, -0.03177833557128906, -0.028903961181640625, -0.026029586791992188, -0.02315521240234375, -0.020280838012695312, -0.017406463623046875, -0.014532089233398438, -0.01165771484375, -0.008783340454101562, -0.005908966064453125, -0.0030345916748046875, -0.00016021728515625, 0.0027141571044921875, 0.005588531494140625, 0.008462905883789062, 0.0113372802734375, 0.014211654663085938, 0.017086029052734375, 0.019960403442382812, 0.02283477783203125, 0.025709152221679688, 0.028583526611328125, 0.03145790100097656, 0.034332275390625, 0.03720664978027344, 0.040081024169921875, 0.04295539855957031, 0.04582977294921875, 0.04870414733886719, 0.051578521728515625, 0.05445289611816406, 0.0573272705078125, 0.06020164489746094, 0.06307601928710938, 0.06595039367675781, 0.06882476806640625, 0.07169914245605469, 0.07457351684570312, 0.07744789123535156, 0.080322265625]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 14.0, 359.0, 611.0, 31.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.014790809713304043, -0.014448071829974651, -0.014105333015322685, -0.013762595131993294, -0.013419857248663902, -0.013077118434011936, -0.012734380550682545, -0.012391641736030579, -0.012048903852701187, -0.011706165969371796, -0.01136342715471983, -0.011020689271390438, -0.010677950456738472, -0.01033521257340908, -0.009992474690079689, -0.009649736806750298, -0.009306997992098331, -0.00896426010876894, -0.008621521294116974, -0.008278783410787582, -0.007936045527458191, -0.007593306712806225, -0.007250568829476833, -0.0069078304804861546, -0.006565092131495476, -0.006222353782504797, -0.005879615433514118, -0.005536877550184727, -0.005194139201194048, -0.004851400852203369, -0.004508662968873978, -0.004165924619883299, -0.00382318627089262, -0.0034804479219019413, -0.003137709805741906, -0.002794971689581871, -0.0024522333405911922, -0.0021094949916005135, -0.0017667568754404783, -0.0014240187592804432, -0.0010812804102897644, -0.0007385421777144074, -0.0003958039451390505, -5.3065712563693523e-05, 0.00028967252001166344, 0.0006324107525870204, 0.0009751489851623774, 0.0013178871013224125, 0.0016606254503130913, 0.00200336379930377, 0.002346101915463805, 0.0026888400316238403, 0.003031578380614519, 0.003374316729605198, 0.003717054845765233, 0.004059792961925268, 0.004402531310915947, 0.004745269659906626, 0.0050880080088973045, 0.005430745892226696, 0.005773484241217375, 0.006116222590208054, 0.006458960473537445, 0.006801698822528124, 0.007144437171518803]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 7.0, 2.0, 12.0, 4.0, 11.0, 12.0, 15.0, 16.0, 10.0, 9.0, 21.0, 19.0, 32.0, 30.0, 27.0, 31.0, 30.0, 49.0, 50.0, 36.0, 36.0, 46.0, 34.0, 43.0, 41.0, 34.0, 39.0, 36.0, 28.0, 33.0, 30.0, 25.0, 30.0, 22.0, 19.0, 15.0, 14.0, 10.0, 16.0, 10.0, 5.0, 5.0, 8.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012925267219543457, -0.0012477543205022812, -0.0012029819190502167, -0.0011582095175981522, -0.0011134371161460876, -0.0010686647146940231, -0.0010238923132419586, -0.000979119911789894, -0.0009343475103378296, -0.0008895751088857651, -0.0008448027074337006, -0.000800030305981636, -0.0007552579045295715, -0.000710485503077507, -0.0006657131016254425, -0.000620940700173378, -0.0005761682987213135, -0.000531395897269249, -0.00048662349581718445, -0.00044185109436511993, -0.0003970786929130554, -0.0003523062914609909, -0.0003075338900089264, -0.0002627614885568619, -0.00021798908710479736, -0.00017321668565273285, -0.00012844428420066833, -8.367188274860382e-05, -3.889948129653931e-05, 5.8729201555252075e-06, 5.064532160758972e-05, 9.541772305965424e-05, 0.00014019012451171875, 0.00018496252596378326, 0.00022973492741584778, 0.0002745073288679123, 0.0003192797303199768, 0.0003640521317720413, 0.00040882453322410583, 0.00045359693467617035, 0.0004983693361282349, 0.0005431417375802994, 0.0005879141390323639, 0.0006326865404844284, 0.0006774589419364929, 0.0007222313433885574, 0.000767003744840622, 0.0008117761462926865, 0.000856548547744751, 0.0009013209491968155, 0.00094609335064888, 0.0009908657521009445, 0.001035638153553009, 0.0010804105550050735, 0.001125182956457138, 0.0011699553579092026, 0.001214727759361267, 0.0012595001608133316, 0.0013042725622653961, 0.0013490449637174606, 0.0013938173651695251, 0.0014385897666215897, 0.0014833621680736542, 0.0015281345695257187, 0.0015729069709777832]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 4.0, 4.0, 4.0, 4.0, 5.0, 7.0, 11.0, 10.0, 11.0, 13.0, 12.0, 26.0, 20.0, 30.0, 31.0, 32.0, 23.0, 35.0, 34.0, 38.0, 42.0, 42.0, 35.0, 52.0, 47.0, 51.0, 33.0, 35.0, 34.0, 35.0, 39.0, 21.0, 20.0, 18.0, 16.0, 27.0, 17.0, 15.0, 10.0, 9.0, 9.0, 13.0, 6.0, 6.0, 4.0, 3.0, 2.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.47265625, -6.2723388671875, -6.072021484375, -5.8717041015625, -5.67138671875, -5.4710693359375, -5.270751953125, -5.0704345703125, -4.8701171875, -4.6697998046875, -4.469482421875, -4.2691650390625, -4.06884765625, -3.8685302734375, -3.668212890625, -3.4678955078125, -3.267578125, -3.0672607421875, -2.866943359375, -2.6666259765625, -2.46630859375, -2.2659912109375, -2.065673828125, -1.8653564453125, -1.6650390625, -1.4647216796875, -1.264404296875, -1.0640869140625, -0.86376953125, -0.6634521484375, -0.463134765625, -0.2628173828125, -0.0625, 0.1378173828125, 0.338134765625, 0.5384521484375, 0.73876953125, 0.9390869140625, 1.139404296875, 1.3397216796875, 1.5400390625, 1.7403564453125, 1.940673828125, 2.1409912109375, 2.34130859375, 2.5416259765625, 2.741943359375, 2.9422607421875, 3.142578125, 3.3428955078125, 3.543212890625, 3.7435302734375, 3.94384765625, 4.1441650390625, 4.344482421875, 4.5447998046875, 4.7451171875, 4.9454345703125, 5.145751953125, 5.3460693359375, 5.54638671875, 5.7467041015625, 5.947021484375, 6.1473388671875, 6.34765625]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 7.0, 10.0, 5.0, 14.0, 10.0, 36.0, 40.0, 58.0, 91.0, 114.0, 159.0, 272.0, 347.0, 608.0, 896.0, 1485.0, 2668.0, 4771.0, 9285.0, 18622.0, 39187.0, 88451.0, 218780.0, 376752.0, 157974.0, 66586.0, 30148.0, 14256.0, 7152.0, 4028.0, 2109.0, 1316.0, 785.0, 505.0, 318.0, 220.0, 136.0, 95.0, 75.0, 59.0, 38.0, 25.0, 21.0, 11.0, 14.0, 6.0, 2.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.80078125, -4.6370849609375, -4.473388671875, -4.3096923828125, -4.14599609375, -3.9822998046875, -3.818603515625, -3.6549072265625, -3.4912109375, -3.3275146484375, -3.163818359375, -3.0001220703125, -2.83642578125, -2.6727294921875, -2.509033203125, -2.3453369140625, -2.181640625, -2.0179443359375, -1.854248046875, -1.6905517578125, -1.52685546875, -1.3631591796875, -1.199462890625, -1.0357666015625, -0.8720703125, -0.7083740234375, -0.544677734375, -0.3809814453125, -0.21728515625, -0.0535888671875, 0.110107421875, 0.2738037109375, 0.4375, 0.6011962890625, 0.764892578125, 0.9285888671875, 1.09228515625, 1.2559814453125, 1.419677734375, 1.5833740234375, 1.7470703125, 1.9107666015625, 2.074462890625, 2.2381591796875, 2.40185546875, 2.5655517578125, 2.729248046875, 2.8929443359375, 3.056640625, 3.2203369140625, 3.384033203125, 3.5477294921875, 3.71142578125, 3.8751220703125, 4.038818359375, 4.2025146484375, 4.3662109375, 4.5299072265625, 4.693603515625, 4.8572998046875, 5.02099609375, 5.1846923828125, 5.348388671875, 5.5120849609375, 5.67578125]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 7.0, 9.0, 8.0, 8.0, 8.0, 9.0, 13.0, 17.0, 25.0, 42.0, 34.0, 33.0, 37.0, 25.0, 42.0, 49.0, 65.0, 87.0, 268.0, 1577.0, 176.0, 91.0, 66.0, 44.0, 27.0, 43.0, 31.0, 29.0, 29.0, 30.0, 17.0, 20.0, 12.0, 13.0, 11.0, 7.0, 7.0, 10.0, 10.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.671875, -22.960693359375, -22.24951171875, -21.538330078125, -20.8271484375, -20.115966796875, -19.40478515625, -18.693603515625, -17.982421875, -17.271240234375, -16.56005859375, -15.848876953125, -15.1376953125, -14.426513671875, -13.71533203125, -13.004150390625, -12.29296875, -11.581787109375, -10.87060546875, -10.159423828125, -9.4482421875, -8.737060546875, -8.02587890625, -7.314697265625, -6.603515625, -5.892333984375, -5.18115234375, -4.469970703125, -3.7587890625, -3.047607421875, -2.33642578125, -1.625244140625, -0.9140625, -0.202880859375, 0.50830078125, 1.219482421875, 1.9306640625, 2.641845703125, 3.35302734375, 4.064208984375, 4.775390625, 5.486572265625, 6.19775390625, 6.908935546875, 7.6201171875, 8.331298828125, 9.04248046875, 9.753662109375, 10.46484375, 11.176025390625, 11.88720703125, 12.598388671875, 13.3095703125, 14.020751953125, 14.73193359375, 15.443115234375, 16.154296875, 16.865478515625, 17.57666015625, 18.287841796875, 18.9990234375, 19.710205078125, 20.42138671875, 21.132568359375, 21.84375]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 6.0, 4.0, 7.0, 8.0, 16.0, 26.0, 26.0, 30.0, 53.0, 71.0, 101.0, 145.0, 222.0, 322.0, 636.0, 4928.0, 3094396.0, 42413.0, 1097.0, 396.0, 252.0, 174.0, 114.0, 81.0, 49.0, 32.0, 25.0, 21.0, 17.0, 16.0, 8.0, 6.0, 6.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.8125, -72.4521484375, -70.091796875, -67.7314453125, -65.37109375, -63.0107421875, -60.650390625, -58.2900390625, -55.9296875, -53.5693359375, -51.208984375, -48.8486328125, -46.48828125, -44.1279296875, -41.767578125, -39.4072265625, -37.046875, -34.6865234375, -32.326171875, -29.9658203125, -27.60546875, -25.2451171875, -22.884765625, -20.5244140625, -18.1640625, -15.8037109375, -13.443359375, -11.0830078125, -8.72265625, -6.3623046875, -4.001953125, -1.6416015625, 0.71875, 3.0791015625, 5.439453125, 7.7998046875, 10.16015625, 12.5205078125, 14.880859375, 17.2412109375, 19.6015625, 21.9619140625, 24.322265625, 26.6826171875, 29.04296875, 31.4033203125, 33.763671875, 36.1240234375, 38.484375, 40.8447265625, 43.205078125, 45.5654296875, 47.92578125, 50.2861328125, 52.646484375, 55.0068359375, 57.3671875, 59.7275390625, 62.087890625, 64.4482421875, 66.80859375, 69.1689453125, 71.529296875, 73.8896484375, 76.25]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 14.0, 37.0, 76.0, 166.0, 222.0, 210.0, 156.0, 89.0, 30.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.444358825683594, -37.860782623291016, -36.27720642089844, -34.69363021850586, -33.11005401611328, -31.526477813720703, -29.942901611328125, -28.359325408935547, -26.77574920654297, -25.19217300415039, -23.608596801757812, -22.025020599365234, -20.441444396972656, -18.857868194580078, -17.2742919921875, -15.690715789794922, -14.107139587402344, -12.523563385009766, -10.939987182617188, -9.35641098022461, -7.772834777832031, -6.189258575439453, -4.605682373046875, -3.022106170654297, -1.4385299682617188, 0.14504623413085938, 1.7286224365234375, 3.3121986389160156, 4.895774841308594, 6.479351043701172, 8.06292724609375, 9.646503448486328, 11.230079650878906, 12.813655853271484, 14.397232055664062, 15.98080825805664, 17.56438446044922, 19.147960662841797, 20.731536865234375, 22.315113067626953, 23.89868927001953, 25.48226547241211, 27.065841674804688, 28.649417877197266, 30.232994079589844, 31.816570281982422, 33.400146484375, 34.98372268676758, 36.567298889160156, 38.150875091552734, 39.73445129394531, 41.31802749633789, 42.90160369873047, 44.48517990112305, 46.068756103515625, 47.6523323059082, 49.23590850830078, 50.81948471069336, 52.40306091308594, 53.986637115478516, 55.570213317871094, 57.15378952026367, 58.73736572265625, 60.32094192504883, 61.904518127441406]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 4.0, 6.0, 3.0, 9.0, 6.0, 6.0, 6.0, 5.0, 14.0, 17.0, 15.0, 18.0, 13.0, 28.0, 20.0, 18.0, 25.0, 34.0, 37.0, 23.0, 29.0, 36.0, 30.0, 31.0, 42.0, 40.0, 39.0, 35.0, 38.0, 35.0, 26.0, 33.0, 33.0, 30.0, 14.0, 27.0, 23.0, 30.0, 15.0, 18.0, 11.0, 18.0, 17.0, 9.0, 14.0, 5.0, 5.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0], "bins": [-57.89659118652344, -56.148014068603516, -54.39943313598633, -52.650856018066406, -50.902278900146484, -49.15370178222656, -47.405120849609375, -45.65654373168945, -43.90796661376953, -42.15938949584961, -40.41080856323242, -38.6622314453125, -36.91365432739258, -35.165077209472656, -33.41649627685547, -31.667919158935547, -29.91933822631836, -28.170759201049805, -26.422182083129883, -24.673603057861328, -22.925025939941406, -21.17644691467285, -19.427867889404297, -17.679290771484375, -15.93071174621582, -14.182133674621582, -12.433555603027344, -10.684976577758789, -8.93639850616455, -7.1878204345703125, -5.439241409301758, -3.6906633377075195, -1.9420890808105469, -0.1935107707977295, 1.555067539215088, 3.3036460876464844, 5.052224159240723, 6.800802230834961, 8.549381256103516, 10.297959327697754, 12.046537399291992, 13.79511547088623, 15.543693542480469, 17.292272567749023, 19.040851593017578, 20.7894287109375, 22.538007736206055, 24.28658676147461, 26.03516387939453, 27.783742904663086, 29.532320022583008, 31.280899047851562, 33.029476165771484, 34.778053283691406, 36.526634216308594, 38.275211334228516, 40.02378845214844, 41.77236557006836, 43.52094650268555, 45.26952362060547, 47.01810073852539, 48.76667785644531, 50.5152587890625, 52.26383590698242, 54.01241683959961]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 3.0, 5.0, 1.0, 4.0, 1.0, 7.0, 8.0, 10.0, 6.0, 7.0, 9.0, 19.0, 13.0, 18.0, 25.0, 32.0, 26.0, 34.0, 33.0, 32.0, 43.0, 35.0, 47.0, 55.0, 49.0, 50.0, 44.0, 50.0, 32.0, 31.0, 36.0, 28.0, 35.0, 27.0, 19.0, 24.0, 20.0, 20.0, 9.0, 12.0, 11.0, 10.0, 7.0, 5.0, 7.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.2109375, -6.9835205078125, -6.756103515625, -6.5286865234375, -6.30126953125, -6.0738525390625, -5.846435546875, -5.6190185546875, -5.3916015625, -5.1641845703125, -4.936767578125, -4.7093505859375, -4.48193359375, -4.2545166015625, -4.027099609375, -3.7996826171875, -3.572265625, -3.3448486328125, -3.117431640625, -2.8900146484375, -2.66259765625, -2.4351806640625, -2.207763671875, -1.9803466796875, -1.7529296875, -1.5255126953125, -1.298095703125, -1.0706787109375, -0.84326171875, -0.6158447265625, -0.388427734375, -0.1610107421875, 0.06640625, 0.2938232421875, 0.521240234375, 0.7486572265625, 0.97607421875, 1.2034912109375, 1.430908203125, 1.6583251953125, 1.8857421875, 2.1131591796875, 2.340576171875, 2.5679931640625, 2.79541015625, 3.0228271484375, 3.250244140625, 3.4776611328125, 3.705078125, 3.9324951171875, 4.159912109375, 4.3873291015625, 4.61474609375, 4.8421630859375, 5.069580078125, 5.2969970703125, 5.5244140625, 5.7518310546875, 5.979248046875, 6.2066650390625, 6.43408203125, 6.6614990234375, 6.888916015625, 7.1163330078125, 7.34375]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 5.0, 3.0, 2.0, 3.0, 1.0, 4.0, 5.0, 9.0, 6.0, 5.0, 13.0, 17.0, 13.0, 19.0, 14.0, 23.0, 32.0, 27.0, 44.0, 83.0, 187.0, 382.0, 1289.0, 8848.0, 305545.0, 3514531.0, 351743.0, 9301.0, 1239.0, 417.0, 149.0, 81.0, 35.0, 34.0, 25.0, 37.0, 19.0, 21.0, 15.0, 13.0, 8.0, 6.0, 9.0, 5.0, 11.0, 5.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.328125, -23.50390625, -22.6796875, -21.85546875, -21.03125, -20.20703125, -19.3828125, -18.55859375, -17.734375, -16.91015625, -16.0859375, -15.26171875, -14.4375, -13.61328125, -12.7890625, -11.96484375, -11.140625, -10.31640625, -9.4921875, -8.66796875, -7.84375, -7.01953125, -6.1953125, -5.37109375, -4.546875, -3.72265625, -2.8984375, -2.07421875, -1.25, -0.42578125, 0.3984375, 1.22265625, 2.046875, 2.87109375, 3.6953125, 4.51953125, 5.34375, 6.16796875, 6.9921875, 7.81640625, 8.640625, 9.46484375, 10.2890625, 11.11328125, 11.9375, 12.76171875, 13.5859375, 14.41015625, 15.234375, 16.05859375, 16.8828125, 17.70703125, 18.53125, 19.35546875, 20.1796875, 21.00390625, 21.828125, 22.65234375, 23.4765625, 24.30078125, 25.125, 25.94921875, 26.7734375, 27.59765625, 28.421875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 10.0, 3.0, 9.0, 13.0, 24.0, 19.0, 29.0, 35.0, 54.0, 87.0, 108.0, 136.0, 182.0, 285.0, 352.0, 433.0, 522.0, 430.0, 365.0, 280.0, 179.0, 136.0, 87.0, 76.0, 68.0, 34.0, 32.0, 27.0, 16.0, 14.0, 14.0, 7.0, 1.0, 4.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.9296875, -14.4403076171875, -13.950927734375, -13.4615478515625, -12.97216796875, -12.4827880859375, -11.993408203125, -11.5040283203125, -11.0146484375, -10.5252685546875, -10.035888671875, -9.5465087890625, -9.05712890625, -8.5677490234375, -8.078369140625, -7.5889892578125, -7.099609375, -6.6102294921875, -6.120849609375, -5.6314697265625, -5.14208984375, -4.6527099609375, -4.163330078125, -3.6739501953125, -3.1845703125, -2.6951904296875, -2.205810546875, -1.7164306640625, -1.22705078125, -0.7376708984375, -0.248291015625, 0.2410888671875, 0.73046875, 1.2198486328125, 1.709228515625, 2.1986083984375, 2.68798828125, 3.1773681640625, 3.666748046875, 4.1561279296875, 4.6455078125, 5.1348876953125, 5.624267578125, 6.1136474609375, 6.60302734375, 7.0924072265625, 7.581787109375, 8.0711669921875, 8.560546875, 9.0499267578125, 9.539306640625, 10.0286865234375, 10.51806640625, 11.0074462890625, 11.496826171875, 11.9862060546875, 12.4755859375, 12.9649658203125, 13.454345703125, 13.9437255859375, 14.43310546875, 14.9224853515625, 15.411865234375, 15.9012451171875, 16.390625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 4.0, 5.0, 4.0, 7.0, 13.0, 11.0, 21.0, 21.0, 38.0, 29.0, 38.0, 51.0, 58.0, 79.0, 87.0, 120.0, 144.0, 171.0, 273.0, 408.0, 806.0, 8001.0, 2452483.0, 1722537.0, 6531.0, 779.0, 395.0, 255.0, 206.0, 148.0, 121.0, 86.0, 75.0, 53.0, 44.0, 25.0, 41.0, 22.0, 20.0, 14.0, 18.0, 11.0, 6.0, 7.0, 4.0, 5.0, 1.0, 1.0, 4.0, 4.0, 1.0, 1.0, 2.0], "bins": [-61.9375, -60.1142578125, -58.291015625, -56.4677734375, -54.64453125, -52.8212890625, -50.998046875, -49.1748046875, -47.3515625, -45.5283203125, -43.705078125, -41.8818359375, -40.05859375, -38.2353515625, -36.412109375, -34.5888671875, -32.765625, -30.9423828125, -29.119140625, -27.2958984375, -25.47265625, -23.6494140625, -21.826171875, -20.0029296875, -18.1796875, -16.3564453125, -14.533203125, -12.7099609375, -10.88671875, -9.0634765625, -7.240234375, -5.4169921875, -3.59375, -1.7705078125, 0.052734375, 1.8759765625, 3.69921875, 5.5224609375, 7.345703125, 9.1689453125, 10.9921875, 12.8154296875, 14.638671875, 16.4619140625, 18.28515625, 20.1083984375, 21.931640625, 23.7548828125, 25.578125, 27.4013671875, 29.224609375, 31.0478515625, 32.87109375, 34.6943359375, 36.517578125, 38.3408203125, 40.1640625, 41.9873046875, 43.810546875, 45.6337890625, 47.45703125, 49.2802734375, 51.103515625, 52.9267578125, 54.75]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 126.0, 808.0, 80.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-666.2037353515625, -649.3263549804688, -632.448974609375, -615.5716552734375, -598.6942749023438, -581.81689453125, -564.9395141601562, -548.0621337890625, -531.1847534179688, -514.307373046875, -497.4300231933594, -480.5526428222656, -463.6752624511719, -446.79791259765625, -429.9205322265625, -413.04315185546875, -396.1658020019531, -379.2884216308594, -362.41107177734375, -345.53369140625, -328.65631103515625, -311.7789306640625, -294.9015808105469, -278.0242004394531, -261.1468505859375, -244.2694854736328, -227.39210510253906, -210.51473999023438, -193.63735961914062, -176.75999450683594, -159.88262939453125, -143.0052490234375, -126.12786865234375, -109.25049591064453, -92.37312316894531, -75.49575805664062, -58.618385314941406, -41.74101257324219, -24.8636474609375, -7.986274719238281, 8.891098022460938, 25.768468856811523, 42.64583969116211, 59.52320861816406, 76.40058135986328, 93.2779541015625, 110.15531921386719, 127.0326919555664, 143.91006469726562, 160.7874298095703, 177.66481018066406, 194.54217529296875, 211.4195556640625, 228.2969207763672, 245.17428588867188, 262.0516662597656, 278.92901611328125, 295.806396484375, 312.6837463378906, 329.5611267089844, 346.4385070800781, 363.31585693359375, 380.1932373046875, 397.07061767578125, 413.947998046875]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 6.0, 4.0, 10.0, 13.0, 5.0, 11.0, 12.0, 9.0, 17.0, 19.0, 23.0, 27.0, 30.0, 32.0, 37.0, 38.0, 38.0, 42.0, 34.0, 34.0, 42.0, 42.0, 41.0, 44.0, 39.0, 35.0, 42.0, 32.0, 29.0, 28.0, 22.0, 30.0, 28.0, 20.0, 21.0, 11.0, 12.0, 7.0, 9.0, 5.0, 11.0, 6.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-50.709136962890625, -49.12135314941406, -47.533565521240234, -45.945777893066406, -44.357994079589844, -42.77021026611328, -41.18242263793945, -39.594635009765625, -38.00685119628906, -36.4190673828125, -34.83127975463867, -33.243492126464844, -31.65570831298828, -30.067922592163086, -28.48013687133789, -26.892351150512695, -25.3045654296875, -23.716779708862305, -22.12899398803711, -20.541208267211914, -18.95342254638672, -17.365636825561523, -15.777851104736328, -14.190065383911133, -12.602279663085938, -11.014493942260742, -9.426708221435547, -7.838922500610352, -6.251136779785156, -4.663351058959961, -3.0755653381347656, -1.4877796173095703, 0.10000991821289062, 1.687795639038086, 3.2755813598632812, 4.863367080688477, 6.451152801513672, 8.038938522338867, 9.626724243164062, 11.214509963989258, 12.802295684814453, 14.390081405639648, 15.977867126464844, 17.56565284729004, 19.153438568115234, 20.74122428894043, 22.329010009765625, 23.91679573059082, 25.504581451416016, 27.09236717224121, 28.680152893066406, 30.2679386138916, 31.855724334716797, 33.443511962890625, 35.03129577636719, 36.61907958984375, 38.20686721801758, 39.794654846191406, 41.38243865966797, 42.97022247314453, 44.55801010131836, 46.14579772949219, 47.73358154296875, 49.32136535644531, 50.90915298461914]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 3.0, 2.0, 4.0, 2.0, 3.0, 1.0, 6.0, 9.0, 4.0, 3.0, 6.0, 11.0, 14.0, 20.0, 31.0, 18.0, 29.0, 21.0, 25.0, 32.0, 32.0, 34.0, 41.0, 40.0, 38.0, 46.0, 45.0, 43.0, 37.0, 33.0, 41.0, 41.0, 40.0, 27.0, 35.0, 24.0, 25.0, 16.0, 20.0, 12.0, 21.0, 15.0, 8.0, 8.0, 7.0, 10.0, 9.0, 4.0, 2.0, 7.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.30859375, -6.09613037109375, -5.8836669921875, -5.67120361328125, -5.458740234375, -5.24627685546875, -5.0338134765625, -4.82135009765625, -4.60888671875, -4.39642333984375, -4.1839599609375, -3.97149658203125, -3.759033203125, -3.54656982421875, -3.3341064453125, -3.12164306640625, -2.9091796875, -2.69671630859375, -2.4842529296875, -2.27178955078125, -2.059326171875, -1.84686279296875, -1.6343994140625, -1.42193603515625, -1.20947265625, -0.99700927734375, -0.7845458984375, -0.57208251953125, -0.359619140625, -0.14715576171875, 0.0653076171875, 0.27777099609375, 0.490234375, 0.70269775390625, 0.9151611328125, 1.12762451171875, 1.340087890625, 1.55255126953125, 1.7650146484375, 1.97747802734375, 2.18994140625, 2.40240478515625, 2.6148681640625, 2.82733154296875, 3.039794921875, 3.25225830078125, 3.4647216796875, 3.67718505859375, 3.8896484375, 4.10211181640625, 4.3145751953125, 4.52703857421875, 4.739501953125, 4.95196533203125, 5.1644287109375, 5.37689208984375, 5.58935546875, 5.80181884765625, 6.0142822265625, 6.22674560546875, 6.439208984375, 6.65167236328125, 6.8641357421875, 7.07659912109375, 7.2890625]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 5.0, 4.0, 9.0, 13.0, 8.0, 15.0, 34.0, 33.0, 62.0, 101.0, 159.0, 199.0, 257.0, 368.0, 571.0, 775.0, 1197.0, 1817.0, 2612.0, 3735.0, 5782.0, 8711.0, 13512.0, 20590.0, 32359.0, 49988.0, 79980.0, 128146.0, 194834.0, 183455.0, 116178.0, 72263.0, 45612.0, 29371.0, 19133.0, 12209.0, 8045.0, 5192.0, 3607.0, 2453.0, 1598.0, 1102.0, 777.0, 538.0, 353.0, 251.0, 160.0, 135.0, 79.0, 53.0, 39.0, 32.0, 21.0, 14.0, 11.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.71142578125, -0.6884002685546875, -0.665374755859375, -0.6423492431640625, -0.61932373046875, -0.5962982177734375, -0.573272705078125, -0.5502471923828125, -0.5272216796875, -0.5041961669921875, -0.481170654296875, -0.4581451416015625, -0.43511962890625, -0.4120941162109375, -0.389068603515625, -0.3660430908203125, -0.343017578125, -0.3199920654296875, -0.296966552734375, -0.2739410400390625, -0.25091552734375, -0.2278900146484375, -0.204864501953125, -0.1818389892578125, -0.1588134765625, -0.1357879638671875, -0.112762451171875, -0.0897369384765625, -0.06671142578125, -0.0436859130859375, -0.020660400390625, 0.0023651123046875, 0.025390625, 0.0484161376953125, 0.071441650390625, 0.0944671630859375, 0.11749267578125, 0.1405181884765625, 0.163543701171875, 0.1865692138671875, 0.2095947265625, 0.2326202392578125, 0.255645751953125, 0.2786712646484375, 0.30169677734375, 0.3247222900390625, 0.347747802734375, 0.3707733154296875, 0.393798828125, 0.4168243408203125, 0.439849853515625, 0.4628753662109375, 0.48590087890625, 0.5089263916015625, 0.531951904296875, 0.5549774169921875, 0.5780029296875, 0.6010284423828125, 0.624053955078125, 0.6470794677734375, 0.67010498046875, 0.6931304931640625, 0.716156005859375, 0.7391815185546875, 0.76220703125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 2.0, 6.0, 4.0, 7.0, 3.0, 8.0, 9.0, 8.0, 12.0, 20.0, 18.0, 21.0, 29.0, 25.0, 41.0, 25.0, 51.0, 36.0, 36.0, 41.0, 48.0, 1076.0, 51.0, 56.0, 44.0, 35.0, 38.0, 38.0, 48.0, 28.0, 28.0, 25.0, 24.0, 23.0, 15.0, 15.0, 8.0, 8.0, 5.0, 5.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.77734375, -4.6171875, -4.45703125, -4.296875, -4.13671875, -3.9765625, -3.81640625, -3.65625, -3.49609375, -3.3359375, -3.17578125, -3.015625, -2.85546875, -2.6953125, -2.53515625, -2.375, -2.21484375, -2.0546875, -1.89453125, -1.734375, -1.57421875, -1.4140625, -1.25390625, -1.09375, -0.93359375, -0.7734375, -0.61328125, -0.453125, -0.29296875, -0.1328125, 0.02734375, 0.1875, 0.34765625, 0.5078125, 0.66796875, 0.828125, 0.98828125, 1.1484375, 1.30859375, 1.46875, 1.62890625, 1.7890625, 1.94921875, 2.109375, 2.26953125, 2.4296875, 2.58984375, 2.75, 2.91015625, 3.0703125, 3.23046875, 3.390625, 3.55078125, 3.7109375, 3.87109375, 4.03125, 4.19140625, 4.3515625, 4.51171875, 4.671875, 4.83203125, 4.9921875, 5.15234375, 5.3125, 5.47265625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 5.0, 5.0, 3.0, 12.0, 7.0, 18.0, 29.0, 30.0, 52.0, 75.0, 110.0, 160.0, 271.0, 379.0, 596.0, 888.0, 1333.0, 2101.0, 3396.0, 5394.0, 8920.0, 14886.0, 25253.0, 42063.0, 71404.0, 125740.0, 606137.0, 882732.0, 126622.0, 72303.0, 42283.0, 25223.0, 14676.0, 8977.0, 5462.0, 3483.0, 2125.0, 1397.0, 888.0, 545.0, 355.0, 271.0, 180.0, 118.0, 77.0, 57.0, 32.0, 24.0, 16.0, 11.0, 10.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.798828125, -0.7730636596679688, -0.7472991943359375, -0.7215347290039062, -0.695770263671875, -0.6700057983398438, -0.6442413330078125, -0.6184768676757812, -0.59271240234375, -0.5669479370117188, -0.5411834716796875, -0.5154190063476562, -0.489654541015625, -0.46389007568359375, -0.4381256103515625, -0.41236114501953125, -0.3865966796875, -0.36083221435546875, -0.3350677490234375, -0.30930328369140625, -0.283538818359375, -0.25777435302734375, -0.2320098876953125, -0.20624542236328125, -0.18048095703125, -0.15471649169921875, -0.1289520263671875, -0.10318756103515625, -0.077423095703125, -0.05165863037109375, -0.0258941650390625, -0.00012969970703125, 0.025634765625, 0.05139923095703125, 0.0771636962890625, 0.10292816162109375, 0.128692626953125, 0.15445709228515625, 0.1802215576171875, 0.20598602294921875, 0.23175048828125, 0.25751495361328125, 0.2832794189453125, 0.30904388427734375, 0.334808349609375, 0.36057281494140625, 0.3863372802734375, 0.41210174560546875, 0.4378662109375, 0.46363067626953125, 0.4893951416015625, 0.5151596069335938, 0.540924072265625, 0.5666885375976562, 0.5924530029296875, 0.6182174682617188, 0.64398193359375, 0.6697463989257812, 0.6955108642578125, 0.7212753295898438, 0.747039794921875, 0.7728042602539062, 0.7985687255859375, 0.8243331909179688, 0.85009765625]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 5.0, 3.0, 7.0, 9.0, 6.0, 14.0, 9.0, 14.0, 27.0, 22.0, 39.0, 36.0, 51.0, 55.0, 57.0, 67.0, 66.0, 66.0, 65.0, 69.0, 62.0, 50.0, 43.0, 36.0, 23.0, 23.0, 18.0, 14.0, 6.0, 8.0, 6.0, 6.0, 1.0, 6.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0023517608642578125, -0.0022701919078826904, -0.0021886229515075684, -0.0021070539951324463, -0.0020254850387573242, -0.0019439160823822021, -0.00186234712600708, -0.001780778169631958, -0.001699209213256836, -0.0016176402568817139, -0.0015360713005065918, -0.0014545023441314697, -0.0013729333877563477, -0.0012913644313812256, -0.0012097954750061035, -0.0011282265186309814, -0.0010466575622558594, -0.0009650886058807373, -0.0008835196495056152, -0.0008019506931304932, -0.0007203817367553711, -0.000638812780380249, -0.000557243824005127, -0.0004756748676300049, -0.0003941059112548828, -0.00031253695487976074, -0.00023096799850463867, -0.0001493990421295166, -6.783008575439453e-05, 1.3738870620727539e-05, 9.530782699584961e-05, 0.00017687678337097168, 0.00025844573974609375, 0.0003400146961212158, 0.0004215836524963379, 0.00050315260887146, 0.000584721565246582, 0.0006662905216217041, 0.0007478594779968262, 0.0008294284343719482, 0.0009109973907470703, 0.0009925663471221924, 0.0010741353034973145, 0.0011557042598724365, 0.0012372732162475586, 0.0013188421726226807, 0.0014004111289978027, 0.0014819800853729248, 0.0015635490417480469, 0.001645117998123169, 0.001726686954498291, 0.001808255910873413, 0.0018898248672485352, 0.0019713938236236572, 0.0020529627799987793, 0.0021345317363739014, 0.0022161006927490234, 0.0022976696491241455, 0.0023792386054992676, 0.0024608075618743896, 0.0025423765182495117, 0.002623945474624634, 0.002705514430999756, 0.002787083387374878, 0.00286865234375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 4.0, 3.0, 7.0, 6.0, 9.0, 10.0, 17.0, 19.0, 13.0, 23.0, 33.0, 48.0, 61.0, 75.0, 134.0, 198.0, 347.0, 757.0, 5263.0, 1017606.0, 21865.0, 960.0, 382.0, 212.0, 132.0, 95.0, 69.0, 33.0, 36.0, 24.0, 17.0, 17.0, 26.0, 10.0, 8.0, 9.0, 7.0, 5.0, 3.0, 2.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.056610107421875, -0.054926395416259766, -0.05324268341064453, -0.0515589714050293, -0.04987525939941406, -0.04819154739379883, -0.046507835388183594, -0.04482412338256836, -0.043140411376953125, -0.04145669937133789, -0.039772987365722656, -0.03808927536010742, -0.03640556335449219, -0.03472185134887695, -0.03303813934326172, -0.031354427337646484, -0.02967071533203125, -0.027987003326416016, -0.02630329132080078, -0.024619579315185547, -0.022935867309570312, -0.021252155303955078, -0.019568443298339844, -0.01788473129272461, -0.016201019287109375, -0.01451730728149414, -0.012833595275878906, -0.011149883270263672, -0.009466171264648438, -0.007782459259033203, -0.006098747253417969, -0.004415035247802734, -0.0027313232421875, -0.0010476112365722656, 0.0006361007690429688, 0.002319812774658203, 0.0040035247802734375, 0.005687236785888672, 0.007370948791503906, 0.00905466079711914, 0.010738372802734375, 0.01242208480834961, 0.014105796813964844, 0.015789508819580078, 0.017473220825195312, 0.019156932830810547, 0.02084064483642578, 0.022524356842041016, 0.02420806884765625, 0.025891780853271484, 0.02757549285888672, 0.029259204864501953, 0.030942916870117188, 0.03262662887573242, 0.034310340881347656, 0.03599405288696289, 0.037677764892578125, 0.03936147689819336, 0.041045188903808594, 0.04272890090942383, 0.04441261291503906, 0.0460963249206543, 0.04778003692626953, 0.049463748931884766, 0.0511474609375]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 15.0, 57.0, 210.0, 330.0, 270.0, 95.0, 23.0, 8.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0024523695465177298, -0.002313684904947877, -0.0021750000305473804, -0.0020363153889775276, -0.0018976305145770311, -0.0017589458730071783, -0.0016202611150220037, -0.001481576357036829, -0.0013428915990516543, -0.0012042068410664797, -0.001065522083081305, -0.0009268373833037913, -0.0007881526253186166, -0.000649467867333442, -0.0005107831675559282, -0.0003720984095707536, -0.00023341365158557892, -9.472890815231949e-05, 4.395583528093994e-05, 0.00018264056416228414, 0.0003213253221474588, 0.00046001008013263345, 0.0005986947799101472, 0.0007373795378953218, 0.0008760642958804965, 0.0010147490538656712, 0.0011534338118508458, 0.0012921185698360205, 0.0014308032114058733, 0.0015694880858063698, 0.0017081727273762226, 0.0018468574853613973, 0.0019855424761772156, 0.0021242271177470684, 0.002262911992147565, 0.0024015966337174177, 0.002540281508117914, 0.002678966149687767, 0.00281765079125762, 0.0029563356656581163, 0.003095020540058613, 0.0032337051816284657, 0.003372390056028962, 0.003511074697598815, 0.0036497595719993114, 0.0037884442135691643, 0.003927128855139017, 0.00406581349670887, 0.00420449860394001, 0.004343183245509863, 0.004481867887079716, 0.004620552994310856, 0.004759237635880709, 0.0048979222774505615, 0.005036606919020414, 0.005175291560590267, 0.00531397620216012, 0.005452660843729973, 0.005591345485299826, 0.005730030592530966, 0.005868715234100819, 0.0060073998756706715, 0.006146084517240524, 0.006284769624471664, 0.006423454266041517]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 9.0, 14.0, 11.0, 15.0, 9.0, 21.0, 14.0, 24.0, 30.0, 33.0, 30.0, 32.0, 38.0, 30.0, 35.0, 36.0, 43.0, 43.0, 31.0, 36.0, 33.0, 35.0, 39.0, 44.0, 29.0, 27.0, 34.0, 32.0, 27.0, 19.0, 23.0, 13.0, 20.0, 16.0, 23.0, 10.0, 8.0, 12.0, 4.0, 7.0, 9.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0012775659561157227, -0.001238962635397911, -0.0012003593146800995, -0.001161755993962288, -0.0011231526732444763, -0.0010845493525266647, -0.0010459460318088531, -0.0010073427110910416, -0.00096873939037323, -0.0009301360696554184, -0.0008915327489376068, -0.0008529294282197952, -0.0008143261075019836, -0.0007757227867841721, -0.0007371194660663605, -0.0006985161453485489, -0.0006599128246307373, -0.0006213095039129257, -0.0005827061831951141, -0.0005441028624773026, -0.000505499541759491, -0.0004668962210416794, -0.0004282929003238678, -0.0003896895796060562, -0.00035108625888824463, -0.00031248293817043304, -0.00027387961745262146, -0.00023527629673480988, -0.0001966729760169983, -0.0001580696552991867, -0.00011946633458137512, -8.086301386356354e-05, -4.225969314575195e-05, -3.6563724279403687e-06, 3.4946948289871216e-05, 7.35502690076828e-05, 0.00011215358972549438, 0.00015075691044330597, 0.00018936023116111755, 0.00022796355187892914, 0.0002665668725967407, 0.0003051701933145523, 0.0003437735140323639, 0.0003823768347501755, 0.00042098015546798706, 0.00045958347618579865, 0.0004981867969036102, 0.0005367901176214218, 0.0005753934383392334, 0.000613996759057045, 0.0006526000797748566, 0.0006912034004926682, 0.0007298067212104797, 0.0007684100419282913, 0.0008070133626461029, 0.0008456166833639145, 0.0008842200040817261, 0.0009228233247995377, 0.0009614266455173492, 0.0010000299662351608, 0.0010386332869529724, 0.001077236607670784, 0.0011158399283885956, 0.0011544432491064072, 0.0011930465698242188]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 3.0, 2.0, 4.0, 2.0, 3.0, 1.0, 6.0, 9.0, 4.0, 3.0, 7.0, 10.0, 14.0, 20.0, 31.0, 18.0, 29.0, 21.0, 25.0, 32.0, 32.0, 34.0, 41.0, 40.0, 38.0, 46.0, 45.0, 43.0, 37.0, 33.0, 41.0, 41.0, 40.0, 27.0, 35.0, 24.0, 25.0, 16.0, 20.0, 12.0, 21.0, 15.0, 8.0, 8.0, 7.0, 10.0, 9.0, 4.0, 2.0, 7.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.30859375, -6.09613037109375, -5.8836669921875, -5.67120361328125, -5.458740234375, -5.24627685546875, -5.0338134765625, -4.82135009765625, -4.60888671875, -4.39642333984375, -4.1839599609375, -3.97149658203125, -3.759033203125, -3.54656982421875, -3.3341064453125, -3.12164306640625, -2.9091796875, -2.69671630859375, -2.4842529296875, -2.27178955078125, -2.059326171875, -1.84686279296875, -1.6343994140625, -1.42193603515625, -1.20947265625, -0.99700927734375, -0.7845458984375, -0.57208251953125, -0.359619140625, -0.14715576171875, 0.0653076171875, 0.27777099609375, 0.490234375, 0.70269775390625, 0.9151611328125, 1.12762451171875, 1.340087890625, 1.55255126953125, 1.7650146484375, 1.97747802734375, 2.18994140625, 2.40240478515625, 2.6148681640625, 2.82733154296875, 3.039794921875, 3.25225830078125, 3.4647216796875, 3.67718505859375, 3.8896484375, 4.10211181640625, 4.3145751953125, 4.52703857421875, 4.739501953125, 4.95196533203125, 5.1644287109375, 5.37689208984375, 5.58935546875, 5.80181884765625, 6.0142822265625, 6.22674560546875, 6.439208984375, 6.65167236328125, 6.8641357421875, 7.07659912109375, 7.2890625]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 7.0, 7.0, 7.0, 14.0, 22.0, 33.0, 32.0, 75.0, 74.0, 159.0, 228.0, 353.0, 583.0, 1040.0, 1796.0, 3692.0, 7315.0, 17012.0, 41367.0, 124062.0, 416936.0, 291193.0, 86022.0, 30859.0, 13012.0, 6060.0, 2863.0, 1496.0, 848.0, 472.0, 322.0, 191.0, 153.0, 76.0, 59.0, 35.0, 30.0, 19.0, 12.0, 11.0, 6.0, 2.0, 6.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.00390625, -5.802734375, -5.6015625, -5.400390625, -5.19921875, -4.998046875, -4.796875, -4.595703125, -4.39453125, -4.193359375, -3.9921875, -3.791015625, -3.58984375, -3.388671875, -3.1875, -2.986328125, -2.78515625, -2.583984375, -2.3828125, -2.181640625, -1.98046875, -1.779296875, -1.578125, -1.376953125, -1.17578125, -0.974609375, -0.7734375, -0.572265625, -0.37109375, -0.169921875, 0.03125, 0.232421875, 0.43359375, 0.634765625, 0.8359375, 1.037109375, 1.23828125, 1.439453125, 1.640625, 1.841796875, 2.04296875, 2.244140625, 2.4453125, 2.646484375, 2.84765625, 3.048828125, 3.25, 3.451171875, 3.65234375, 3.853515625, 4.0546875, 4.255859375, 4.45703125, 4.658203125, 4.859375, 5.060546875, 5.26171875, 5.462890625, 5.6640625, 5.865234375, 6.06640625, 6.267578125, 6.46875, 6.669921875, 6.87109375]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 5.0, 5.0, 6.0, 11.0, 17.0, 21.0, 21.0, 24.0, 32.0, 22.0, 33.0, 43.0, 42.0, 46.0, 52.0, 64.0, 172.0, 1651.0, 291.0, 102.0, 53.0, 58.0, 35.0, 32.0, 33.0, 34.0, 25.0, 27.0, 24.0, 17.0, 13.0, 5.0, 9.0, 7.0, 6.0, 4.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-30.828125, -29.98779296875, -29.1474609375, -28.30712890625, -27.466796875, -26.62646484375, -25.7861328125, -24.94580078125, -24.10546875, -23.26513671875, -22.4248046875, -21.58447265625, -20.744140625, -19.90380859375, -19.0634765625, -18.22314453125, -17.3828125, -16.54248046875, -15.7021484375, -14.86181640625, -14.021484375, -13.18115234375, -12.3408203125, -11.50048828125, -10.66015625, -9.81982421875, -8.9794921875, -8.13916015625, -7.298828125, -6.45849609375, -5.6181640625, -4.77783203125, -3.9375, -3.09716796875, -2.2568359375, -1.41650390625, -0.576171875, 0.26416015625, 1.1044921875, 1.94482421875, 2.78515625, 3.62548828125, 4.4658203125, 5.30615234375, 6.146484375, 6.98681640625, 7.8271484375, 8.66748046875, 9.5078125, 10.34814453125, 11.1884765625, 12.02880859375, 12.869140625, 13.70947265625, 14.5498046875, 15.39013671875, 16.23046875, 17.07080078125, 17.9111328125, 18.75146484375, 19.591796875, 20.43212890625, 21.2724609375, 22.11279296875, 22.953125]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 12.0, 17.0, 20.0, 33.0, 42.0, 59.0, 119.0, 205.0, 331.0, 584.0, 5020.0, 3133291.0, 4465.0, 624.0, 314.0, 212.0, 120.0, 95.0, 48.0, 25.0, 23.0, 7.0, 10.0, 6.0, 5.0, 6.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.5, -77.212890625, -73.92578125, -70.638671875, -67.3515625, -64.064453125, -60.77734375, -57.490234375, -54.203125, -50.916015625, -47.62890625, -44.341796875, -41.0546875, -37.767578125, -34.48046875, -31.193359375, -27.90625, -24.619140625, -21.33203125, -18.044921875, -14.7578125, -11.470703125, -8.18359375, -4.896484375, -1.609375, 1.677734375, 4.96484375, 8.251953125, 11.5390625, 14.826171875, 18.11328125, 21.400390625, 24.6875, 27.974609375, 31.26171875, 34.548828125, 37.8359375, 41.123046875, 44.41015625, 47.697265625, 50.984375, 54.271484375, 57.55859375, 60.845703125, 64.1328125, 67.419921875, 70.70703125, 73.994140625, 77.28125, 80.568359375, 83.85546875, 87.142578125, 90.4296875, 93.716796875, 97.00390625, 100.291015625, 103.578125, 106.865234375, 110.15234375, 113.439453125, 116.7265625, 120.013671875, 123.30078125, 126.587890625, 129.875]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 44.0, 816.0, 155.0, 3.0, 2.0, 2.0], "bins": [-416.6565856933594, -409.6693420410156, -402.68212890625, -395.69488525390625, -388.7076721191406, -381.7204284667969, -374.73321533203125, -367.7459716796875, -360.75872802734375, -353.771484375, -346.7842712402344, -339.7970275878906, -332.809814453125, -325.82257080078125, -318.8353576660156, -311.8481140136719, -304.86090087890625, -297.8736572265625, -290.8864440917969, -283.8992004394531, -276.9119873046875, -269.92474365234375, -262.9375305175781, -255.95028686523438, -248.9630584716797, -241.975830078125, -234.9886016845703, -228.00137329101562, -221.01412963867188, -214.02691650390625, -207.0396728515625, -200.0524444580078, -193.06521606445312, -186.07798767089844, -179.09075927734375, -172.10353088378906, -165.11630249023438, -158.12905883789062, -151.14183044433594, -144.15460205078125, -137.16737365722656, -130.18014526367188, -123.19291687011719, -116.20568084716797, -109.21845245361328, -102.2312240600586, -95.24398803710938, -88.25675964355469, -81.26953125, -74.28230285644531, -67.29507446289062, -60.307838439941406, -53.32061004638672, -46.33338165283203, -39.34614944458008, -32.358917236328125, -25.371686935424805, -18.384456634521484, -11.397226333618164, -4.409996032714844, 2.5772342681884766, 9.564462661743164, 16.551694869995117, 23.53892707824707, 30.526155471801758]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 6.0, 6.0, 8.0, 7.0, 6.0, 8.0, 19.0, 15.0, 17.0, 23.0, 24.0, 33.0, 23.0, 32.0, 37.0, 38.0, 29.0, 37.0, 37.0, 51.0, 42.0, 39.0, 50.0, 37.0, 43.0, 40.0, 44.0, 39.0, 30.0, 25.0, 23.0, 19.0, 18.0, 24.0, 24.0, 13.0, 10.0, 11.0, 6.0, 7.0, 4.0, 0.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.74664306640625, -60.72026824951172, -58.69389724731445, -56.66752243041992, -54.641151428222656, -52.614776611328125, -50.588401794433594, -48.56203079223633, -46.53565979003906, -44.50928497314453, -42.482913970947266, -40.456539154052734, -38.43016815185547, -36.40379333496094, -34.377418518066406, -32.35104751586914, -30.32467269897461, -28.29829978942871, -26.271926879882812, -24.24555206298828, -22.219181060791016, -20.192806243896484, -18.166433334350586, -16.140060424804688, -14.113687515258789, -12.08731460571289, -10.060941696166992, -8.034567832946777, -6.008194923400879, -3.9818220138549805, -1.9554481506347656, 0.07092475891113281, 2.0972976684570312, 4.12367057800293, 6.150043964385986, 8.176417350769043, 10.202790260314941, 12.22916316986084, 14.255537033081055, 16.281909942626953, 18.30828285217285, 20.33465576171875, 22.36102867126465, 24.387401580810547, 26.413776397705078, 28.440147399902344, 30.466522216796875, 32.492897033691406, 34.51926803588867, 36.5456428527832, 38.57201385498047, 40.598388671875, 42.624759674072266, 44.6511344909668, 46.67750549316406, 48.703880310058594, 50.730255126953125, 52.756629943847656, 54.78300094604492, 56.80937576293945, 58.83574676513672, 60.86212158203125, 62.88849639892578, 64.91487121582031, 66.94123840332031]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 4.0, 1.0, 4.0, 7.0, 3.0, 6.0, 9.0, 17.0, 14.0, 17.0, 22.0, 40.0, 19.0, 26.0, 14.0, 36.0, 40.0, 39.0, 49.0, 37.0, 47.0, 59.0, 32.0, 42.0, 42.0, 37.0, 47.0, 32.0, 34.0, 35.0, 35.0, 15.0, 20.0, 18.0, 23.0, 14.0, 9.0, 14.0, 12.0, 3.0, 7.0, 5.0, 2.0, 7.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3359375, -7.09869384765625, -6.8614501953125, -6.62420654296875, -6.386962890625, -6.14971923828125, -5.9124755859375, -5.67523193359375, -5.43798828125, -5.20074462890625, -4.9635009765625, -4.72625732421875, -4.489013671875, -4.25177001953125, -4.0145263671875, -3.77728271484375, -3.5400390625, -3.30279541015625, -3.0655517578125, -2.82830810546875, -2.591064453125, -2.35382080078125, -2.1165771484375, -1.87933349609375, -1.64208984375, -1.40484619140625, -1.1676025390625, -0.93035888671875, -0.693115234375, -0.45587158203125, -0.2186279296875, 0.01861572265625, 0.255859375, 0.49310302734375, 0.7303466796875, 0.96759033203125, 1.204833984375, 1.44207763671875, 1.6793212890625, 1.91656494140625, 2.15380859375, 2.39105224609375, 2.6282958984375, 2.86553955078125, 3.102783203125, 3.34002685546875, 3.5772705078125, 3.81451416015625, 4.0517578125, 4.28900146484375, 4.5262451171875, 4.76348876953125, 5.000732421875, 5.23797607421875, 5.4752197265625, 5.71246337890625, 5.94970703125, 6.18695068359375, 6.4241943359375, 6.66143798828125, 6.898681640625, 7.13592529296875, 7.3731689453125, 7.61041259765625, 7.84765625]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 4.0, 11.0, 2.0, 2.0, 10.0, 6.0, 12.0, 19.0, 24.0, 25.0, 31.0, 42.0, 60.0, 85.0, 145.0, 266.0, 557.0, 1698.0, 9812.0, 182215.0, 2743755.0, 1207504.0, 42061.0, 3978.0, 962.0, 377.0, 185.0, 133.0, 73.0, 44.0, 45.0, 27.0, 25.0, 18.0, 18.0, 12.0, 5.0, 7.0, 10.0, 7.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.21875, -18.551025390625, -17.88330078125, -17.215576171875, -16.5478515625, -15.880126953125, -15.21240234375, -14.544677734375, -13.876953125, -13.209228515625, -12.54150390625, -11.873779296875, -11.2060546875, -10.538330078125, -9.87060546875, -9.202880859375, -8.53515625, -7.867431640625, -7.19970703125, -6.531982421875, -5.8642578125, -5.196533203125, -4.52880859375, -3.861083984375, -3.193359375, -2.525634765625, -1.85791015625, -1.190185546875, -0.5224609375, 0.145263671875, 0.81298828125, 1.480712890625, 2.1484375, 2.816162109375, 3.48388671875, 4.151611328125, 4.8193359375, 5.487060546875, 6.15478515625, 6.822509765625, 7.490234375, 8.157958984375, 8.82568359375, 9.493408203125, 10.1611328125, 10.828857421875, 11.49658203125, 12.164306640625, 12.83203125, 13.499755859375, 14.16748046875, 14.835205078125, 15.5029296875, 16.170654296875, 16.83837890625, 17.506103515625, 18.173828125, 18.841552734375, 19.50927734375, 20.177001953125, 20.8447265625, 21.512451171875, 22.18017578125, 22.847900390625, 23.515625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 10.0, 14.0, 23.0, 22.0, 34.0, 53.0, 87.0, 113.0, 179.0, 297.0, 387.0, 577.0, 597.0, 501.0, 391.0, 242.0, 185.0, 123.0, 69.0, 55.0, 37.0, 30.0, 18.0, 8.0, 8.0, 4.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.09375, -20.478515625, -19.86328125, -19.248046875, -18.6328125, -18.017578125, -17.40234375, -16.787109375, -16.171875, -15.556640625, -14.94140625, -14.326171875, -13.7109375, -13.095703125, -12.48046875, -11.865234375, -11.25, -10.634765625, -10.01953125, -9.404296875, -8.7890625, -8.173828125, -7.55859375, -6.943359375, -6.328125, -5.712890625, -5.09765625, -4.482421875, -3.8671875, -3.251953125, -2.63671875, -2.021484375, -1.40625, -0.791015625, -0.17578125, 0.439453125, 1.0546875, 1.669921875, 2.28515625, 2.900390625, 3.515625, 4.130859375, 4.74609375, 5.361328125, 5.9765625, 6.591796875, 7.20703125, 7.822265625, 8.4375, 9.052734375, 9.66796875, 10.283203125, 10.8984375, 11.513671875, 12.12890625, 12.744140625, 13.359375, 13.974609375, 14.58984375, 15.205078125, 15.8203125, 16.435546875, 17.05078125, 17.666015625, 18.28125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 7.0, 4.0, 20.0, 18.0, 25.0, 26.0, 38.0, 52.0, 69.0, 80.0, 137.0, 171.0, 226.0, 343.0, 632.0, 2492.0, 1217744.0, 2966841.0, 3486.0, 670.0, 333.0, 216.0, 157.0, 117.0, 76.0, 73.0, 70.0, 44.0, 31.0, 25.0, 17.0, 9.0, 10.0, 4.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.625, -69.2421875, -66.859375, -64.4765625, -62.09375, -59.7109375, -57.328125, -54.9453125, -52.5625, -50.1796875, -47.796875, -45.4140625, -43.03125, -40.6484375, -38.265625, -35.8828125, -33.5, -31.1171875, -28.734375, -26.3515625, -23.96875, -21.5859375, -19.203125, -16.8203125, -14.4375, -12.0546875, -9.671875, -7.2890625, -4.90625, -2.5234375, -0.140625, 2.2421875, 4.625, 7.0078125, 9.390625, 11.7734375, 14.15625, 16.5390625, 18.921875, 21.3046875, 23.6875, 26.0703125, 28.453125, 30.8359375, 33.21875, 35.6015625, 37.984375, 40.3671875, 42.75, 45.1328125, 47.515625, 49.8984375, 52.28125, 54.6640625, 57.046875, 59.4296875, 61.8125, 64.1953125, 66.578125, 68.9609375, 71.34375, 73.7265625, 76.109375, 78.4921875, 80.875]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 7.0, 5.0, 8.0, 29.0, 39.0, 44.0, 76.0, 82.0, 126.0, 120.0, 122.0, 97.0, 82.0, 68.0, 36.0, 29.0, 14.0, 12.0, 9.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.39915466308594, -42.5806999206543, -40.762245178222656, -38.943790435791016, -37.125335693359375, -35.306884765625, -33.48843002319336, -31.66997528076172, -29.851520538330078, -28.033065795898438, -26.214611053466797, -24.39615821838379, -22.57770347595215, -20.759248733520508, -18.9407958984375, -17.12234115600586, -15.303886413574219, -13.485431671142578, -11.666977882385254, -9.84852409362793, -8.030069351196289, -6.211614608764648, -4.393160820007324, -2.57470703125, -0.7562522888183594, 1.062201976776123, 2.8806562423706055, 4.699110507965088, 6.51756477355957, 8.336019515991211, 10.154473304748535, 11.97292709350586, 13.7913818359375, 15.60983657836914, 17.42829132080078, 19.24674415588379, 21.06519889831543, 22.88365364074707, 24.702106475830078, 26.52056121826172, 28.33901596069336, 30.157470703125, 31.97592544555664, 33.79438018798828, 35.612831115722656, 37.43128967285156, 39.24974060058594, 41.06819534301758, 42.88665008544922, 44.70510482788086, 46.5235595703125, 48.34201431274414, 50.16046905517578, 51.978919982910156, 53.7973747253418, 55.61582946777344, 57.43428421020508, 59.25273895263672, 61.07119369506836, 62.8896484375, 64.70809936523438, 66.52655792236328, 68.34500885009766, 70.16346740722656, 71.98191833496094]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 8.0, 5.0, 5.0, 8.0, 8.0, 19.0, 26.0, 17.0, 24.0, 23.0, 20.0, 29.0, 38.0, 39.0, 48.0, 54.0, 53.0, 48.0, 43.0, 50.0, 45.0, 42.0, 44.0, 48.0, 37.0, 42.0, 27.0, 22.0, 20.0, 18.0, 17.0, 18.0, 16.0, 11.0, 6.0, 5.0, 6.0, 6.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.81658935546875, -61.10207748413086, -59.387569427490234, -57.673057556152344, -55.95854949951172, -54.24403762817383, -52.52952575683594, -50.81501770019531, -49.10050582885742, -47.38599395751953, -45.671485900878906, -43.956974029541016, -42.242462158203125, -40.5279541015625, -38.81344223022461, -37.09893035888672, -35.384422302246094, -33.6699104309082, -31.955402374267578, -30.240890502929688, -28.52638053894043, -26.811870574951172, -25.09735870361328, -23.382848739624023, -21.668338775634766, -19.953828811645508, -18.23931884765625, -16.52480697631836, -14.810297012329102, -13.095787048339844, -11.38127613067627, -9.666765213012695, -7.9522552490234375, -6.2377448081970215, -4.5232343673706055, -2.8087239265441895, -1.0942134857177734, 0.6202964782714844, 2.3348073959350586, 4.049318313598633, 5.763828277587891, 7.478338718414307, 9.192849159240723, 10.907360076904297, 12.621870040893555, 14.336380004882812, 16.050891876220703, 17.76540184020996, 19.47991180419922, 21.194421768188477, 22.908931732177734, 24.623443603515625, 26.337953567504883, 28.05246353149414, 29.76697540283203, 31.48148536682129, 33.19599533081055, 34.91050720214844, 36.62501525878906, 38.33952713012695, 40.054039001464844, 41.76854705810547, 43.48305892944336, 45.19757080078125, 46.912078857421875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 7.0, 10.0, 8.0, 7.0, 15.0, 11.0, 15.0, 18.0, 19.0, 26.0, 26.0, 31.0, 31.0, 36.0, 31.0, 34.0, 40.0, 41.0, 42.0, 42.0, 39.0, 43.0, 42.0, 40.0, 37.0, 33.0, 39.0, 32.0, 36.0, 30.0, 26.0, 21.0, 18.0, 8.0, 7.0, 12.0, 10.0, 12.0, 7.0, 9.0, 3.0, 5.0, 6.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.921875, -7.6961669921875, -7.470458984375, -7.2447509765625, -7.01904296875, -6.7933349609375, -6.567626953125, -6.3419189453125, -6.1162109375, -5.8905029296875, -5.664794921875, -5.4390869140625, -5.21337890625, -4.9876708984375, -4.761962890625, -4.5362548828125, -4.310546875, -4.0848388671875, -3.859130859375, -3.6334228515625, -3.40771484375, -3.1820068359375, -2.956298828125, -2.7305908203125, -2.5048828125, -2.2791748046875, -2.053466796875, -1.8277587890625, -1.60205078125, -1.3763427734375, -1.150634765625, -0.9249267578125, -0.69921875, -0.4735107421875, -0.247802734375, -0.0220947265625, 0.20361328125, 0.4293212890625, 0.655029296875, 0.8807373046875, 1.1064453125, 1.3321533203125, 1.557861328125, 1.7835693359375, 2.00927734375, 2.2349853515625, 2.460693359375, 2.6864013671875, 2.912109375, 3.1378173828125, 3.363525390625, 3.5892333984375, 3.81494140625, 4.0406494140625, 4.266357421875, 4.4920654296875, 4.7177734375, 4.9434814453125, 5.169189453125, 5.3948974609375, 5.62060546875, 5.8463134765625, 6.072021484375, 6.2977294921875, 6.5234375]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 9.0, 10.0, 15.0, 27.0, 21.0, 57.0, 79.0, 125.0, 169.0, 280.0, 453.0, 726.0, 1103.0, 1714.0, 2865.0, 4508.0, 7743.0, 12971.0, 22313.0, 39110.0, 68555.0, 120920.0, 207914.0, 230793.0, 138720.0, 78950.0, 45062.0, 25779.0, 15154.0, 8679.0, 5157.0, 3250.0, 1913.0, 1230.0, 813.0, 485.0, 303.0, 190.0, 146.0, 75.0, 57.0, 43.0, 21.0, 18.0, 10.0, 13.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.99853515625, -0.9701080322265625, -0.941680908203125, -0.9132537841796875, -0.88482666015625, -0.8563995361328125, -0.827972412109375, -0.7995452880859375, -0.7711181640625, -0.7426910400390625, -0.714263916015625, -0.6858367919921875, -0.65740966796875, -0.6289825439453125, -0.600555419921875, -0.5721282958984375, -0.543701171875, -0.5152740478515625, -0.486846923828125, -0.4584197998046875, -0.42999267578125, -0.4015655517578125, -0.373138427734375, -0.3447113037109375, -0.3162841796875, -0.2878570556640625, -0.259429931640625, -0.2310028076171875, -0.20257568359375, -0.1741485595703125, -0.145721435546875, -0.1172943115234375, -0.0888671875, -0.0604400634765625, -0.032012939453125, -0.0035858154296875, 0.02484130859375, 0.0532684326171875, 0.081695556640625, 0.1101226806640625, 0.1385498046875, 0.1669769287109375, 0.195404052734375, 0.2238311767578125, 0.25225830078125, 0.2806854248046875, 0.309112548828125, 0.3375396728515625, 0.365966796875, 0.3943939208984375, 0.422821044921875, 0.4512481689453125, 0.47967529296875, 0.5081024169921875, 0.536529541015625, 0.5649566650390625, 0.5933837890625, 0.6218109130859375, 0.650238037109375, 0.6786651611328125, 0.70709228515625, 0.7355194091796875, 0.763946533203125, 0.7923736572265625, 0.82080078125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 4.0, 2.0, 8.0, 13.0, 11.0, 8.0, 16.0, 17.0, 24.0, 32.0, 36.0, 33.0, 29.0, 41.0, 45.0, 36.0, 48.0, 45.0, 1071.0, 50.0, 50.0, 49.0, 52.0, 43.0, 51.0, 31.0, 32.0, 20.0, 18.0, 19.0, 15.0, 16.0, 15.0, 7.0, 10.0, 6.0, 9.0, 6.0, 5.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.78515625, -5.623779296875, -5.46240234375, -5.301025390625, -5.1396484375, -4.978271484375, -4.81689453125, -4.655517578125, -4.494140625, -4.332763671875, -4.17138671875, -4.010009765625, -3.8486328125, -3.687255859375, -3.52587890625, -3.364501953125, -3.203125, -3.041748046875, -2.88037109375, -2.718994140625, -2.5576171875, -2.396240234375, -2.23486328125, -2.073486328125, -1.912109375, -1.750732421875, -1.58935546875, -1.427978515625, -1.2666015625, -1.105224609375, -0.94384765625, -0.782470703125, -0.62109375, -0.459716796875, -0.29833984375, -0.136962890625, 0.0244140625, 0.185791015625, 0.34716796875, 0.508544921875, 0.669921875, 0.831298828125, 0.99267578125, 1.154052734375, 1.3154296875, 1.476806640625, 1.63818359375, 1.799560546875, 1.9609375, 2.122314453125, 2.28369140625, 2.445068359375, 2.6064453125, 2.767822265625, 2.92919921875, 3.090576171875, 3.251953125, 3.413330078125, 3.57470703125, 3.736083984375, 3.8974609375, 4.058837890625, 4.22021484375, 4.381591796875, 4.54296875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 5.0, 6.0, 11.0, 16.0, 24.0, 30.0, 51.0, 79.0, 123.0, 186.0, 334.0, 457.0, 715.0, 1125.0, 1776.0, 2849.0, 4710.0, 7837.0, 13650.0, 23487.0, 40951.0, 72312.0, 128326.0, 1066416.0, 437465.0, 126328.0, 71024.0, 40348.0, 23086.0, 13339.0, 7791.0, 4711.0, 2820.0, 1675.0, 1118.0, 698.0, 434.0, 252.0, 196.0, 120.0, 88.0, 58.0, 43.0, 19.0, 17.0, 15.0, 6.0, 3.0, 3.0, 1.0, 3.0, 3.0, 2.0], "bins": [-0.97021484375, -0.9424819946289062, -0.9147491455078125, -0.8870162963867188, -0.859283447265625, -0.8315505981445312, -0.8038177490234375, -0.7760848999023438, -0.74835205078125, -0.7206192016601562, -0.6928863525390625, -0.6651535034179688, -0.637420654296875, -0.6096878051757812, -0.5819549560546875, -0.5542221069335938, -0.5264892578125, -0.49875640869140625, -0.4710235595703125, -0.44329071044921875, -0.415557861328125, -0.38782501220703125, -0.3600921630859375, -0.33235931396484375, -0.30462646484375, -0.27689361572265625, -0.2491607666015625, -0.22142791748046875, -0.193695068359375, -0.16596221923828125, -0.1382293701171875, -0.11049652099609375, -0.082763671875, -0.05503082275390625, -0.0272979736328125, 0.00043487548828125, 0.028167724609375, 0.05590057373046875, 0.0836334228515625, 0.11136627197265625, 0.13909912109375, 0.16683197021484375, 0.1945648193359375, 0.22229766845703125, 0.250030517578125, 0.27776336669921875, 0.3054962158203125, 0.33322906494140625, 0.3609619140625, 0.38869476318359375, 0.4164276123046875, 0.44416046142578125, 0.471893310546875, 0.49962615966796875, 0.5273590087890625, 0.5550918579101562, 0.58282470703125, 0.6105575561523438, 0.6382904052734375, 0.6660232543945312, 0.693756103515625, 0.7214889526367188, 0.7492218017578125, 0.7769546508789062, 0.8046875]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 1.0, 3.0, 5.0, 8.0, 4.0, 12.0, 11.0, 14.0, 14.0, 12.0, 21.0, 44.0, 37.0, 39.0, 41.0, 50.0, 61.0, 66.0, 60.0, 65.0, 59.0, 63.0, 52.0, 45.0, 39.0, 31.0, 24.0, 23.0, 13.0, 18.0, 14.0, 14.0, 9.0, 5.0, 6.0, 4.0, 6.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0034809112548828125, -0.0033723413944244385, -0.0032637715339660645, -0.0031552016735076904, -0.0030466318130493164, -0.0029380619525909424, -0.0028294920921325684, -0.0027209222316741943, -0.0026123523712158203, -0.0025037825107574463, -0.0023952126502990723, -0.0022866427898406982, -0.0021780729293823242, -0.00206950306892395, -0.001960933208465576, -0.0018523633480072021, -0.0017437934875488281, -0.001635223627090454, -0.00152665376663208, -0.001418083906173706, -0.001309514045715332, -0.001200944185256958, -0.001092374324798584, -0.00098380446434021, -0.0008752346038818359, -0.0007666647434234619, -0.0006580948829650879, -0.0005495250225067139, -0.00044095516204833984, -0.0003323853015899658, -0.0002238154411315918, -0.00011524558067321777, -6.67572021484375e-06, 0.00010189414024353027, 0.0002104640007019043, 0.0003190338611602783, 0.00042760372161865234, 0.0005361735820770264, 0.0006447434425354004, 0.0007533133029937744, 0.0008618831634521484, 0.0009704530239105225, 0.0010790228843688965, 0.0011875927448272705, 0.0012961626052856445, 0.0014047324657440186, 0.0015133023262023926, 0.0016218721866607666, 0.0017304420471191406, 0.0018390119075775146, 0.0019475817680358887, 0.0020561516284942627, 0.0021647214889526367, 0.0022732913494110107, 0.0023818612098693848, 0.002490431070327759, 0.002599000930786133, 0.002707570791244507, 0.002816140651702881, 0.002924710512161255, 0.003033280372619629, 0.003141850233078003, 0.003250420093536377, 0.003358989953994751, 0.003467559814453125]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 0.0, 2.0, 2.0, 5.0, 2.0, 4.0, 7.0, 11.0, 6.0, 15.0, 22.0, 22.0, 16.0, 43.0, 45.0, 51.0, 90.0, 143.0, 397.0, 1668.0, 1036413.0, 8419.0, 543.0, 202.0, 109.0, 65.0, 53.0, 53.0, 42.0, 21.0, 12.0, 14.0, 13.0, 14.0, 9.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.09417724609375, -0.09129524230957031, -0.08841323852539062, -0.08553123474121094, -0.08264923095703125, -0.07976722717285156, -0.07688522338867188, -0.07400321960449219, -0.0711212158203125, -0.06823921203613281, -0.06535720825195312, -0.06247520446777344, -0.05959320068359375, -0.05671119689941406, -0.053829193115234375, -0.05094718933105469, -0.048065185546875, -0.04518318176269531, -0.042301177978515625, -0.03941917419433594, -0.03653717041015625, -0.03365516662597656, -0.030773162841796875, -0.027891159057617188, -0.0250091552734375, -0.022127151489257812, -0.019245147705078125, -0.016363143920898438, -0.01348114013671875, -0.010599136352539062, -0.007717132568359375, -0.0048351287841796875, -0.001953125, 0.0009288787841796875, 0.003810882568359375, 0.0066928863525390625, 0.00957489013671875, 0.012456893920898438, 0.015338897705078125, 0.018220901489257812, 0.0211029052734375, 0.023984909057617188, 0.026866912841796875, 0.029748916625976562, 0.03263092041015625, 0.03551292419433594, 0.038394927978515625, 0.04127693176269531, 0.044158935546875, 0.04704093933105469, 0.049922943115234375, 0.05280494689941406, 0.05568695068359375, 0.05856895446777344, 0.061450958251953125, 0.06433296203613281, 0.0672149658203125, 0.07009696960449219, 0.07297897338867188, 0.07586097717285156, 0.07874298095703125, 0.08162498474121094, 0.08450698852539062, 0.08738899230957031, 0.09027099609375]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 9.0, 28.0, 116.0, 329.0, 372.0, 136.0, 21.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015001518186181784, -0.0013345691841095686, -0.0011689866660162807, -0.0010034041479229927, -0.0008378215134143829, -0.0006722389371134341, -0.0005066563608124852, -0.0003410738427191973, -0.0001754912082105875, -9.908631909638643e-06, 0.00015567394439131021, 0.0003212565206922591, 0.00048683909699320793, 0.0006524216732941568, 0.0008180042495951056, 0.0009835867676883936, 0.0011491694021970034, 0.0013147520367056131, 0.001480334554798901, 0.001645917072892189, 0.0018114997074007988, 0.0019770823419094086, 0.0021426649764180183, 0.0023082473780959845, 0.0024738300126045942, 0.002639412647113204, 0.00280499504879117, 0.00297057768329978, 0.0031361603178083897, 0.0033017429523169994, 0.003467325586825609, 0.0036329079885035753, 0.0037984903901815414, 0.003964073024690151, 0.004129655659198761, 0.004295238293707371, 0.0044608209282159805, 0.004626403097063303, 0.004791985731571913, 0.0049575683660805225, 0.005123151000589132, 0.005288733635097742, 0.005454316269606352, 0.005619898904114962, 0.005785481072962284, 0.005951063707470894, 0.006116646341979504, 0.006282228976488113, 0.006447811610996723, 0.006613394245505333, 0.006778976880013943, 0.0069445595145225525, 0.007110142149031162, 0.007275724317878485, 0.0074413069523870945, 0.007606889586895704, 0.007772472221404314, 0.007938054390251637, 0.008103637024760246, 0.008269219659268856, 0.008434802293777466, 0.008600384928286076, 0.008765967562794685, 0.008931550197303295, 0.009097132831811905]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 7.0, 5.0, 7.0, 7.0, 4.0, 16.0, 12.0, 18.0, 13.0, 24.0, 22.0, 35.0, 37.0, 26.0, 26.0, 36.0, 40.0, 40.0, 37.0, 40.0, 36.0, 46.0, 38.0, 51.0, 46.0, 37.0, 35.0, 29.0, 37.0, 25.0, 22.0, 26.0, 23.0, 21.0, 13.0, 13.0, 13.0, 3.0, 13.0, 7.0, 5.0, 12.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0018528103828430176, -0.0017948895692825317, -0.001736968755722046, -0.00167904794216156, -0.0016211271286010742, -0.0015632063150405884, -0.0015052855014801025, -0.0014473646879196167, -0.0013894438743591309, -0.001331523060798645, -0.0012736022472381592, -0.0012156814336776733, -0.0011577606201171875, -0.0010998398065567017, -0.0010419189929962158, -0.00098399817943573, -0.0009260773658752441, -0.0008681565523147583, -0.0008102357387542725, -0.0007523149251937866, -0.0006943941116333008, -0.0006364732980728149, -0.0005785524845123291, -0.0005206316709518433, -0.0004627108573913574, -0.0004047900438308716, -0.00034686923027038574, -0.0002889484167098999, -0.00023102760314941406, -0.00017310678958892822, -0.00011518597602844238, -5.726516246795654e-05, 6.556510925292969e-07, 5.857646465301514e-05, 0.00011649727821350098, 0.00017441809177398682, 0.00023233890533447266, 0.0002902597188949585, 0.00034818053245544434, 0.0004061013460159302, 0.000464022159576416, 0.0005219429731369019, 0.0005798637866973877, 0.0006377846002578735, 0.0006957054138183594, 0.0007536262273788452, 0.0008115470409393311, 0.0008694678544998169, 0.0009273886680603027, 0.0009853094816207886, 0.0010432302951812744, 0.0011011511087417603, 0.001159071922302246, 0.001216992735862732, 0.0012749135494232178, 0.0013328343629837036, 0.0013907551765441895, 0.0014486759901046753, 0.0015065968036651611, 0.001564517617225647, 0.0016224384307861328, 0.0016803592443466187, 0.0017382800579071045, 0.0017962008714675903, 0.0018541216850280762]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 7.0, 10.0, 8.0, 7.0, 15.0, 11.0, 15.0, 18.0, 19.0, 26.0, 26.0, 31.0, 31.0, 36.0, 31.0, 34.0, 40.0, 40.0, 43.0, 42.0, 39.0, 43.0, 42.0, 40.0, 37.0, 33.0, 39.0, 32.0, 36.0, 30.0, 26.0, 21.0, 18.0, 8.0, 7.0, 12.0, 10.0, 12.0, 7.0, 9.0, 3.0, 5.0, 6.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.921875, -7.6961669921875, -7.470458984375, -7.2447509765625, -7.01904296875, -6.7933349609375, -6.567626953125, -6.3419189453125, -6.1162109375, -5.8905029296875, -5.664794921875, -5.4390869140625, -5.21337890625, -4.9876708984375, -4.761962890625, -4.5362548828125, -4.310546875, -4.0848388671875, -3.859130859375, -3.6334228515625, -3.40771484375, -3.1820068359375, -2.956298828125, -2.7305908203125, -2.5048828125, -2.2791748046875, -2.053466796875, -1.8277587890625, -1.60205078125, -1.3763427734375, -1.150634765625, -0.9249267578125, -0.69921875, -0.4735107421875, -0.247802734375, -0.0220947265625, 0.20361328125, 0.4293212890625, 0.655029296875, 0.8807373046875, 1.1064453125, 1.3321533203125, 1.557861328125, 1.7835693359375, 2.00927734375, 2.2349853515625, 2.460693359375, 2.6864013671875, 2.912109375, 3.1378173828125, 3.363525390625, 3.5892333984375, 3.81494140625, 4.0406494140625, 4.266357421875, 4.4920654296875, 4.7177734375, 4.9434814453125, 5.169189453125, 5.3948974609375, 5.62060546875, 5.8463134765625, 6.072021484375, 6.2977294921875, 6.5234375]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 5.0, 5.0, 9.0, 12.0, 12.0, 14.0, 34.0, 40.0, 52.0, 74.0, 122.0, 181.0, 301.0, 609.0, 1187.0, 2839.0, 7880.0, 25483.0, 100505.0, 470687.0, 332924.0, 74641.0, 20111.0, 6161.0, 2349.0, 1006.0, 499.0, 285.0, 184.0, 124.0, 61.0, 46.0, 28.0, 23.0, 15.0, 18.0, 12.0, 6.0, 8.0, 8.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-9.8125, -9.56024169921875, -9.3079833984375, -9.05572509765625, -8.803466796875, -8.55120849609375, -8.2989501953125, -8.04669189453125, -7.79443359375, -7.54217529296875, -7.2899169921875, -7.03765869140625, -6.785400390625, -6.53314208984375, -6.2808837890625, -6.02862548828125, -5.7763671875, -5.52410888671875, -5.2718505859375, -5.01959228515625, -4.767333984375, -4.51507568359375, -4.2628173828125, -4.01055908203125, -3.75830078125, -3.50604248046875, -3.2537841796875, -3.00152587890625, -2.749267578125, -2.49700927734375, -2.2447509765625, -1.99249267578125, -1.740234375, -1.48797607421875, -1.2357177734375, -0.98345947265625, -0.731201171875, -0.47894287109375, -0.2266845703125, 0.02557373046875, 0.27783203125, 0.53009033203125, 0.7823486328125, 1.03460693359375, 1.286865234375, 1.53912353515625, 1.7913818359375, 2.04364013671875, 2.2958984375, 2.54815673828125, 2.8004150390625, 3.05267333984375, 3.304931640625, 3.55718994140625, 3.8094482421875, 4.06170654296875, 4.31396484375, 4.56622314453125, 4.8184814453125, 5.07073974609375, 5.322998046875, 5.57525634765625, 5.8275146484375, 6.07977294921875, 6.33203125]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 4.0, 3.0, 5.0, 6.0, 5.0, 3.0, 8.0, 8.0, 9.0, 10.0, 16.0, 22.0, 25.0, 24.0, 20.0, 34.0, 21.0, 40.0, 29.0, 39.0, 47.0, 54.0, 68.0, 206.0, 1626.0, 209.0, 83.0, 52.0, 28.0, 32.0, 34.0, 35.0, 29.0, 29.0, 26.0, 30.0, 25.0, 17.0, 11.0, 11.0, 10.0, 14.0, 11.0, 7.0, 12.0, 7.0, 2.0, 4.0, 0.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-20.328125, -19.661376953125, -18.99462890625, -18.327880859375, -17.6611328125, -16.994384765625, -16.32763671875, -15.660888671875, -14.994140625, -14.327392578125, -13.66064453125, -12.993896484375, -12.3271484375, -11.660400390625, -10.99365234375, -10.326904296875, -9.66015625, -8.993408203125, -8.32666015625, -7.659912109375, -6.9931640625, -6.326416015625, -5.65966796875, -4.992919921875, -4.326171875, -3.659423828125, -2.99267578125, -2.325927734375, -1.6591796875, -0.992431640625, -0.32568359375, 0.341064453125, 1.0078125, 1.674560546875, 2.34130859375, 3.008056640625, 3.6748046875, 4.341552734375, 5.00830078125, 5.675048828125, 6.341796875, 7.008544921875, 7.67529296875, 8.342041015625, 9.0087890625, 9.675537109375, 10.34228515625, 11.009033203125, 11.67578125, 12.342529296875, 13.00927734375, 13.676025390625, 14.3427734375, 15.009521484375, 15.67626953125, 16.343017578125, 17.009765625, 17.676513671875, 18.34326171875, 19.010009765625, 19.6767578125, 20.343505859375, 21.01025390625, 21.677001953125, 22.34375]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 6.0, 3.0, 8.0, 5.0, 11.0, 18.0, 26.0, 35.0, 41.0, 74.0, 133.0, 199.0, 305.0, 545.0, 2965.0, 3101445.0, 37726.0, 1095.0, 397.0, 234.0, 146.0, 109.0, 64.0, 36.0, 23.0, 13.0, 13.0, 12.0, 7.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-111.875, -108.990234375, -106.10546875, -103.220703125, -100.3359375, -97.451171875, -94.56640625, -91.681640625, -88.796875, -85.912109375, -83.02734375, -80.142578125, -77.2578125, -74.373046875, -71.48828125, -68.603515625, -65.71875, -62.833984375, -59.94921875, -57.064453125, -54.1796875, -51.294921875, -48.41015625, -45.525390625, -42.640625, -39.755859375, -36.87109375, -33.986328125, -31.1015625, -28.216796875, -25.33203125, -22.447265625, -19.5625, -16.677734375, -13.79296875, -10.908203125, -8.0234375, -5.138671875, -2.25390625, 0.630859375, 3.515625, 6.400390625, 9.28515625, 12.169921875, 15.0546875, 17.939453125, 20.82421875, 23.708984375, 26.59375, 29.478515625, 32.36328125, 35.248046875, 38.1328125, 41.017578125, 43.90234375, 46.787109375, 49.671875, 52.556640625, 55.44140625, 58.326171875, 61.2109375, 64.095703125, 66.98046875, 69.865234375, 72.75]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 7.0, 53.0, 250.0, 439.0, 222.0, 39.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.88502311706543, -7.67278528213501, -5.46054744720459, -3.24830961227417, -1.03607177734375, 1.1761665344238281, 3.38840389251709, 5.600641250610352, 7.81287956237793, 10.025117874145508, 12.23735523223877, 14.449592590332031, 16.66183090209961, 18.874069213867188, 21.086307525634766, 23.29854393005371, 25.51078224182129, 27.723020553588867, 29.935256958007812, 32.14749526977539, 34.35973358154297, 36.57197189331055, 38.784210205078125, 40.99644470214844, 43.20868682861328, 45.42092514038086, 47.63316345214844, 49.845401763916016, 52.057640075683594, 54.269874572753906, 56.482112884521484, 58.69435119628906, 60.906585693359375, 63.11882400512695, 65.33106231689453, 67.54329681396484, 69.75553894042969, 71.9677734375, 74.18001556396484, 76.39225006103516, 78.6044921875, 80.81672668457031, 83.02896881103516, 85.24120330810547, 87.45344543457031, 89.66567993164062, 91.87792205810547, 94.09015655517578, 96.3023910522461, 98.5146255493164, 100.72686767578125, 102.93910217285156, 105.1513442993164, 107.36357879638672, 109.57582092285156, 111.78805541992188, 114.00028991699219, 116.2125244140625, 118.42476654052734, 120.63700103759766, 122.8492431640625, 125.06147766113281, 127.27371978759766, 129.4859619140625, 131.6981964111328]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 5.0, 2.0, 6.0, 2.0, 8.0, 2.0, 8.0, 5.0, 15.0, 16.0, 20.0, 28.0, 26.0, 25.0, 30.0, 30.0, 53.0, 37.0, 38.0, 48.0, 45.0, 41.0, 47.0, 44.0, 52.0, 53.0, 33.0, 34.0, 44.0, 30.0, 40.0, 25.0, 13.0, 31.0, 13.0, 15.0, 14.0, 6.0, 5.0, 7.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-77.80258178710938, -75.69921875, -73.5958480834961, -71.49248504638672, -69.38911437988281, -67.28575134277344, -65.18238067626953, -63.079017639160156, -60.97564697265625, -58.87228012084961, -56.76891326904297, -54.66554641723633, -52.56217956542969, -50.45881271362305, -48.355445861816406, -46.25208282470703, -44.14871597290039, -42.04534912109375, -39.94198226928711, -37.83861541748047, -35.73524856567383, -33.63188171386719, -31.52851676940918, -29.42514991760254, -27.3217830657959, -25.218416213989258, -23.115049362182617, -21.01168441772461, -18.90831756591797, -16.804950714111328, -14.701583862304688, -12.598217010498047, -10.494850158691406, -8.391483306884766, -6.288116931915283, -4.184750556945801, -2.08138370513916, 0.02198314666748047, 2.1253490447998047, 4.228715896606445, 6.332082748413086, 8.435449600219727, 10.538816452026367, 12.642182350158691, 14.745549201965332, 16.848915100097656, 18.952281951904297, 21.055648803710938, 23.159015655517578, 25.26238250732422, 27.36574935913086, 29.4691162109375, 31.57248306274414, 33.67584991455078, 35.779212951660156, 37.88258361816406, 39.98594665527344, 42.08931350708008, 44.19268035888672, 46.29604721069336, 48.3994140625, 50.50278091430664, 52.60614776611328, 54.709510803222656, 56.81288146972656]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 9.0, 11.0, 13.0, 9.0, 11.0, 24.0, 15.0, 19.0, 31.0, 29.0, 23.0, 35.0, 27.0, 42.0, 34.0, 35.0, 53.0, 39.0, 54.0, 37.0, 45.0, 32.0, 37.0, 42.0, 41.0, 36.0, 38.0, 32.0, 28.0, 15.0, 16.0, 9.0, 12.0, 9.0, 12.0, 9.0, 5.0, 9.0, 8.0, 5.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0], "bins": [-8.6328125, -8.39654541015625, -8.1602783203125, -7.92401123046875, -7.687744140625, -7.45147705078125, -7.2152099609375, -6.97894287109375, -6.74267578125, -6.50640869140625, -6.2701416015625, -6.03387451171875, -5.797607421875, -5.56134033203125, -5.3250732421875, -5.08880615234375, -4.8525390625, -4.61627197265625, -4.3800048828125, -4.14373779296875, -3.907470703125, -3.67120361328125, -3.4349365234375, -3.19866943359375, -2.96240234375, -2.72613525390625, -2.4898681640625, -2.25360107421875, -2.017333984375, -1.78106689453125, -1.5447998046875, -1.30853271484375, -1.072265625, -0.83599853515625, -0.5997314453125, -0.36346435546875, -0.127197265625, 0.10906982421875, 0.3453369140625, 0.58160400390625, 0.81787109375, 1.05413818359375, 1.2904052734375, 1.52667236328125, 1.762939453125, 1.99920654296875, 2.2354736328125, 2.47174072265625, 2.7080078125, 2.94427490234375, 3.1805419921875, 3.41680908203125, 3.653076171875, 3.88934326171875, 4.1256103515625, 4.36187744140625, 4.59814453125, 4.83441162109375, 5.0706787109375, 5.30694580078125, 5.543212890625, 5.77947998046875, 6.0157470703125, 6.25201416015625, 6.48828125]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 5.0, 9.0, 8.0, 13.0, 13.0, 17.0, 20.0, 28.0, 46.0, 49.0, 49.0, 71.0, 79.0, 118.0, 170.0, 293.0, 561.0, 1727.0, 8916.0, 116723.0, 2079093.0, 1876139.0, 99024.0, 7934.0, 1668.0, 534.0, 282.0, 169.0, 121.0, 89.0, 49.0, 54.0, 35.0, 26.0, 30.0, 21.0, 22.0, 24.0, 17.0, 6.0, 8.0, 9.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-22.640625, -22.01123046875, -21.3818359375, -20.75244140625, -20.123046875, -19.49365234375, -18.8642578125, -18.23486328125, -17.60546875, -16.97607421875, -16.3466796875, -15.71728515625, -15.087890625, -14.45849609375, -13.8291015625, -13.19970703125, -12.5703125, -11.94091796875, -11.3115234375, -10.68212890625, -10.052734375, -9.42333984375, -8.7939453125, -8.16455078125, -7.53515625, -6.90576171875, -6.2763671875, -5.64697265625, -5.017578125, -4.38818359375, -3.7587890625, -3.12939453125, -2.5, -1.87060546875, -1.2412109375, -0.61181640625, 0.017578125, 0.64697265625, 1.2763671875, 1.90576171875, 2.53515625, 3.16455078125, 3.7939453125, 4.42333984375, 5.052734375, 5.68212890625, 6.3115234375, 6.94091796875, 7.5703125, 8.19970703125, 8.8291015625, 9.45849609375, 10.087890625, 10.71728515625, 11.3466796875, 11.97607421875, 12.60546875, 13.23486328125, 13.8642578125, 14.49365234375, 15.123046875, 15.75244140625, 16.3818359375, 17.01123046875, 17.640625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 4.0, 5.0, 4.0, 5.0, 16.0, 14.0, 29.0, 20.0, 50.0, 50.0, 70.0, 106.0, 136.0, 162.0, 210.0, 294.0, 368.0, 451.0, 432.0, 397.0, 317.0, 249.0, 164.0, 129.0, 104.0, 81.0, 53.0, 48.0, 28.0, 25.0, 14.0, 15.0, 7.0, 6.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.15625, -15.7078857421875, -15.259521484375, -14.8111572265625, -14.36279296875, -13.9144287109375, -13.466064453125, -13.0177001953125, -12.5693359375, -12.1209716796875, -11.672607421875, -11.2242431640625, -10.77587890625, -10.3275146484375, -9.879150390625, -9.4307861328125, -8.982421875, -8.5340576171875, -8.085693359375, -7.6373291015625, -7.18896484375, -6.7406005859375, -6.292236328125, -5.8438720703125, -5.3955078125, -4.9471435546875, -4.498779296875, -4.0504150390625, -3.60205078125, -3.1536865234375, -2.705322265625, -2.2569580078125, -1.80859375, -1.3602294921875, -0.911865234375, -0.4635009765625, -0.01513671875, 0.4332275390625, 0.881591796875, 1.3299560546875, 1.7783203125, 2.2266845703125, 2.675048828125, 3.1234130859375, 3.57177734375, 4.0201416015625, 4.468505859375, 4.9168701171875, 5.365234375, 5.8135986328125, 6.261962890625, 6.7103271484375, 7.15869140625, 7.6070556640625, 8.055419921875, 8.5037841796875, 8.9521484375, 9.4005126953125, 9.848876953125, 10.2972412109375, 10.74560546875, 11.1939697265625, 11.642333984375, 12.0906982421875, 12.5390625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 8.0, 6.0, 11.0, 15.0, 12.0, 19.0, 28.0, 56.0, 40.0, 68.0, 99.0, 101.0, 124.0, 196.0, 228.0, 293.0, 464.0, 1275.0, 90654.0, 4079293.0, 18788.0, 880.0, 390.0, 256.0, 246.0, 170.0, 126.0, 89.0, 91.0, 72.0, 46.0, 38.0, 35.0, 22.0, 13.0, 9.0, 5.0, 7.0, 7.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.34375, -59.10302734375, -56.8623046875, -54.62158203125, -52.380859375, -50.14013671875, -47.8994140625, -45.65869140625, -43.41796875, -41.17724609375, -38.9365234375, -36.69580078125, -34.455078125, -32.21435546875, -29.9736328125, -27.73291015625, -25.4921875, -23.25146484375, -21.0107421875, -18.77001953125, -16.529296875, -14.28857421875, -12.0478515625, -9.80712890625, -7.56640625, -5.32568359375, -3.0849609375, -0.84423828125, 1.396484375, 3.63720703125, 5.8779296875, 8.11865234375, 10.359375, 12.60009765625, 14.8408203125, 17.08154296875, 19.322265625, 21.56298828125, 23.8037109375, 26.04443359375, 28.28515625, 30.52587890625, 32.7666015625, 35.00732421875, 37.248046875, 39.48876953125, 41.7294921875, 43.97021484375, 46.2109375, 48.45166015625, 50.6923828125, 52.93310546875, 55.173828125, 57.41455078125, 59.6552734375, 61.89599609375, 64.13671875, 66.37744140625, 68.6181640625, 70.85888671875, 73.099609375, 75.34033203125, 77.5810546875, 79.82177734375, 82.0625]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 11.0, 14.0, 48.0, 85.0, 131.0, 173.0, 172.0, 161.0, 96.0, 58.0, 32.0, 11.0, 9.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-112.76527404785156, -110.2177963256836, -107.67031860351562, -105.12284851074219, -102.57537078857422, -100.02789306640625, -97.48041534423828, -94.93293762207031, -92.38545989990234, -89.83798217773438, -87.2905044555664, -84.74302673339844, -82.195556640625, -79.64807891845703, -77.10060119628906, -74.5531234741211, -72.00564575195312, -69.45816802978516, -66.91069030761719, -64.36322021484375, -61.815738677978516, -59.26826477050781, -56.720787048339844, -54.173309326171875, -51.62583923339844, -49.07836151123047, -46.530887603759766, -43.9834098815918, -41.43593215942383, -38.888458251953125, -36.340980529785156, -33.79350280761719, -31.24602508544922, -28.698549270629883, -26.151071548461914, -23.603595733642578, -21.05611801147461, -18.508642196655273, -15.961166381835938, -13.413688659667969, -10.866212844848633, -8.31873607635498, -5.771259784698486, -3.223783493041992, -0.6763067245483398, 1.8711700439453125, 4.418645858764648, 6.966123580932617, 9.513599395751953, 12.061076164245605, 14.608552932739258, 17.156028747558594, 19.703506469726562, 22.2509822845459, 24.798458099365234, 27.345935821533203, 29.89341163635254, 32.440887451171875, 34.988365173339844, 37.53584289550781, 40.083316802978516, 42.630794525146484, 45.17826843261719, 47.725746154785156, 50.273223876953125]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 5.0, 16.0, 14.0, 13.0, 16.0, 21.0, 27.0, 14.0, 15.0, 33.0, 28.0, 36.0, 40.0, 38.0, 38.0, 42.0, 44.0, 45.0, 49.0, 30.0, 45.0, 39.0, 54.0, 37.0, 31.0, 29.0, 31.0, 29.0, 20.0, 24.0, 20.0, 10.0, 17.0, 12.0, 10.0, 8.0, 5.0, 5.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-50.079833984375, -48.545677185058594, -47.01152038574219, -45.47736358642578, -43.943206787109375, -42.40904998779297, -40.87489318847656, -39.340736389160156, -37.80657958984375, -36.272422790527344, -34.73826599121094, -33.20410919189453, -31.669952392578125, -30.13579559326172, -28.601640701293945, -27.06748390197754, -25.533329010009766, -23.99917221069336, -22.465015411376953, -20.930858612060547, -19.39670181274414, -17.862545013427734, -16.32839012145996, -14.794233322143555, -13.260076522827148, -11.725919723510742, -10.191762924194336, -8.657607078552246, -7.12345027923584, -5.589293479919434, -4.055137634277344, -2.5209808349609375, -0.9868240356445312, 0.5473325252532959, 2.081489086151123, 3.615645408630371, 5.149802207946777, 6.683959007263184, 8.218114852905273, 9.75227165222168, 11.286428451538086, 12.820585250854492, 14.354742050170898, 15.888897895812988, 17.423053741455078, 18.957210540771484, 20.49136734008789, 22.025524139404297, 23.559680938720703, 25.09383773803711, 26.627994537353516, 28.162151336669922, 29.696308135986328, 31.230464935302734, 32.764617919921875, 34.29877471923828, 35.83293151855469, 37.367088317871094, 38.9012451171875, 40.435401916503906, 41.96955871582031, 43.50371551513672, 45.037872314453125, 46.57202911376953, 48.10618591308594]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 4.0, 6.0, 5.0, 11.0, 13.0, 10.0, 14.0, 21.0, 19.0, 29.0, 26.0, 33.0, 29.0, 34.0, 26.0, 41.0, 45.0, 46.0, 53.0, 48.0, 51.0, 60.0, 41.0, 38.0, 35.0, 39.0, 41.0, 36.0, 28.0, 15.0, 20.0, 15.0, 13.0, 9.0, 6.0, 14.0, 7.0, 7.0, 4.0, 3.0, 2.0, 6.0, 0.0, 3.0, 1.0, 1.0], "bins": [-9.265625, -9.0181884765625, -8.770751953125, -8.5233154296875, -8.27587890625, -8.0284423828125, -7.781005859375, -7.5335693359375, -7.2861328125, -7.0386962890625, -6.791259765625, -6.5438232421875, -6.29638671875, -6.0489501953125, -5.801513671875, -5.5540771484375, -5.306640625, -5.0592041015625, -4.811767578125, -4.5643310546875, -4.31689453125, -4.0694580078125, -3.822021484375, -3.5745849609375, -3.3271484375, -3.0797119140625, -2.832275390625, -2.5848388671875, -2.33740234375, -2.0899658203125, -1.842529296875, -1.5950927734375, -1.34765625, -1.1002197265625, -0.852783203125, -0.6053466796875, -0.35791015625, -0.1104736328125, 0.136962890625, 0.3843994140625, 0.6318359375, 0.8792724609375, 1.126708984375, 1.3741455078125, 1.62158203125, 1.8690185546875, 2.116455078125, 2.3638916015625, 2.611328125, 2.8587646484375, 3.106201171875, 3.3536376953125, 3.60107421875, 3.8485107421875, 4.095947265625, 4.3433837890625, 4.5908203125, 4.8382568359375, 5.085693359375, 5.3331298828125, 5.58056640625, 5.8280029296875, 6.075439453125, 6.3228759765625, 6.5703125]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 6.0, 5.0, 11.0, 8.0, 19.0, 25.0, 31.0, 41.0, 79.0, 124.0, 194.0, 293.0, 481.0, 717.0, 1180.0, 2023.0, 3324.0, 5669.0, 9528.0, 16388.0, 28751.0, 50588.0, 88526.0, 156397.0, 246604.0, 187778.0, 106856.0, 60624.0, 34753.0, 19656.0, 11197.0, 6677.0, 3939.0, 2321.0, 1470.0, 830.0, 511.0, 363.0, 217.0, 134.0, 93.0, 42.0, 26.0, 25.0, 14.0, 5.0, 8.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.82958984375, -0.7995986938476562, -0.7696075439453125, -0.7396163940429688, -0.709625244140625, -0.6796340942382812, -0.6496429443359375, -0.6196517944335938, -0.58966064453125, -0.5596694946289062, -0.5296783447265625, -0.49968719482421875, -0.469696044921875, -0.43970489501953125, -0.4097137451171875, -0.37972259521484375, -0.3497314453125, -0.31974029541015625, -0.2897491455078125, -0.25975799560546875, -0.229766845703125, -0.19977569580078125, -0.1697845458984375, -0.13979339599609375, -0.10980224609375, -0.07981109619140625, -0.0498199462890625, -0.01982879638671875, 0.010162353515625, 0.04015350341796875, 0.0701446533203125, 0.10013580322265625, 0.130126953125, 0.16011810302734375, 0.1901092529296875, 0.22010040283203125, 0.250091552734375, 0.28008270263671875, 0.3100738525390625, 0.34006500244140625, 0.37005615234375, 0.40004730224609375, 0.4300384521484375, 0.46002960205078125, 0.490020751953125, 0.5200119018554688, 0.5500030517578125, 0.5799942016601562, 0.6099853515625, 0.6399765014648438, 0.6699676513671875, 0.6999588012695312, 0.729949951171875, 0.7599411010742188, 0.7899322509765625, 0.8199234008789062, 0.84991455078125, 0.8799057006835938, 0.9098968505859375, 0.9398880004882812, 0.969879150390625, 0.9998703002929688, 1.0298614501953125, 1.0598526000976562, 1.08984375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 1.0, 0.0, 4.0, 4.0, 4.0, 5.0, 10.0, 9.0, 17.0, 17.0, 13.0, 30.0, 18.0, 25.0, 32.0, 35.0, 34.0, 29.0, 48.0, 38.0, 47.0, 40.0, 1063.0, 35.0, 45.0, 53.0, 43.0, 44.0, 39.0, 29.0, 31.0, 23.0, 30.0, 16.0, 22.0, 15.0, 13.0, 11.0, 15.0, 11.0, 5.0, 1.0, 4.0, 5.0, 4.0, 5.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.41796875, -4.2696533203125, -4.121337890625, -3.9730224609375, -3.82470703125, -3.6763916015625, -3.528076171875, -3.3797607421875, -3.2314453125, -3.0831298828125, -2.934814453125, -2.7864990234375, -2.63818359375, -2.4898681640625, -2.341552734375, -2.1932373046875, -2.044921875, -1.8966064453125, -1.748291015625, -1.5999755859375, -1.45166015625, -1.3033447265625, -1.155029296875, -1.0067138671875, -0.8583984375, -0.7100830078125, -0.561767578125, -0.4134521484375, -0.26513671875, -0.1168212890625, 0.031494140625, 0.1798095703125, 0.328125, 0.4764404296875, 0.624755859375, 0.7730712890625, 0.92138671875, 1.0697021484375, 1.218017578125, 1.3663330078125, 1.5146484375, 1.6629638671875, 1.811279296875, 1.9595947265625, 2.10791015625, 2.2562255859375, 2.404541015625, 2.5528564453125, 2.701171875, 2.8494873046875, 2.997802734375, 3.1461181640625, 3.29443359375, 3.4427490234375, 3.591064453125, 3.7393798828125, 3.8876953125, 4.0360107421875, 4.184326171875, 4.3326416015625, 4.48095703125, 4.6292724609375, 4.777587890625, 4.9259033203125, 5.07421875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 6.0, 4.0, 11.0, 17.0, 23.0, 26.0, 29.0, 50.0, 83.0, 133.0, 142.0, 217.0, 313.0, 491.0, 699.0, 967.0, 1482.0, 2160.0, 3382.0, 5165.0, 7710.0, 12140.0, 19296.0, 30744.0, 49216.0, 79040.0, 130933.0, 1251747.0, 191988.0, 117109.0, 70895.0, 43802.0, 27336.0, 17567.0, 11248.0, 7016.0, 4705.0, 3041.0, 1974.0, 1327.0, 880.0, 582.0, 433.0, 337.0, 178.0, 151.0, 90.0, 96.0, 49.0, 36.0, 27.0, 17.0, 11.0, 3.0, 10.0, 2.0, 3.0, 3.0, 0.0, 3.0], "bins": [-0.75634765625, -0.7326278686523438, -0.7089080810546875, -0.6851882934570312, -0.661468505859375, -0.6377487182617188, -0.6140289306640625, -0.5903091430664062, -0.56658935546875, -0.5428695678710938, -0.5191497802734375, -0.49542999267578125, -0.471710205078125, -0.44799041748046875, -0.4242706298828125, -0.40055084228515625, -0.3768310546875, -0.35311126708984375, -0.3293914794921875, -0.30567169189453125, -0.281951904296875, -0.25823211669921875, -0.2345123291015625, -0.21079254150390625, -0.18707275390625, -0.16335296630859375, -0.1396331787109375, -0.11591339111328125, -0.092193603515625, -0.06847381591796875, -0.0447540283203125, -0.02103424072265625, 0.002685546875, 0.02640533447265625, 0.0501251220703125, 0.07384490966796875, 0.097564697265625, 0.12128448486328125, 0.1450042724609375, 0.16872406005859375, 0.19244384765625, 0.21616363525390625, 0.2398834228515625, 0.26360321044921875, 0.287322998046875, 0.31104278564453125, 0.3347625732421875, 0.35848236083984375, 0.3822021484375, 0.40592193603515625, 0.4296417236328125, 0.45336151123046875, 0.477081298828125, 0.5008010864257812, 0.5245208740234375, 0.5482406616210938, 0.57196044921875, 0.5956802368164062, 0.6194000244140625, 0.6431198120117188, 0.666839599609375, 0.6905593872070312, 0.7142791748046875, 0.7379989624023438, 0.76171875]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 3.0, 3.0, 2.0, 11.0, 9.0, 7.0, 12.0, 16.0, 21.0, 27.0, 33.0, 36.0, 50.0, 53.0, 59.0, 59.0, 63.0, 70.0, 61.0, 49.0, 64.0, 49.0, 40.0, 42.0, 30.0, 26.0, 22.0, 21.0, 7.0, 12.0, 14.0, 8.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0], "bins": [-0.00348663330078125, -0.0033979415893554688, -0.0033092498779296875, -0.0032205581665039062, -0.003131866455078125, -0.0030431747436523438, -0.0029544830322265625, -0.0028657913208007812, -0.002777099609375, -0.0026884078979492188, -0.0025997161865234375, -0.0025110244750976562, -0.002422332763671875, -0.0023336410522460938, -0.0022449493408203125, -0.0021562576293945312, -0.00206756591796875, -0.0019788742065429688, -0.0018901824951171875, -0.0018014907836914062, -0.001712799072265625, -0.0016241073608398438, -0.0015354156494140625, -0.0014467239379882812, -0.0013580322265625, -0.0012693405151367188, -0.0011806488037109375, -0.0010919570922851562, -0.001003265380859375, -0.0009145736694335938, -0.0008258819580078125, -0.0007371902465820312, -0.00064849853515625, -0.0005598068237304688, -0.0004711151123046875, -0.00038242340087890625, -0.000293731689453125, -0.00020503997802734375, -0.0001163482666015625, -2.765655517578125e-05, 6.103515625e-05, 0.00014972686767578125, 0.0002384185791015625, 0.00032711029052734375, 0.000415802001953125, 0.0005044937133789062, 0.0005931854248046875, 0.0006818771362304688, 0.00077056884765625, 0.0008592605590820312, 0.0009479522705078125, 0.0010366439819335938, 0.001125335693359375, 0.0012140274047851562, 0.0013027191162109375, 0.0013914108276367188, 0.0014801025390625, 0.0015687942504882812, 0.0016574859619140625, 0.0017461776733398438, 0.001834869384765625, 0.0019235610961914062, 0.0020122528076171875, 0.0021009445190429688, 0.00218963623046875]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 5.0, 4.0, 12.0, 6.0, 12.0, 23.0, 17.0, 23.0, 41.0, 39.0, 53.0, 81.0, 107.0, 207.0, 473.0, 2127.0, 1028758.0, 15147.0, 667.0, 265.0, 133.0, 86.0, 62.0, 42.0, 39.0, 28.0, 21.0, 18.0, 8.0, 12.0, 8.0, 5.0, 6.0, 3.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.056884765625, -0.05466938018798828, -0.05245399475097656, -0.050238609313964844, -0.048023223876953125, -0.045807838439941406, -0.04359245300292969, -0.04137706756591797, -0.03916168212890625, -0.03694629669189453, -0.03473091125488281, -0.032515525817871094, -0.030300140380859375, -0.028084754943847656, -0.025869369506835938, -0.02365398406982422, -0.0214385986328125, -0.01922321319580078, -0.017007827758789062, -0.014792442321777344, -0.012577056884765625, -0.010361671447753906, -0.008146286010742188, -0.005930900573730469, -0.00371551513671875, -0.0015001296997070312, 0.0007152557373046875, 0.0029306411743164062, 0.005146026611328125, 0.007361412048339844, 0.009576797485351562, 0.011792182922363281, 0.014007568359375, 0.01622295379638672, 0.018438339233398438, 0.020653724670410156, 0.022869110107421875, 0.025084495544433594, 0.027299880981445312, 0.02951526641845703, 0.03173065185546875, 0.03394603729248047, 0.03616142272949219, 0.038376808166503906, 0.040592193603515625, 0.042807579040527344, 0.04502296447753906, 0.04723834991455078, 0.0494537353515625, 0.05166912078857422, 0.05388450622558594, 0.056099891662597656, 0.058315277099609375, 0.060530662536621094, 0.06274604797363281, 0.06496143341064453, 0.06717681884765625, 0.06939220428466797, 0.07160758972167969, 0.0738229751586914, 0.07603836059570312, 0.07825374603271484, 0.08046913146972656, 0.08268451690673828, 0.08489990234375]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 41.0, 161.0, 352.0, 303.0, 118.0, 22.0, 7.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008545036427676678, -0.008389276452362537, -0.008233517408370972, -0.008077757433056831, -0.007921997457742691, -0.007766237482428551, -0.007610477972775698, -0.007454718463122845, -0.007298958487808704, -0.007143198512494564, -0.006987439002841711, -0.006831679493188858, -0.006675919517874718, -0.006520159542560577, -0.006364400032907724, -0.006208640523254871, -0.006052880547940731, -0.005897120572626591, -0.005741361062973738, -0.005585601553320885, -0.005429841578006744, -0.005274081602692604, -0.005118322093039751, -0.004962562583386898, -0.004806802608072758, -0.004651042632758617, -0.004495283123105764, -0.004339523613452911, -0.004183763638138771, -0.004028003662824631, -0.0038722441531717777, -0.003716484410688281, -0.0035607246682047844, -0.0034049649257212877, -0.003249205183237791, -0.0030934454407542944, -0.0029376856982707977, -0.002781925955787301, -0.0026261662133038044, -0.0024704064708203077, -0.002314646728336811, -0.0021588869858533144, -0.0020031272433698177, -0.001847367500886321, -0.0016916077584028244, -0.0015358480159193277, -0.001380088273435831, -0.0012243285309523344, -0.0010685687884688377, -0.0009128090459853411, -0.0007570493035018444, -0.0006012895610183477, -0.0004455298185348511, -0.0002897700760513544, -0.00013401033356785774, 2.1749408915638924e-05, 0.0001775091513991356, 0.00033326889388263226, 0.0004890286363661289, 0.0006447883788496256, 0.0008005481213331223, 0.0009563078638166189, 0.0011120676063001156, 0.0012678273487836123, 0.001423587091267109]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 8.0, 9.0, 8.0, 5.0, 12.0, 11.0, 15.0, 20.0, 23.0, 20.0, 25.0, 25.0, 39.0, 31.0, 27.0, 37.0, 40.0, 46.0, 38.0, 45.0, 34.0, 49.0, 50.0, 48.0, 44.0, 34.0, 34.0, 31.0, 31.0, 35.0, 27.0, 15.0, 17.0, 14.0, 13.0, 11.0, 5.0, 7.0, 5.0, 6.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0014801025390625, -0.0014339238405227661, -0.0013877451419830322, -0.0013415664434432983, -0.0012953877449035645, -0.0012492090463638306, -0.0012030303478240967, -0.0011568516492843628, -0.001110672950744629, -0.001064494252204895, -0.0010183155536651611, -0.0009721368551254272, -0.0009259581565856934, -0.0008797794580459595, -0.0008336007595062256, -0.0007874220609664917, -0.0007412433624267578, -0.0006950646638870239, -0.00064888596534729, -0.0006027072668075562, -0.0005565285682678223, -0.0005103498697280884, -0.0004641711711883545, -0.0004179924726486206, -0.0003718137741088867, -0.00032563507556915283, -0.00027945637702941895, -0.00023327767848968506, -0.00018709897994995117, -0.00014092028141021729, -9.47415828704834e-05, -4.856288433074951e-05, -2.384185791015625e-06, 4.379451274871826e-05, 8.997321128845215e-05, 0.00013615190982818604, 0.00018233060836791992, 0.0002285093069076538, 0.0002746880054473877, 0.0003208667039871216, 0.00036704540252685547, 0.00041322410106658936, 0.00045940279960632324, 0.0005055814981460571, 0.000551760196685791, 0.0005979388952255249, 0.0006441175937652588, 0.0006902962923049927, 0.0007364749908447266, 0.0007826536893844604, 0.0008288323879241943, 0.0008750110864639282, 0.0009211897850036621, 0.000967368483543396, 0.0010135471820831299, 0.0010597258806228638, 0.0011059045791625977, 0.0011520832777023315, 0.0011982619762420654, 0.0012444406747817993, 0.0012906193733215332, 0.001336798071861267, 0.001382976770401001, 0.0014291554689407349, 0.0014753341674804688]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 4.0, 6.0, 4.0, 12.0, 13.0, 10.0, 14.0, 21.0, 18.0, 30.0, 26.0, 33.0, 29.0, 33.0, 26.0, 42.0, 45.0, 45.0, 54.0, 48.0, 49.0, 61.0, 41.0, 39.0, 35.0, 39.0, 41.0, 36.0, 26.0, 17.0, 20.0, 15.0, 13.0, 9.0, 6.0, 14.0, 7.0, 7.0, 4.0, 3.0, 2.0, 6.0, 0.0, 3.0, 1.0, 1.0], "bins": [-9.265625, -9.01824951171875, -8.7708740234375, -8.52349853515625, -8.276123046875, -8.02874755859375, -7.7813720703125, -7.53399658203125, -7.28662109375, -7.03924560546875, -6.7918701171875, -6.54449462890625, -6.297119140625, -6.04974365234375, -5.8023681640625, -5.55499267578125, -5.3076171875, -5.06024169921875, -4.8128662109375, -4.56549072265625, -4.318115234375, -4.07073974609375, -3.8233642578125, -3.57598876953125, -3.32861328125, -3.08123779296875, -2.8338623046875, -2.58648681640625, -2.339111328125, -2.09173583984375, -1.8443603515625, -1.59698486328125, -1.349609375, -1.10223388671875, -0.8548583984375, -0.60748291015625, -0.360107421875, -0.11273193359375, 0.1346435546875, 0.38201904296875, 0.62939453125, 0.87677001953125, 1.1241455078125, 1.37152099609375, 1.618896484375, 1.86627197265625, 2.1136474609375, 2.36102294921875, 2.6083984375, 2.85577392578125, 3.1031494140625, 3.35052490234375, 3.597900390625, 3.84527587890625, 4.0926513671875, 4.34002685546875, 4.58740234375, 4.83477783203125, 5.0821533203125, 5.32952880859375, 5.576904296875, 5.82427978515625, 6.0716552734375, 6.31903076171875, 6.56640625]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 1.0, 6.0, 10.0, 12.0, 13.0, 16.0, 28.0, 55.0, 89.0, 114.0, 220.0, 345.0, 666.0, 1262.0, 2520.0, 5384.0, 11801.0, 27633.0, 68539.0, 191210.0, 431228.0, 189425.0, 68084.0, 27290.0, 12025.0, 5289.0, 2483.0, 1254.0, 639.0, 354.0, 202.0, 138.0, 68.0, 51.0, 34.0, 25.0, 10.0, 8.0, 10.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-5.85546875, -5.6695556640625, -5.483642578125, -5.2977294921875, -5.11181640625, -4.9259033203125, -4.739990234375, -4.5540771484375, -4.3681640625, -4.1822509765625, -3.996337890625, -3.8104248046875, -3.62451171875, -3.4385986328125, -3.252685546875, -3.0667724609375, -2.880859375, -2.6949462890625, -2.509033203125, -2.3231201171875, -2.13720703125, -1.9512939453125, -1.765380859375, -1.5794677734375, -1.3935546875, -1.2076416015625, -1.021728515625, -0.8358154296875, -0.64990234375, -0.4639892578125, -0.278076171875, -0.0921630859375, 0.09375, 0.2796630859375, 0.465576171875, 0.6514892578125, 0.83740234375, 1.0233154296875, 1.209228515625, 1.3951416015625, 1.5810546875, 1.7669677734375, 1.952880859375, 2.1387939453125, 2.32470703125, 2.5106201171875, 2.696533203125, 2.8824462890625, 3.068359375, 3.2542724609375, 3.440185546875, 3.6260986328125, 3.81201171875, 3.9979248046875, 4.183837890625, 4.3697509765625, 4.5556640625, 4.7415771484375, 4.927490234375, 5.1134033203125, 5.29931640625, 5.4852294921875, 5.671142578125, 5.8570556640625, 6.04296875]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 4.0, 5.0, 3.0, 5.0, 4.0, 4.0, 9.0, 10.0, 9.0, 20.0, 12.0, 18.0, 18.0, 21.0, 28.0, 35.0, 37.0, 38.0, 40.0, 56.0, 49.0, 89.0, 184.0, 1570.0, 286.0, 99.0, 51.0, 34.0, 42.0, 36.0, 28.0, 41.0, 28.0, 24.0, 16.0, 16.0, 15.0, 15.0, 12.0, 9.0, 10.0, 6.0, 5.0, 1.0, 9.0, 4.0, 0.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-26.171875, -25.41650390625, -24.6611328125, -23.90576171875, -23.150390625, -22.39501953125, -21.6396484375, -20.88427734375, -20.12890625, -19.37353515625, -18.6181640625, -17.86279296875, -17.107421875, -16.35205078125, -15.5966796875, -14.84130859375, -14.0859375, -13.33056640625, -12.5751953125, -11.81982421875, -11.064453125, -10.30908203125, -9.5537109375, -8.79833984375, -8.04296875, -7.28759765625, -6.5322265625, -5.77685546875, -5.021484375, -4.26611328125, -3.5107421875, -2.75537109375, -2.0, -1.24462890625, -0.4892578125, 0.26611328125, 1.021484375, 1.77685546875, 2.5322265625, 3.28759765625, 4.04296875, 4.79833984375, 5.5537109375, 6.30908203125, 7.064453125, 7.81982421875, 8.5751953125, 9.33056640625, 10.0859375, 10.84130859375, 11.5966796875, 12.35205078125, 13.107421875, 13.86279296875, 14.6181640625, 15.37353515625, 16.12890625, 16.88427734375, 17.6396484375, 18.39501953125, 19.150390625, 19.90576171875, 20.6611328125, 21.41650390625, 22.171875]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 4.0, 4.0, 2.0, 5.0, 9.0, 9.0, 15.0, 18.0, 16.0, 25.0, 26.0, 45.0, 65.0, 77.0, 120.0, 152.0, 205.0, 336.0, 572.0, 4498.0, 3064999.0, 71799.0, 1246.0, 449.0, 313.0, 176.0, 139.0, 102.0, 68.0, 60.0, 38.0, 29.0, 21.0, 18.0, 16.0, 12.0, 6.0, 7.0, 5.0, 5.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-80.875, -78.67431640625, -76.4736328125, -74.27294921875, -72.072265625, -69.87158203125, -67.6708984375, -65.47021484375, -63.26953125, -61.06884765625, -58.8681640625, -56.66748046875, -54.466796875, -52.26611328125, -50.0654296875, -47.86474609375, -45.6640625, -43.46337890625, -41.2626953125, -39.06201171875, -36.861328125, -34.66064453125, -32.4599609375, -30.25927734375, -28.05859375, -25.85791015625, -23.6572265625, -21.45654296875, -19.255859375, -17.05517578125, -14.8544921875, -12.65380859375, -10.453125, -8.25244140625, -6.0517578125, -3.85107421875, -1.650390625, 0.55029296875, 2.7509765625, 4.95166015625, 7.15234375, 9.35302734375, 11.5537109375, 13.75439453125, 15.955078125, 18.15576171875, 20.3564453125, 22.55712890625, 24.7578125, 26.95849609375, 29.1591796875, 31.35986328125, 33.560546875, 35.76123046875, 37.9619140625, 40.16259765625, 42.36328125, 44.56396484375, 46.7646484375, 48.96533203125, 51.166015625, 53.36669921875, 55.5673828125, 57.76806640625, 59.96875]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 33.0, 288.0, 533.0, 150.0, 8.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-183.6324005126953, -180.37060546875, -177.10879516601562, -173.8470001220703, -170.585205078125, -167.32339477539062, -164.0615997314453, -160.7998046875, -157.53799438476562, -154.2761993408203, -151.01438903808594, -147.75259399414062, -144.4907989501953, -141.22898864746094, -137.96719360351562, -134.7053985595703, -131.443603515625, -128.1818084716797, -124.92000579833984, -121.658203125, -118.39640045166016, -115.13459777832031, -111.872802734375, -108.61100006103516, -105.34919738769531, -102.08739471435547, -98.82559967041016, -95.56379699707031, -92.30199432373047, -89.04019165039062, -85.77839660644531, -82.51659393310547, -79.25479125976562, -75.99298858642578, -72.73119354248047, -69.46939086914062, -66.20758819580078, -62.9457893371582, -59.683990478515625, -56.42218780517578, -53.1603889465332, -49.898590087890625, -46.63678741455078, -43.3749885559082, -40.113189697265625, -36.85138702392578, -33.5895881652832, -30.327787399291992, -27.06598663330078, -23.80418586730957, -20.54238510131836, -17.28058624267578, -14.01878547668457, -10.75698471069336, -7.495185852050781, -4.23338508605957, -0.9715843200683594, 2.2902159690856934, 5.552016258239746, 8.81381607055664, 12.075616836547852, 15.337417602539062, 18.59921646118164, 21.86101722717285, 25.122817993164062]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 5.0, 3.0, 2.0, 7.0, 5.0, 8.0, 14.0, 9.0, 10.0, 14.0, 22.0, 20.0, 23.0, 29.0, 30.0, 32.0, 44.0, 39.0, 52.0, 31.0, 44.0, 50.0, 45.0, 53.0, 50.0, 42.0, 46.0, 45.0, 38.0, 33.0, 27.0, 19.0, 23.0, 17.0, 17.0, 16.0, 9.0, 8.0, 9.0, 2.0, 9.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-61.78178787231445, -59.80503845214844, -57.828285217285156, -55.85153579711914, -53.874786376953125, -51.898033142089844, -49.92128372192383, -47.94453430175781, -45.96778106689453, -43.991031646728516, -42.014278411865234, -40.03752899169922, -38.0607795715332, -36.08403015136719, -34.107276916503906, -32.13052749633789, -30.153778076171875, -28.177026748657227, -26.20027732849121, -24.223526000976562, -22.246776580810547, -20.2700252532959, -18.29327392578125, -16.316524505615234, -14.339773178100586, -12.363022804260254, -10.386272430419922, -8.409521102905273, -6.432770729064941, -4.456020355224609, -2.479269027709961, -0.5025186538696289, 1.4742355346679688, 3.45098614692688, 5.427736759185791, 7.404487609863281, 9.381237983703613, 11.357988357543945, 13.334739685058594, 15.311490058898926, 17.288240432739258, 19.264991760253906, 21.241741180419922, 23.21849250793457, 25.19524383544922, 27.171993255615234, 29.148744583129883, 31.12549591064453, 33.10224533081055, 35.07899475097656, 37.055747985839844, 39.03249740600586, 41.009246826171875, 42.986000061035156, 44.96274948120117, 46.93949890136719, 48.91625213623047, 50.893001556396484, 52.869754791259766, 54.84650421142578, 56.8232536315918, 58.80000305175781, 60.776756286621094, 62.75350570678711, 64.73025512695312]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 7.0, 7.0, 6.0, 10.0, 13.0, 14.0, 13.0, 16.0, 27.0, 25.0, 28.0, 32.0, 37.0, 36.0, 46.0, 35.0, 41.0, 46.0, 41.0, 43.0, 63.0, 53.0, 38.0, 40.0, 33.0, 40.0, 38.0, 22.0, 27.0, 23.0, 16.0, 11.0, 11.0, 7.0, 15.0, 10.0, 6.0, 6.0, 9.0, 1.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0], "bins": [-9.4609375, -9.205322265625, -8.94970703125, -8.694091796875, -8.4384765625, -8.182861328125, -7.92724609375, -7.671630859375, -7.416015625, -7.160400390625, -6.90478515625, -6.649169921875, -6.3935546875, -6.137939453125, -5.88232421875, -5.626708984375, -5.37109375, -5.115478515625, -4.85986328125, -4.604248046875, -4.3486328125, -4.093017578125, -3.83740234375, -3.581787109375, -3.326171875, -3.070556640625, -2.81494140625, -2.559326171875, -2.3037109375, -2.048095703125, -1.79248046875, -1.536865234375, -1.28125, -1.025634765625, -0.77001953125, -0.514404296875, -0.2587890625, -0.003173828125, 0.25244140625, 0.508056640625, 0.763671875, 1.019287109375, 1.27490234375, 1.530517578125, 1.7861328125, 2.041748046875, 2.29736328125, 2.552978515625, 2.80859375, 3.064208984375, 3.31982421875, 3.575439453125, 3.8310546875, 4.086669921875, 4.34228515625, 4.597900390625, 4.853515625, 5.109130859375, 5.36474609375, 5.620361328125, 5.8759765625, 6.131591796875, 6.38720703125, 6.642822265625, 6.8984375]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 6.0, 4.0, 12.0, 10.0, 12.0, 12.0, 16.0, 16.0, 31.0, 29.0, 34.0, 55.0, 96.0, 184.0, 344.0, 850.0, 3430.0, 38590.0, 2113743.0, 1995634.0, 36439.0, 3132.0, 829.0, 301.0, 137.0, 85.0, 56.0, 42.0, 29.0, 17.0, 18.0, 11.0, 17.0, 9.0, 7.0, 9.0, 8.0, 6.0, 8.0, 5.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.625, -31.718505859375, -30.81201171875, -29.905517578125, -28.9990234375, -28.092529296875, -27.18603515625, -26.279541015625, -25.373046875, -24.466552734375, -23.56005859375, -22.653564453125, -21.7470703125, -20.840576171875, -19.93408203125, -19.027587890625, -18.12109375, -17.214599609375, -16.30810546875, -15.401611328125, -14.4951171875, -13.588623046875, -12.68212890625, -11.775634765625, -10.869140625, -9.962646484375, -9.05615234375, -8.149658203125, -7.2431640625, -6.336669921875, -5.43017578125, -4.523681640625, -3.6171875, -2.710693359375, -1.80419921875, -0.897705078125, 0.0087890625, 0.915283203125, 1.82177734375, 2.728271484375, 3.634765625, 4.541259765625, 5.44775390625, 6.354248046875, 7.2607421875, 8.167236328125, 9.07373046875, 9.980224609375, 10.88671875, 11.793212890625, 12.69970703125, 13.606201171875, 14.5126953125, 15.419189453125, 16.32568359375, 17.232177734375, 18.138671875, 19.045166015625, 19.95166015625, 20.858154296875, 21.7646484375, 22.671142578125, 23.57763671875, 24.484130859375, 25.390625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 4.0, 3.0, 7.0, 6.0, 5.0, 15.0, 20.0, 16.0, 27.0, 30.0, 53.0, 50.0, 75.0, 81.0, 90.0, 150.0, 184.0, 205.0, 303.0, 369.0, 436.0, 377.0, 317.0, 301.0, 242.0, 155.0, 128.0, 95.0, 72.0, 59.0, 39.0, 40.0, 24.0, 27.0, 17.0, 18.0, 13.0, 8.0, 7.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.59375, -11.1915283203125, -10.789306640625, -10.3870849609375, -9.98486328125, -9.5826416015625, -9.180419921875, -8.7781982421875, -8.3759765625, -7.9737548828125, -7.571533203125, -7.1693115234375, -6.76708984375, -6.3648681640625, -5.962646484375, -5.5604248046875, -5.158203125, -4.7559814453125, -4.353759765625, -3.9515380859375, -3.54931640625, -3.1470947265625, -2.744873046875, -2.3426513671875, -1.9404296875, -1.5382080078125, -1.135986328125, -0.7337646484375, -0.33154296875, 0.0706787109375, 0.472900390625, 0.8751220703125, 1.27734375, 1.6795654296875, 2.081787109375, 2.4840087890625, 2.88623046875, 3.2884521484375, 3.690673828125, 4.0928955078125, 4.4951171875, 4.8973388671875, 5.299560546875, 5.7017822265625, 6.10400390625, 6.5062255859375, 6.908447265625, 7.3106689453125, 7.712890625, 8.1151123046875, 8.517333984375, 8.9195556640625, 9.32177734375, 9.7239990234375, 10.126220703125, 10.5284423828125, 10.9306640625, 11.3328857421875, 11.735107421875, 12.1373291015625, 12.53955078125, 12.9417724609375, 13.343994140625, 13.7462158203125, 14.1484375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 4.0, 9.0, 8.0, 7.0, 11.0, 11.0, 26.0, 18.0, 38.0, 49.0, 66.0, 61.0, 79.0, 98.0, 113.0, 173.0, 181.0, 254.0, 364.0, 687.0, 5324.0, 2775443.0, 1405573.0, 3553.0, 598.0, 332.0, 254.0, 183.0, 136.0, 120.0, 103.0, 70.0, 81.0, 64.0, 43.0, 35.0, 32.0, 21.0, 20.0, 10.0, 11.0, 9.0, 3.0, 1.0, 4.0, 5.0, 2.0, 3.0, 0.0, 1.0], "bins": [-75.5, -73.39990234375, -71.2998046875, -69.19970703125, -67.099609375, -64.99951171875, -62.8994140625, -60.79931640625, -58.69921875, -56.59912109375, -54.4990234375, -52.39892578125, -50.298828125, -48.19873046875, -46.0986328125, -43.99853515625, -41.8984375, -39.79833984375, -37.6982421875, -35.59814453125, -33.498046875, -31.39794921875, -29.2978515625, -27.19775390625, -25.09765625, -22.99755859375, -20.8974609375, -18.79736328125, -16.697265625, -14.59716796875, -12.4970703125, -10.39697265625, -8.296875, -6.19677734375, -4.0966796875, -1.99658203125, 0.103515625, 2.20361328125, 4.3037109375, 6.40380859375, 8.50390625, 10.60400390625, 12.7041015625, 14.80419921875, 16.904296875, 19.00439453125, 21.1044921875, 23.20458984375, 25.3046875, 27.40478515625, 29.5048828125, 31.60498046875, 33.705078125, 35.80517578125, 37.9052734375, 40.00537109375, 42.10546875, 44.20556640625, 46.3056640625, 48.40576171875, 50.505859375, 52.60595703125, 54.7060546875, 56.80615234375, 58.90625]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 34.0, 86.0, 162.0, 294.0, 240.0, 127.0, 50.0, 11.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.5203628540039, -86.55103302001953, -82.58169555664062, -78.61236572265625, -74.64303588867188, -70.67369842529297, -66.7043685913086, -62.73503494262695, -58.76570129394531, -54.79636764526367, -50.82703399658203, -46.857704162597656, -42.888370513916016, -38.919036865234375, -34.94970703125, -30.98037338256836, -27.01103973388672, -23.041706085205078, -19.07237434387207, -15.103041648864746, -11.133708953857422, -7.164375305175781, -3.1950435638427734, 0.7742881774902344, 4.743621826171875, 8.7129545211792, 12.682287216186523, 16.65161895751953, 20.620952606201172, 24.590286254882812, 28.55961799621582, 32.52894973754883, 36.498291015625, 40.46762466430664, 44.43695831298828, 48.406288146972656, 52.3756217956543, 56.34495544433594, 60.31428527832031, 64.28361511230469, 68.2529525756836, 72.22228240966797, 76.19161987304688, 80.16094970703125, 84.13027954101562, 88.09961700439453, 92.0689468383789, 96.03828430175781, 100.00761413574219, 103.97694396972656, 107.94628143310547, 111.91561126708984, 115.88494873046875, 119.85427856445312, 123.8236083984375, 127.79293823242188, 131.76226806640625, 135.73159790039062, 139.700927734375, 143.67027282714844, 147.6396026611328, 151.6089324951172, 155.57826232910156, 159.54759216308594, 163.51693725585938]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 3.0, 8.0, 8.0, 11.0, 15.0, 18.0, 8.0, 18.0, 21.0, 22.0, 25.0, 16.0, 30.0, 30.0, 37.0, 36.0, 42.0, 42.0, 45.0, 45.0, 33.0, 39.0, 42.0, 32.0, 45.0, 43.0, 37.0, 26.0, 27.0, 17.0, 28.0, 25.0, 23.0, 14.0, 23.0, 12.0, 10.0, 7.0, 5.0, 10.0, 4.0, 3.0, 6.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-48.53730773925781, -47.08234786987305, -45.62739181518555, -44.17243194580078, -42.71747589111328, -41.262516021728516, -39.80755615234375, -38.35260009765625, -36.89764404296875, -35.442684173583984, -33.987728118896484, -32.53276824951172, -31.07781219482422, -29.622852325439453, -28.16789436340332, -26.712936401367188, -25.257976531982422, -23.80301856994629, -22.348060607910156, -20.89310073852539, -19.43814468383789, -17.983184814453125, -16.528226852416992, -15.07326889038086, -13.618310928344727, -12.163352966308594, -10.708395004272461, -9.253436088562012, -7.798478126525879, -6.343520164489746, -4.888561248779297, -3.433603286743164, -1.9786453247070312, -0.5236871242523193, 0.9312710762023926, 2.3862295150756836, 3.8411874771118164, 5.296145439147949, 6.751104354858398, 8.206062316894531, 9.661020278930664, 11.115978240966797, 12.57093620300293, 14.025895118713379, 15.480853080749512, 16.935810089111328, 18.390769958496094, 19.845727920532227, 21.30068588256836, 22.755643844604492, 24.210601806640625, 25.66556167602539, 27.12051773071289, 28.575477600097656, 30.03043556213379, 31.485393524169922, 32.94035339355469, 34.39531326293945, 35.85026931762695, 37.30522918701172, 38.76018524169922, 40.215145111083984, 41.67010498046875, 43.12506103515625, 44.58001708984375]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 6.0, 9.0, 8.0, 8.0, 8.0, 17.0, 22.0, 13.0, 19.0, 23.0, 29.0, 29.0, 32.0, 45.0, 35.0, 38.0, 34.0, 41.0, 45.0, 51.0, 58.0, 45.0, 51.0, 38.0, 40.0, 35.0, 35.0, 41.0, 36.0, 18.0, 14.0, 19.0, 12.0, 11.0, 12.0, 10.0, 5.0, 3.0, 6.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.7421875, -8.48065185546875, -8.2191162109375, -7.95758056640625, -7.696044921875, -7.43450927734375, -7.1729736328125, -6.91143798828125, -6.64990234375, -6.38836669921875, -6.1268310546875, -5.86529541015625, -5.603759765625, -5.34222412109375, -5.0806884765625, -4.81915283203125, -4.5576171875, -4.29608154296875, -4.0345458984375, -3.77301025390625, -3.511474609375, -3.24993896484375, -2.9884033203125, -2.72686767578125, -2.46533203125, -2.20379638671875, -1.9422607421875, -1.68072509765625, -1.419189453125, -1.15765380859375, -0.8961181640625, -0.63458251953125, -0.373046875, -0.11151123046875, 0.1500244140625, 0.41156005859375, 0.673095703125, 0.93463134765625, 1.1961669921875, 1.45770263671875, 1.71923828125, 1.98077392578125, 2.2423095703125, 2.50384521484375, 2.765380859375, 3.02691650390625, 3.2884521484375, 3.54998779296875, 3.8115234375, 4.07305908203125, 4.3345947265625, 4.59613037109375, 4.857666015625, 5.11920166015625, 5.3807373046875, 5.64227294921875, 5.90380859375, 6.16534423828125, 6.4268798828125, 6.68841552734375, 6.949951171875, 7.21148681640625, 7.4730224609375, 7.73455810546875, 7.99609375]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 8.0, 10.0, 9.0, 19.0, 29.0, 46.0, 57.0, 91.0, 126.0, 190.0, 287.0, 468.0, 740.0, 1191.0, 1911.0, 3049.0, 5046.0, 8638.0, 14334.0, 24240.0, 40788.0, 68829.0, 116634.0, 206998.0, 228548.0, 134115.0, 77555.0, 46042.0, 27513.0, 16434.0, 9789.0, 5707.0, 3466.0, 2032.0, 1288.0, 789.0, 514.0, 343.0, 235.0, 160.0, 92.0, 59.0, 39.0, 38.0, 14.0, 13.0, 10.0, 8.0, 7.0, 5.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9306640625, -0.9016876220703125, -0.872711181640625, -0.8437347412109375, -0.81475830078125, -0.7857818603515625, -0.756805419921875, -0.7278289794921875, -0.6988525390625, -0.6698760986328125, -0.640899658203125, -0.6119232177734375, -0.58294677734375, -0.5539703369140625, -0.524993896484375, -0.4960174560546875, -0.467041015625, -0.4380645751953125, -0.409088134765625, -0.3801116943359375, -0.35113525390625, -0.3221588134765625, -0.293182373046875, -0.2642059326171875, -0.2352294921875, -0.2062530517578125, -0.177276611328125, -0.1483001708984375, -0.11932373046875, -0.0903472900390625, -0.061370849609375, -0.0323944091796875, -0.00341796875, 0.0255584716796875, 0.054534912109375, 0.0835113525390625, 0.11248779296875, 0.1414642333984375, 0.170440673828125, 0.1994171142578125, 0.2283935546875, 0.2573699951171875, 0.286346435546875, 0.3153228759765625, 0.34429931640625, 0.3732757568359375, 0.402252197265625, 0.4312286376953125, 0.460205078125, 0.4891815185546875, 0.518157958984375, 0.5471343994140625, 0.57611083984375, 0.6050872802734375, 0.634063720703125, 0.6630401611328125, 0.6920166015625, 0.7209930419921875, 0.749969482421875, 0.7789459228515625, 0.80792236328125, 0.8368988037109375, 0.865875244140625, 0.8948516845703125, 0.923828125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 5.0, 1.0, 5.0, 2.0, 7.0, 4.0, 6.0, 8.0, 9.0, 8.0, 16.0, 17.0, 16.0, 28.0, 26.0, 31.0, 30.0, 39.0, 29.0, 47.0, 45.0, 45.0, 43.0, 44.0, 1084.0, 47.0, 35.0, 48.0, 42.0, 26.0, 30.0, 25.0, 19.0, 23.0, 18.0, 22.0, 17.0, 17.0, 12.0, 7.0, 10.0, 10.0, 8.0, 4.0, 4.0, 2.0, 4.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-5.19140625, -5.0404052734375, -4.889404296875, -4.7384033203125, -4.58740234375, -4.4364013671875, -4.285400390625, -4.1343994140625, -3.9833984375, -3.8323974609375, -3.681396484375, -3.5303955078125, -3.37939453125, -3.2283935546875, -3.077392578125, -2.9263916015625, -2.775390625, -2.6243896484375, -2.473388671875, -2.3223876953125, -2.17138671875, -2.0203857421875, -1.869384765625, -1.7183837890625, -1.5673828125, -1.4163818359375, -1.265380859375, -1.1143798828125, -0.96337890625, -0.8123779296875, -0.661376953125, -0.5103759765625, -0.359375, -0.2083740234375, -0.057373046875, 0.0936279296875, 0.24462890625, 0.3956298828125, 0.546630859375, 0.6976318359375, 0.8486328125, 0.9996337890625, 1.150634765625, 1.3016357421875, 1.45263671875, 1.6036376953125, 1.754638671875, 1.9056396484375, 2.056640625, 2.2076416015625, 2.358642578125, 2.5096435546875, 2.66064453125, 2.8116455078125, 2.962646484375, 3.1136474609375, 3.2646484375, 3.4156494140625, 3.566650390625, 3.7176513671875, 3.86865234375, 4.0196533203125, 4.170654296875, 4.3216552734375, 4.47265625]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 7.0, 6.0, 17.0, 13.0, 25.0, 46.0, 51.0, 59.0, 107.0, 133.0, 191.0, 297.0, 476.0, 650.0, 905.0, 1428.0, 2131.0, 3169.0, 4882.0, 7748.0, 12015.0, 19509.0, 31906.0, 52933.0, 87907.0, 146580.0, 1265216.0, 178955.0, 108564.0, 65494.0, 39128.0, 24596.0, 14981.0, 9507.0, 5997.0, 3836.0, 2473.0, 1667.0, 1075.0, 730.0, 502.0, 373.0, 233.0, 188.0, 141.0, 94.0, 57.0, 41.0, 37.0, 28.0, 11.0, 6.0, 5.0, 7.0, 1.0, 3.0], "bins": [-0.87060546875, -0.8455276489257812, -0.8204498291015625, -0.7953720092773438, -0.770294189453125, -0.7452163696289062, -0.7201385498046875, -0.6950607299804688, -0.66998291015625, -0.6449050903320312, -0.6198272705078125, -0.5947494506835938, -0.569671630859375, -0.5445938110351562, -0.5195159912109375, -0.49443817138671875, -0.4693603515625, -0.44428253173828125, -0.4192047119140625, -0.39412689208984375, -0.369049072265625, -0.34397125244140625, -0.3188934326171875, -0.29381561279296875, -0.26873779296875, -0.24365997314453125, -0.2185821533203125, -0.19350433349609375, -0.168426513671875, -0.14334869384765625, -0.1182708740234375, -0.09319305419921875, -0.068115234375, -0.04303741455078125, -0.0179595947265625, 0.00711822509765625, 0.032196044921875, 0.05727386474609375, 0.0823516845703125, 0.10742950439453125, 0.13250732421875, 0.15758514404296875, 0.1826629638671875, 0.20774078369140625, 0.232818603515625, 0.25789642333984375, 0.2829742431640625, 0.30805206298828125, 0.3331298828125, 0.35820770263671875, 0.3832855224609375, 0.40836334228515625, 0.433441162109375, 0.45851898193359375, 0.4835968017578125, 0.5086746215820312, 0.53375244140625, 0.5588302612304688, 0.5839080810546875, 0.6089859008789062, 0.634063720703125, 0.6591415405273438, 0.6842193603515625, 0.7092971801757812, 0.734375]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 0.0, 3.0, 4.0, 6.0, 8.0, 7.0, 6.0, 13.0, 13.0, 15.0, 19.0, 15.0, 36.0, 30.0, 30.0, 42.0, 45.0, 57.0, 58.0, 65.0, 71.0, 56.0, 60.0, 53.0, 32.0, 49.0, 33.0, 30.0, 19.0, 27.0, 15.0, 23.0, 10.0, 13.0, 7.0, 9.0, 8.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0032100677490234375, -0.0031102895736694336, -0.0030105113983154297, -0.0029107332229614258, -0.002810955047607422, -0.002711176872253418, -0.002611398696899414, -0.00251162052154541, -0.0024118423461914062, -0.0023120641708374023, -0.0022122859954833984, -0.0021125078201293945, -0.0020127296447753906, -0.0019129514694213867, -0.0018131732940673828, -0.001713395118713379, -0.001613616943359375, -0.001513838768005371, -0.0014140605926513672, -0.0013142824172973633, -0.0012145042419433594, -0.0011147260665893555, -0.0010149478912353516, -0.0009151697158813477, -0.0008153915405273438, -0.0007156133651733398, -0.0006158351898193359, -0.000516057014465332, -0.0004162788391113281, -0.0003165006637573242, -0.0002167224884033203, -0.0001169443130493164, -1.71661376953125e-05, 8.26120376586914e-05, 0.0001823902130126953, 0.0002821683883666992, 0.0003819465637207031, 0.00048172473907470703, 0.0005815029144287109, 0.0006812810897827148, 0.0007810592651367188, 0.0008808374404907227, 0.0009806156158447266, 0.0010803937911987305, 0.0011801719665527344, 0.0012799501419067383, 0.0013797283172607422, 0.001479506492614746, 0.00157928466796875, 0.001679062843322754, 0.0017788410186767578, 0.0018786191940307617, 0.0019783973693847656, 0.0020781755447387695, 0.0021779537200927734, 0.0022777318954467773, 0.0023775100708007812, 0.002477288246154785, 0.002577066421508789, 0.002676844596862793, 0.002776622772216797, 0.0028764009475708008, 0.0029761791229248047, 0.0030759572982788086, 0.0031757354736328125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 5.0, 8.0, 7.0, 7.0, 10.0, 16.0, 15.0, 21.0, 27.0, 33.0, 49.0, 49.0, 88.0, 135.0, 244.0, 755.0, 85618.0, 959670.0, 1047.0, 276.0, 142.0, 89.0, 61.0, 49.0, 29.0, 18.0, 20.0, 15.0, 9.0, 12.0, 8.0, 8.0, 5.0, 5.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09197998046875, -0.08911609649658203, -0.08625221252441406, -0.0833883285522461, -0.08052444458007812, -0.07766056060791016, -0.07479667663574219, -0.07193279266357422, -0.06906890869140625, -0.06620502471923828, -0.06334114074707031, -0.060477256774902344, -0.057613372802734375, -0.054749488830566406, -0.05188560485839844, -0.04902172088623047, -0.0461578369140625, -0.04329395294189453, -0.04043006896972656, -0.037566184997558594, -0.034702301025390625, -0.031838417053222656, -0.028974533081054688, -0.02611064910888672, -0.02324676513671875, -0.02038288116455078, -0.017518997192382812, -0.014655113220214844, -0.011791229248046875, -0.008927345275878906, -0.0060634613037109375, -0.0031995773315429688, -0.000335693359375, 0.0025281906127929688, 0.0053920745849609375, 0.008255958557128906, 0.011119842529296875, 0.013983726501464844, 0.016847610473632812, 0.01971149444580078, 0.02257537841796875, 0.02543926239013672, 0.028303146362304688, 0.031167030334472656, 0.034030914306640625, 0.036894798278808594, 0.03975868225097656, 0.04262256622314453, 0.0454864501953125, 0.04835033416748047, 0.05121421813964844, 0.054078102111816406, 0.056941986083984375, 0.059805870056152344, 0.06266975402832031, 0.06553363800048828, 0.06839752197265625, 0.07126140594482422, 0.07412528991699219, 0.07698917388916016, 0.07985305786132812, 0.0827169418334961, 0.08558082580566406, 0.08844470977783203, 0.09130859375]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 8.0, 47.0, 178.0, 348.0, 316.0, 95.0, 18.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018742933170869946, -0.0017148256301879883, -0.00155535782687366, -0.0013958901399746537, -0.0012364224530756474, -0.0010769546497613192, -0.0009174869628623128, -0.0007580191595479846, -0.0005985514726489782, -0.00043908372754231095, -0.00027961601153947413, -0.0001201482955366373, 3.9319449570029974e-05, 0.00019878719467669725, 0.0003582548815757036, 0.0005177226848900318, 0.0006771903717890382, 0.0008366581168957055, 0.0009961258620023727, 0.0011555935489013791, 0.0013150612358003855, 0.0014745290391147137, 0.00163399672601372, 0.0017934645293280482, 0.0019529322162270546, 0.002112400019541383, 0.0022718675900250673, 0.0024313353933393955, 0.0025908031966537237, 0.002750270999968052, 0.0029097385704517365, 0.0030692063737660646, 0.003228674177080393, 0.003388141980394721, 0.0035476095508784056, 0.0037070773541927338, 0.003866545157507062, 0.00402601296082139, 0.004185480531305075, 0.0043449485674500465, 0.004504416137933731, 0.004663883708417416, 0.0048233517445623875, 0.004982819315046072, 0.0051422868855297565, 0.005301754921674728, 0.005461222492158413, 0.0056206900626420975, 0.005780157633125782, 0.0059396252036094666, 0.006099093239754438, 0.006258560810238123, 0.0064180283807218075, 0.006577496416866779, 0.006736963987350464, 0.006896431557834148, 0.00705589959397912, 0.007215367164462805, 0.007374835200607777, 0.007534302771091461, 0.007693770341575146, 0.00785323791205883, 0.00801270641386509, 0.008172173984348774, 0.008331641554832458]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 5.0, 6.0, 7.0, 3.0, 7.0, 7.0, 8.0, 14.0, 14.0, 20.0, 22.0, 18.0, 16.0, 23.0, 21.0, 19.0, 27.0, 24.0, 21.0, 28.0, 42.0, 30.0, 47.0, 31.0, 42.0, 44.0, 14.0, 29.0, 32.0, 31.0, 44.0, 28.0, 33.0, 30.0, 30.0, 31.0, 19.0, 13.0, 12.0, 17.0, 11.0, 12.0, 14.0, 13.0, 4.0, 11.0, 7.0, 5.0, 7.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0], "bins": [-0.0016112327575683594, -0.001564408652484417, -0.0015175845474004745, -0.0014707604423165321, -0.0014239363372325897, -0.0013771122321486473, -0.001330288127064705, -0.0012834640219807625, -0.00123663991689682, -0.0011898158118128777, -0.0011429917067289352, -0.0010961676016449928, -0.0010493434965610504, -0.001002519391477108, -0.0009556952863931656, -0.0009088711813092232, -0.0008620470762252808, -0.0008152229711413383, -0.0007683988660573959, -0.0007215747609734535, -0.0006747506558895111, -0.0006279265508055687, -0.0005811024457216263, -0.0005342783406376839, -0.00048745423555374146, -0.00044063013046979904, -0.00039380602538585663, -0.0003469819203019142, -0.0003001578152179718, -0.0002533337101340294, -0.00020650960505008698, -0.00015968549996614456, -0.00011286139488220215, -6.603728979825974e-05, -1.9213184714317322e-05, 2.761092036962509e-05, 7.44350254535675e-05, 0.00012125913053750992, 0.00016808323562145233, 0.00021490734070539474, 0.00026173144578933716, 0.00030855555087327957, 0.000355379655957222, 0.0004022037610411644, 0.0004490278661251068, 0.0004958519712090492, 0.0005426760762929916, 0.000589500181376934, 0.0006363242864608765, 0.0006831483915448189, 0.0007299724966287613, 0.0007767966017127037, 0.0008236207067966461, 0.0008704448118805885, 0.0009172689169645309, 0.0009640930220484734, 0.0010109171271324158, 0.0010577412322163582, 0.0011045653373003006, 0.001151389442384243, 0.0011982135474681854, 0.0012450376525521278, 0.0012918617576360703, 0.0013386858627200127, 0.001385509967803955]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 6.0, 9.0, 8.0, 8.0, 8.0, 17.0, 22.0, 13.0, 19.0, 23.0, 29.0, 29.0, 32.0, 45.0, 35.0, 38.0, 34.0, 41.0, 45.0, 51.0, 58.0, 45.0, 51.0, 38.0, 41.0, 34.0, 35.0, 41.0, 36.0, 18.0, 14.0, 19.0, 12.0, 11.0, 12.0, 10.0, 5.0, 3.0, 6.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.7421875, -8.48065185546875, -8.2191162109375, -7.95758056640625, -7.696044921875, -7.43450927734375, -7.1729736328125, -6.91143798828125, -6.64990234375, -6.38836669921875, -6.1268310546875, -5.86529541015625, -5.603759765625, -5.34222412109375, -5.0806884765625, -4.81915283203125, -4.5576171875, -4.29608154296875, -4.0345458984375, -3.77301025390625, -3.511474609375, -3.24993896484375, -2.9884033203125, -2.72686767578125, -2.46533203125, -2.20379638671875, -1.9422607421875, -1.68072509765625, -1.419189453125, -1.15765380859375, -0.8961181640625, -0.63458251953125, -0.373046875, -0.11151123046875, 0.1500244140625, 0.41156005859375, 0.673095703125, 0.93463134765625, 1.1961669921875, 1.45770263671875, 1.71923828125, 1.98077392578125, 2.2423095703125, 2.50384521484375, 2.765380859375, 3.02691650390625, 3.2884521484375, 3.54998779296875, 3.8115234375, 4.07305908203125, 4.3345947265625, 4.59613037109375, 4.857666015625, 5.11920166015625, 5.3807373046875, 5.64227294921875, 5.90380859375, 6.16534423828125, 6.4268798828125, 6.68841552734375, 6.949951171875, 7.21148681640625, 7.4730224609375, 7.73455810546875, 7.99609375]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 8.0, 5.0, 7.0, 9.0, 17.0, 19.0, 28.0, 47.0, 61.0, 68.0, 83.0, 124.0, 163.0, 297.0, 540.0, 1250.0, 3709.0, 11459.0, 38833.0, 140019.0, 515103.0, 244494.0, 64239.0, 18534.0, 5666.0, 1854.0, 824.0, 373.0, 203.0, 144.0, 98.0, 82.0, 50.0, 35.0, 22.0, 26.0, 17.0, 12.0, 11.0, 9.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-9.4453125, -9.1650390625, -8.884765625, -8.6044921875, -8.32421875, -8.0439453125, -7.763671875, -7.4833984375, -7.203125, -6.9228515625, -6.642578125, -6.3623046875, -6.08203125, -5.8017578125, -5.521484375, -5.2412109375, -4.9609375, -4.6806640625, -4.400390625, -4.1201171875, -3.83984375, -3.5595703125, -3.279296875, -2.9990234375, -2.71875, -2.4384765625, -2.158203125, -1.8779296875, -1.59765625, -1.3173828125, -1.037109375, -0.7568359375, -0.4765625, -0.1962890625, 0.083984375, 0.3642578125, 0.64453125, 0.9248046875, 1.205078125, 1.4853515625, 1.765625, 2.0458984375, 2.326171875, 2.6064453125, 2.88671875, 3.1669921875, 3.447265625, 3.7275390625, 4.0078125, 4.2880859375, 4.568359375, 4.8486328125, 5.12890625, 5.4091796875, 5.689453125, 5.9697265625, 6.25, 6.5302734375, 6.810546875, 7.0908203125, 7.37109375, 7.6513671875, 7.931640625, 8.2119140625, 8.4921875]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 4.0, 4.0, 8.0, 4.0, 4.0, 14.0, 12.0, 9.0, 14.0, 22.0, 25.0, 22.0, 40.0, 37.0, 43.0, 47.0, 34.0, 37.0, 72.0, 119.0, 1564.0, 372.0, 99.0, 67.0, 46.0, 35.0, 43.0, 38.0, 39.0, 28.0, 19.0, 27.0, 11.0, 17.0, 10.0, 9.0, 8.0, 14.0, 12.0, 9.0, 6.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.1875, -22.412353515625, -21.63720703125, -20.862060546875, -20.0869140625, -19.311767578125, -18.53662109375, -17.761474609375, -16.986328125, -16.211181640625, -15.43603515625, -14.660888671875, -13.8857421875, -13.110595703125, -12.33544921875, -11.560302734375, -10.78515625, -10.010009765625, -9.23486328125, -8.459716796875, -7.6845703125, -6.909423828125, -6.13427734375, -5.359130859375, -4.583984375, -3.808837890625, -3.03369140625, -2.258544921875, -1.4833984375, -0.708251953125, 0.06689453125, 0.842041015625, 1.6171875, 2.392333984375, 3.16748046875, 3.942626953125, 4.7177734375, 5.492919921875, 6.26806640625, 7.043212890625, 7.818359375, 8.593505859375, 9.36865234375, 10.143798828125, 10.9189453125, 11.694091796875, 12.46923828125, 13.244384765625, 14.01953125, 14.794677734375, 15.56982421875, 16.344970703125, 17.1201171875, 17.895263671875, 18.67041015625, 19.445556640625, 20.220703125, 20.995849609375, 21.77099609375, 22.546142578125, 23.3212890625, 24.096435546875, 24.87158203125, 25.646728515625, 26.421875]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 11.0, 6.0, 8.0, 11.0, 14.0, 24.0, 22.0, 38.0, 38.0, 41.0, 51.0, 97.0, 135.0, 196.0, 350.0, 664.0, 2000.0, 154629.0, 2981288.0, 3904.0, 909.0, 444.0, 238.0, 159.0, 119.0, 80.0, 49.0, 43.0, 35.0, 21.0, 17.0, 12.0, 12.0, 8.0, 5.0, 7.0, 6.0, 3.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-79.1875, -76.935546875, -74.68359375, -72.431640625, -70.1796875, -67.927734375, -65.67578125, -63.423828125, -61.171875, -58.919921875, -56.66796875, -54.416015625, -52.1640625, -49.912109375, -47.66015625, -45.408203125, -43.15625, -40.904296875, -38.65234375, -36.400390625, -34.1484375, -31.896484375, -29.64453125, -27.392578125, -25.140625, -22.888671875, -20.63671875, -18.384765625, -16.1328125, -13.880859375, -11.62890625, -9.376953125, -7.125, -4.873046875, -2.62109375, -0.369140625, 1.8828125, 4.134765625, 6.38671875, 8.638671875, 10.890625, 13.142578125, 15.39453125, 17.646484375, 19.8984375, 22.150390625, 24.40234375, 26.654296875, 28.90625, 31.158203125, 33.41015625, 35.662109375, 37.9140625, 40.166015625, 42.41796875, 44.669921875, 46.921875, 49.173828125, 51.42578125, 53.677734375, 55.9296875, 58.181640625, 60.43359375, 62.685546875, 64.9375]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 8.0, 40.0, 239.0, 435.0, 238.0, 50.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.77983856201172, -39.25804901123047, -36.73625946044922, -34.21446990966797, -31.692678451538086, -29.170888900756836, -26.649097442626953, -24.127307891845703, -21.605518341064453, -19.083728790283203, -16.561939239501953, -14.04014778137207, -11.51835823059082, -8.99656867980957, -6.474778175354004, -3.9529876708984375, -1.4311981201171875, 1.0905919075012207, 3.612381935119629, 6.134171962738037, 8.655961990356445, 11.177751541137695, 13.699542045593262, 16.221332550048828, 18.743122100830078, 21.264911651611328, 23.786701202392578, 26.30849266052246, 28.83028221130371, 31.35207176208496, 33.873863220214844, 36.395652770996094, 38.91743469238281, 41.43922424316406, 43.96101379394531, 46.48280334472656, 49.00459289550781, 51.52638244628906, 54.04817581176758, 56.56996536254883, 59.09175491333008, 61.61354446411133, 64.13533782958984, 66.6571273803711, 69.17891693115234, 71.7007064819336, 74.22249603271484, 76.7442855834961, 79.26607513427734, 81.7878646850586, 84.30965423583984, 86.8314437866211, 89.35323333740234, 91.8750228881836, 94.39681243896484, 96.91860961914062, 99.44039916992188, 101.96218872070312, 104.48397827148438, 107.00576782226562, 109.52755737304688, 112.04934692382812, 114.57113647460938, 117.09292602539062, 119.61471557617188]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 7.0, 3.0, 3.0, 5.0, 6.0, 13.0, 11.0, 11.0, 18.0, 14.0, 14.0, 16.0, 21.0, 29.0, 23.0, 24.0, 22.0, 28.0, 33.0, 31.0, 24.0, 45.0, 44.0, 49.0, 38.0, 43.0, 28.0, 46.0, 33.0, 36.0, 32.0, 33.0, 35.0, 20.0, 26.0, 20.0, 20.0, 16.0, 16.0, 13.0, 14.0, 7.0, 8.0, 6.0, 6.0, 4.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-55.95088195800781, -54.147010803222656, -52.343143463134766, -50.53927230834961, -48.73540115356445, -46.93153381347656, -45.127662658691406, -43.32379150390625, -41.519920349121094, -39.71604919433594, -37.91218185424805, -36.10831069946289, -34.304439544677734, -32.500572204589844, -30.696701049804688, -28.89282989501953, -27.08896255493164, -25.285093307495117, -23.48122215270996, -21.677352905273438, -19.87348175048828, -18.069612503051758, -16.265743255615234, -14.461873054504395, -12.658002853393555, -10.854132652282715, -9.050262451171875, -7.246393203735352, -5.442523002624512, -3.638652801513672, -1.8347835540771484, -0.030913352966308594, 1.7729568481445312, 3.576826810836792, 5.380696773529053, 7.184566497802734, 8.988436698913574, 10.792306900024414, 12.596176147460938, 14.400046348571777, 16.203916549682617, 18.00778579711914, 19.811656951904297, 21.61552619934082, 23.419395446777344, 25.2232666015625, 27.027135848999023, 28.831005096435547, 30.634876251220703, 32.43874740600586, 34.24261474609375, 36.046485900878906, 37.85035705566406, 39.65422821044922, 41.45809555053711, 43.261966705322266, 45.065834045410156, 46.86970520019531, 48.6735725402832, 50.47744369506836, 52.281314849853516, 54.085182189941406, 55.88905334472656, 57.69292449951172, 59.496795654296875]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 7.0, 9.0, 3.0, 14.0, 14.0, 15.0, 23.0, 20.0, 16.0, 34.0, 25.0, 26.0, 41.0, 49.0, 34.0, 43.0, 45.0, 51.0, 49.0, 55.0, 43.0, 53.0, 58.0, 38.0, 40.0, 35.0, 27.0, 38.0, 14.0, 15.0, 19.0, 9.0, 12.0, 7.0, 6.0, 5.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.0546875, -9.7615966796875, -9.468505859375, -9.1754150390625, -8.88232421875, -8.5892333984375, -8.296142578125, -8.0030517578125, -7.7099609375, -7.4168701171875, -7.123779296875, -6.8306884765625, -6.53759765625, -6.2445068359375, -5.951416015625, -5.6583251953125, -5.365234375, -5.0721435546875, -4.779052734375, -4.4859619140625, -4.19287109375, -3.8997802734375, -3.606689453125, -3.3135986328125, -3.0205078125, -2.7274169921875, -2.434326171875, -2.1412353515625, -1.84814453125, -1.5550537109375, -1.261962890625, -0.9688720703125, -0.67578125, -0.3826904296875, -0.089599609375, 0.2034912109375, 0.49658203125, 0.7896728515625, 1.082763671875, 1.3758544921875, 1.6689453125, 1.9620361328125, 2.255126953125, 2.5482177734375, 2.84130859375, 3.1343994140625, 3.427490234375, 3.7205810546875, 4.013671875, 4.3067626953125, 4.599853515625, 4.8929443359375, 5.18603515625, 5.4791259765625, 5.772216796875, 6.0653076171875, 6.3583984375, 6.6514892578125, 6.944580078125, 7.2376708984375, 7.53076171875, 7.8238525390625, 8.116943359375, 8.4100341796875, 8.703125]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 3.0, 0.0, 5.0, 6.0, 3.0, 9.0, 16.0, 12.0, 17.0, 17.0, 24.0, 25.0, 37.0, 46.0, 62.0, 105.0, 140.0, 246.0, 529.0, 1886.0, 28342.0, 2317875.0, 1820746.0, 21321.0, 1599.0, 480.0, 239.0, 139.0, 87.0, 62.0, 48.0, 34.0, 29.0, 24.0, 18.0, 11.0, 5.0, 11.0, 7.0, 10.0, 3.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-34.5, -33.51318359375, -32.5263671875, -31.53955078125, -30.552734375, -29.56591796875, -28.5791015625, -27.59228515625, -26.60546875, -25.61865234375, -24.6318359375, -23.64501953125, -22.658203125, -21.67138671875, -20.6845703125, -19.69775390625, -18.7109375, -17.72412109375, -16.7373046875, -15.75048828125, -14.763671875, -13.77685546875, -12.7900390625, -11.80322265625, -10.81640625, -9.82958984375, -8.8427734375, -7.85595703125, -6.869140625, -5.88232421875, -4.8955078125, -3.90869140625, -2.921875, -1.93505859375, -0.9482421875, 0.03857421875, 1.025390625, 2.01220703125, 2.9990234375, 3.98583984375, 4.97265625, 5.95947265625, 6.9462890625, 7.93310546875, 8.919921875, 9.90673828125, 10.8935546875, 11.88037109375, 12.8671875, 13.85400390625, 14.8408203125, 15.82763671875, 16.814453125, 17.80126953125, 18.7880859375, 19.77490234375, 20.76171875, 21.74853515625, 22.7353515625, 23.72216796875, 24.708984375, 25.69580078125, 26.6826171875, 27.66943359375, 28.65625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 5.0, 10.0, 4.0, 16.0, 14.0, 25.0, 49.0, 56.0, 95.0, 117.0, 150.0, 236.0, 357.0, 481.0, 531.0, 512.0, 432.0, 279.0, 192.0, 173.0, 96.0, 64.0, 52.0, 48.0, 24.0, 17.0, 12.0, 10.0, 8.0, 5.0, 4.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.890625, -12.34912109375, -11.8076171875, -11.26611328125, -10.724609375, -10.18310546875, -9.6416015625, -9.10009765625, -8.55859375, -8.01708984375, -7.4755859375, -6.93408203125, -6.392578125, -5.85107421875, -5.3095703125, -4.76806640625, -4.2265625, -3.68505859375, -3.1435546875, -2.60205078125, -2.060546875, -1.51904296875, -0.9775390625, -0.43603515625, 0.10546875, 0.64697265625, 1.1884765625, 1.72998046875, 2.271484375, 2.81298828125, 3.3544921875, 3.89599609375, 4.4375, 4.97900390625, 5.5205078125, 6.06201171875, 6.603515625, 7.14501953125, 7.6865234375, 8.22802734375, 8.76953125, 9.31103515625, 9.8525390625, 10.39404296875, 10.935546875, 11.47705078125, 12.0185546875, 12.56005859375, 13.1015625, 13.64306640625, 14.1845703125, 14.72607421875, 15.267578125, 15.80908203125, 16.3505859375, 16.89208984375, 17.43359375, 17.97509765625, 18.5166015625, 19.05810546875, 19.599609375, 20.14111328125, 20.6826171875, 21.22412109375, 21.765625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 5.0, 15.0, 15.0, 17.0, 18.0, 28.0, 34.0, 51.0, 92.0, 109.0, 139.0, 177.0, 269.0, 266.0, 600.0, 3489.0, 4005076.0, 181184.0, 1107.0, 446.0, 321.0, 227.0, 170.0, 120.0, 82.0, 70.0, 54.0, 32.0, 25.0, 15.0, 11.0, 6.0, 9.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-112.25, -109.1982421875, -106.146484375, -103.0947265625, -100.04296875, -96.9912109375, -93.939453125, -90.8876953125, -87.8359375, -84.7841796875, -81.732421875, -78.6806640625, -75.62890625, -72.5771484375, -69.525390625, -66.4736328125, -63.421875, -60.3701171875, -57.318359375, -54.2666015625, -51.21484375, -48.1630859375, -45.111328125, -42.0595703125, -39.0078125, -35.9560546875, -32.904296875, -29.8525390625, -26.80078125, -23.7490234375, -20.697265625, -17.6455078125, -14.59375, -11.5419921875, -8.490234375, -5.4384765625, -2.38671875, 0.6650390625, 3.716796875, 6.7685546875, 9.8203125, 12.8720703125, 15.923828125, 18.9755859375, 22.02734375, 25.0791015625, 28.130859375, 31.1826171875, 34.234375, 37.2861328125, 40.337890625, 43.3896484375, 46.44140625, 49.4931640625, 52.544921875, 55.5966796875, 58.6484375, 61.7001953125, 64.751953125, 67.8037109375, 70.85546875, 73.9072265625, 76.958984375, 80.0107421875, 83.0625]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 15.0, 26.0, 63.0, 122.0, 175.0, 197.0, 182.0, 120.0, 64.0, 23.0, 14.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-62.806365966796875, -60.00883483886719, -57.211299896240234, -54.41376876831055, -51.616233825683594, -48.818702697753906, -46.02117156982422, -43.223636627197266, -40.42610168457031, -37.628570556640625, -34.83103561401367, -32.033504486083984, -29.23596954345703, -26.438438415527344, -23.640905380249023, -20.843372344970703, -18.045841217041016, -15.248308181762695, -12.450775146484375, -9.653243064880371, -6.855710029602051, -4.0581769943237305, -1.2606449127197266, 1.5368881225585938, 4.334421157836914, 7.131954193115234, 9.929487228393555, 12.727019309997559, 15.524552345275879, 18.322086334228516, 21.119617462158203, 23.917150497436523, 26.714683532714844, 29.512216567993164, 32.309749603271484, 35.10728073120117, 37.904815673828125, 40.70234680175781, 43.4998779296875, 46.29741287231445, 49.094947814941406, 51.892478942871094, 54.69001388549805, 57.487545013427734, 60.28507995605469, 63.082611083984375, 65.88014221191406, 68.67767333984375, 71.47520446777344, 74.27273559570312, 77.07026672363281, 79.86780548095703, 82.66533660888672, 85.4628677368164, 88.2603988647461, 91.05793762207031, 93.85546875, 96.65299987792969, 99.45053100585938, 102.2480697631836, 105.04560089111328, 107.84313201904297, 110.64066314697266, 113.43820190429688, 116.23573303222656]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 7.0, 4.0, 5.0, 6.0, 7.0, 6.0, 9.0, 11.0, 23.0, 23.0, 20.0, 24.0, 25.0, 33.0, 34.0, 43.0, 28.0, 42.0, 49.0, 36.0, 38.0, 40.0, 42.0, 40.0, 45.0, 41.0, 50.0, 38.0, 35.0, 23.0, 30.0, 19.0, 21.0, 20.0, 12.0, 16.0, 13.0, 7.0, 10.0, 8.0, 6.0, 7.0, 6.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.248687744140625, -47.606300354003906, -45.96391677856445, -44.321529388427734, -42.67914581298828, -41.03675842285156, -39.394371032714844, -37.751983642578125, -36.10960006713867, -34.46721267700195, -32.8248291015625, -31.18244171142578, -29.540056228637695, -27.89767074584961, -26.25528335571289, -24.612897872924805, -22.97051239013672, -21.328126907348633, -19.685741424560547, -18.043354034423828, -16.400968551635742, -14.758583068847656, -13.116196632385254, -11.473810195922852, -9.831424713134766, -8.18903923034668, -6.546652793884277, -4.904266834259033, -3.261880874633789, -1.6194953918457031, 0.02289104461669922, 1.6652774810791016, 3.3076629638671875, 4.950048923492432, 6.592434883117676, 8.234821319580078, 9.877206802368164, 11.51959228515625, 13.161978721618652, 14.804365158081055, 16.44675064086914, 18.089136123657227, 19.731521606445312, 21.37390899658203, 23.016294479370117, 24.658679962158203, 26.301067352294922, 27.943452835083008, 29.585838317871094, 31.22822380065918, 32.870609283447266, 34.512996673583984, 36.15538024902344, 37.797767639160156, 39.440155029296875, 41.082542419433594, 42.72492599487305, 44.367313385009766, 46.00969696044922, 47.65208435058594, 49.294471740722656, 50.93685531616211, 52.57924270629883, 54.22162628173828, 55.864013671875]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 4.0, 1.0, 5.0, 6.0, 8.0, 8.0, 20.0, 12.0, 12.0, 18.0, 15.0, 21.0, 22.0, 33.0, 32.0, 30.0, 33.0, 37.0, 36.0, 41.0, 37.0, 50.0, 59.0, 30.0, 52.0, 39.0, 43.0, 44.0, 34.0, 30.0, 30.0, 22.0, 20.0, 27.0, 16.0, 19.0, 9.0, 13.0, 5.0, 10.0, 8.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.5078125, -8.2423095703125, -7.976806640625, -7.7113037109375, -7.44580078125, -7.1802978515625, -6.914794921875, -6.6492919921875, -6.3837890625, -6.1182861328125, -5.852783203125, -5.5872802734375, -5.32177734375, -5.0562744140625, -4.790771484375, -4.5252685546875, -4.259765625, -3.9942626953125, -3.728759765625, -3.4632568359375, -3.19775390625, -2.9322509765625, -2.666748046875, -2.4012451171875, -2.1357421875, -1.8702392578125, -1.604736328125, -1.3392333984375, -1.07373046875, -0.8082275390625, -0.542724609375, -0.2772216796875, -0.01171875, 0.2537841796875, 0.519287109375, 0.7847900390625, 1.05029296875, 1.3157958984375, 1.581298828125, 1.8468017578125, 2.1123046875, 2.3778076171875, 2.643310546875, 2.9088134765625, 3.17431640625, 3.4398193359375, 3.705322265625, 3.9708251953125, 4.236328125, 4.5018310546875, 4.767333984375, 5.0328369140625, 5.29833984375, 5.5638427734375, 5.829345703125, 6.0948486328125, 6.3603515625, 6.6258544921875, 6.891357421875, 7.1568603515625, 7.42236328125, 7.6878662109375, 7.953369140625, 8.2188720703125, 8.484375]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 4.0, 11.0, 28.0, 28.0, 37.0, 57.0, 66.0, 95.0, 158.0, 234.0, 340.0, 512.0, 789.0, 1141.0, 1769.0, 2646.0, 4000.0, 6147.0, 9636.0, 15359.0, 23988.0, 38303.0, 61965.0, 100592.0, 165365.0, 218097.0, 151569.0, 92346.0, 56214.0, 35321.0, 21931.0, 13999.0, 8868.0, 5710.0, 3894.0, 2437.0, 1605.0, 1051.0, 763.0, 459.0, 317.0, 224.0, 149.0, 109.0, 83.0, 42.0, 42.0, 21.0, 11.0, 13.0, 9.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.8896484375, -0.8621978759765625, -0.834747314453125, -0.8072967529296875, -0.77984619140625, -0.7523956298828125, -0.724945068359375, -0.6974945068359375, -0.6700439453125, -0.6425933837890625, -0.615142822265625, -0.5876922607421875, -0.56024169921875, -0.5327911376953125, -0.505340576171875, -0.4778900146484375, -0.450439453125, -0.4229888916015625, -0.395538330078125, -0.3680877685546875, -0.34063720703125, -0.3131866455078125, -0.285736083984375, -0.2582855224609375, -0.2308349609375, -0.2033843994140625, -0.175933837890625, -0.1484832763671875, -0.12103271484375, -0.0935821533203125, -0.066131591796875, -0.0386810302734375, -0.01123046875, 0.0162200927734375, 0.043670654296875, 0.0711212158203125, 0.09857177734375, 0.1260223388671875, 0.153472900390625, 0.1809234619140625, 0.2083740234375, 0.2358245849609375, 0.263275146484375, 0.2907257080078125, 0.31817626953125, 0.3456268310546875, 0.373077392578125, 0.4005279541015625, 0.427978515625, 0.4554290771484375, 0.482879638671875, 0.5103302001953125, 0.53778076171875, 0.5652313232421875, 0.592681884765625, 0.6201324462890625, 0.6475830078125, 0.6750335693359375, 0.702484130859375, 0.7299346923828125, 0.75738525390625, 0.7848358154296875, 0.812286376953125, 0.8397369384765625, 0.8671875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 2.0, 7.0, 8.0, 9.0, 7.0, 7.0, 13.0, 24.0, 16.0, 23.0, 26.0, 23.0, 22.0, 35.0, 40.0, 47.0, 42.0, 51.0, 57.0, 39.0, 1066.0, 40.0, 45.0, 43.0, 37.0, 48.0, 36.0, 33.0, 27.0, 30.0, 20.0, 22.0, 28.0, 12.0, 11.0, 11.0, 4.0, 11.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.94921875, -5.770751953125, -5.59228515625, -5.413818359375, -5.2353515625, -5.056884765625, -4.87841796875, -4.699951171875, -4.521484375, -4.343017578125, -4.16455078125, -3.986083984375, -3.8076171875, -3.629150390625, -3.45068359375, -3.272216796875, -3.09375, -2.915283203125, -2.73681640625, -2.558349609375, -2.3798828125, -2.201416015625, -2.02294921875, -1.844482421875, -1.666015625, -1.487548828125, -1.30908203125, -1.130615234375, -0.9521484375, -0.773681640625, -0.59521484375, -0.416748046875, -0.23828125, -0.059814453125, 0.11865234375, 0.297119140625, 0.4755859375, 0.654052734375, 0.83251953125, 1.010986328125, 1.189453125, 1.367919921875, 1.54638671875, 1.724853515625, 1.9033203125, 2.081787109375, 2.26025390625, 2.438720703125, 2.6171875, 2.795654296875, 2.97412109375, 3.152587890625, 3.3310546875, 3.509521484375, 3.68798828125, 3.866455078125, 4.044921875, 4.223388671875, 4.40185546875, 4.580322265625, 4.7587890625, 4.937255859375, 5.11572265625, 5.294189453125, 5.47265625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 7.0, 7.0, 14.0, 18.0, 25.0, 39.0, 71.0, 79.0, 112.0, 163.0, 293.0, 421.0, 651.0, 986.0, 1643.0, 2577.0, 4258.0, 6766.0, 11221.0, 18018.0, 30363.0, 49916.0, 83925.0, 145113.0, 1275853.0, 188877.0, 110976.0, 65356.0, 38950.0, 23366.0, 14135.0, 8607.0, 5316.0, 3221.0, 2070.0, 1312.0, 825.0, 550.0, 348.0, 253.0, 144.0, 98.0, 74.0, 42.0, 29.0, 18.0, 11.0, 9.0, 3.0, 5.0, 2.0, 4.0, 2.0, 3.0], "bins": [-0.9892578125, -0.9607925415039062, -0.9323272705078125, -0.9038619995117188, -0.875396728515625, -0.8469314575195312, -0.8184661865234375, -0.7900009155273438, -0.76153564453125, -0.7330703735351562, -0.7046051025390625, -0.6761398315429688, -0.647674560546875, -0.6192092895507812, -0.5907440185546875, -0.5622787475585938, -0.5338134765625, -0.5053482055664062, -0.4768829345703125, -0.44841766357421875, -0.419952392578125, -0.39148712158203125, -0.3630218505859375, -0.33455657958984375, -0.30609130859375, -0.27762603759765625, -0.2491607666015625, -0.22069549560546875, -0.192230224609375, -0.16376495361328125, -0.1352996826171875, -0.10683441162109375, -0.078369140625, -0.04990386962890625, -0.0214385986328125, 0.00702667236328125, 0.035491943359375, 0.06395721435546875, 0.0924224853515625, 0.12088775634765625, 0.14935302734375, 0.17781829833984375, 0.2062835693359375, 0.23474884033203125, 0.263214111328125, 0.29167938232421875, 0.3201446533203125, 0.34860992431640625, 0.3770751953125, 0.40554046630859375, 0.4340057373046875, 0.46247100830078125, 0.490936279296875, 0.5194015502929688, 0.5478668212890625, 0.5763320922851562, 0.60479736328125, 0.6332626342773438, 0.6617279052734375, 0.6901931762695312, 0.718658447265625, 0.7471237182617188, 0.7755889892578125, 0.8040542602539062, 0.83251953125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 11.0, 2.0, 10.0, 10.0, 5.0, 14.0, 17.0, 26.0, 23.0, 26.0, 33.0, 54.0, 68.0, 60.0, 64.0, 74.0, 82.0, 75.0, 64.0, 60.0, 47.0, 40.0, 22.0, 27.0, 18.0, 13.0, 13.0, 15.0, 7.0, 6.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0031585693359375, -0.00305098295211792, -0.00294339656829834, -0.0028358101844787598, -0.0027282238006591797, -0.0026206374168395996, -0.0025130510330200195, -0.0024054646492004395, -0.0022978782653808594, -0.0021902918815612793, -0.0020827054977416992, -0.001975119113922119, -0.001867532730102539, -0.001759946346282959, -0.001652359962463379, -0.0015447735786437988, -0.0014371871948242188, -0.0013296008110046387, -0.0012220144271850586, -0.0011144280433654785, -0.0010068416595458984, -0.0008992552757263184, -0.0007916688919067383, -0.0006840825080871582, -0.0005764961242675781, -0.00046890974044799805, -0.00036132335662841797, -0.0002537369728088379, -0.0001461505889892578, -3.8564205169677734e-05, 6.902217864990234e-05, 0.00017660856246948242, 0.0002841949462890625, 0.0003917813301086426, 0.0004993677139282227, 0.0006069540977478027, 0.0007145404815673828, 0.0008221268653869629, 0.000929713249206543, 0.001037299633026123, 0.0011448860168457031, 0.0012524724006652832, 0.0013600587844848633, 0.0014676451683044434, 0.0015752315521240234, 0.0016828179359436035, 0.0017904043197631836, 0.0018979907035827637, 0.0020055770874023438, 0.002113163471221924, 0.002220749855041504, 0.002328336238861084, 0.002435922622680664, 0.002543509006500244, 0.0026510953903198242, 0.0027586817741394043, 0.0028662681579589844, 0.0029738545417785645, 0.0030814409255981445, 0.0031890273094177246, 0.0032966136932373047, 0.0034042000770568848, 0.003511786460876465, 0.003619372844696045, 0.003726959228515625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 3.0, 8.0, 10.0, 12.0, 10.0, 17.0, 19.0, 27.0, 36.0, 69.0, 104.0, 123.0, 229.0, 633.0, 4940.0, 1038171.0, 2767.0, 583.0, 261.0, 157.0, 93.0, 63.0, 43.0, 40.0, 37.0, 19.0, 15.0, 18.0, 14.0, 10.0, 4.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.08892822265625, -0.08641910552978516, -0.08390998840332031, -0.08140087127685547, -0.07889175415039062, -0.07638263702392578, -0.07387351989746094, -0.0713644027709961, -0.06885528564453125, -0.0663461685180664, -0.06383705139160156, -0.06132793426513672, -0.058818817138671875, -0.05630970001220703, -0.05380058288574219, -0.051291465759277344, -0.0487823486328125, -0.046273231506347656, -0.04376411437988281, -0.04125499725341797, -0.038745880126953125, -0.03623676300048828, -0.03372764587402344, -0.031218528747558594, -0.02870941162109375, -0.026200294494628906, -0.023691177368164062, -0.02118206024169922, -0.018672943115234375, -0.01616382598876953, -0.013654708862304688, -0.011145591735839844, -0.008636474609375, -0.006127357482910156, -0.0036182403564453125, -0.0011091232299804688, 0.001399993896484375, 0.003909111022949219, 0.0064182281494140625, 0.008927345275878906, 0.01143646240234375, 0.013945579528808594, 0.016454696655273438, 0.01896381378173828, 0.021472930908203125, 0.02398204803466797, 0.026491165161132812, 0.029000282287597656, 0.0315093994140625, 0.034018516540527344, 0.03652763366699219, 0.03903675079345703, 0.041545867919921875, 0.04405498504638672, 0.04656410217285156, 0.049073219299316406, 0.05158233642578125, 0.054091453552246094, 0.05660057067871094, 0.05910968780517578, 0.061618804931640625, 0.06412792205810547, 0.06663703918457031, 0.06914615631103516, 0.0716552734375]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 10.0, 27.0, 93.0, 183.0, 233.0, 240.0, 140.0, 65.0, 9.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003044694662094116, -0.0029390710406005383, -0.0028334471862763166, -0.0027278235647827387, -0.0026221999432891607, -0.002516576088964939, -0.002410952467471361, -0.002305328845977783, -0.0021997052244842052, -0.0020940816029906273, -0.0019884577486664057, -0.0018828341271728277, -0.0017772105056792498, -0.00167158676777035, -0.0015659630298614502, -0.0014603394083678722, -0.0013547156704589725, -0.0012490919325500727, -0.0011434683110564947, -0.001037844573147595, -0.000932220951654017, -0.0008265972137451172, -0.0007209735340438783, -0.0006153498543426394, -0.0005097261746414006, -0.0004041024949401617, -0.00029847881523892283, -0.0001928551064338535, -8.723142673261464e-05, 1.839228207245469e-05, 0.00012401596177369356, 0.00022963964147493243, 0.0003352633211761713, 0.0004408870008774102, 0.000546510680578649, 0.0006521344184875488, 0.0007577580399811268, 0.0008633817778900266, 0.0009690054575912654, 0.0010746291372925043, 0.0011802527587860823, 0.001285876496694982, 0.00139150011818856, 0.0014971238560974598, 0.0016027474775910378, 0.0017083712154999375, 0.0018139949534088373, 0.0019196185749024153, 0.002025242429226637, 0.002130866050720215, 0.0022364899050444365, 0.0023421135265380144, 0.0024477371480315924, 0.002553361002355814, 0.002658984623849392, 0.00276460824534297, 0.002870231866836548, 0.002975855488330126, 0.0030814793426543474, 0.0031871029641479254, 0.0032927265856415033, 0.003398350439965725, 0.003503974061459303, 0.003609597682952881, 0.003715221304446459]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 6.0, 5.0, 6.0, 12.0, 15.0, 7.0, 15.0, 24.0, 17.0, 25.0, 23.0, 28.0, 41.0, 44.0, 36.0, 34.0, 51.0, 42.0, 47.0, 46.0, 46.0, 31.0, 42.0, 47.0, 27.0, 29.0, 40.0, 36.0, 24.0, 27.0, 27.0, 22.0, 13.0, 14.0, 11.0, 9.0, 10.0, 10.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015001296997070312, -0.0014485390856862068, -0.0013969484716653824, -0.001345357857644558, -0.0012937672436237335, -0.001242176629602909, -0.0011905860155820847, -0.0011389954015612602, -0.0010874047875404358, -0.0010358141735196114, -0.000984223559498787, -0.0009326329454779625, -0.0008810423314571381, -0.0008294517174363136, -0.0007778611034154892, -0.0007262704893946648, -0.0006746798753738403, -0.0006230892613530159, -0.0005714986473321915, -0.000519908033311367, -0.0004683174192905426, -0.00041672680526971817, -0.00036513619124889374, -0.0003135455772280693, -0.0002619549632072449, -0.00021036434918642044, -0.000158773735165596, -0.00010718312114477158, -5.5592507123947144e-05, -4.001893103122711e-06, 4.758872091770172e-05, 9.917933493852615e-05, 0.00015076994895935059, 0.00020236056298017502, 0.00025395117700099945, 0.0003055417910218239, 0.0003571324050426483, 0.00040872301906347275, 0.0004603136330842972, 0.0005119042471051216, 0.000563494861125946, 0.0006150854751467705, 0.0006666760891675949, 0.0007182667031884193, 0.0007698573172092438, 0.0008214479312300682, 0.0008730385452508926, 0.0009246291592717171, 0.0009762197732925415, 0.001027810387313366, 0.0010794010013341904, 0.0011309916153550148, 0.0011825822293758392, 0.0012341728433966637, 0.001285763457417488, 0.0013373540714383125, 0.001388944685459137, 0.0014405352994799614, 0.0014921259135007858, 0.0015437165275216103, 0.0015953071415424347, 0.0016468977555632591, 0.0016984883695840836, 0.001750078983604908, 0.0018016695976257324]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 4.0, 1.0, 5.0, 6.0, 8.0, 8.0, 20.0, 12.0, 12.0, 18.0, 15.0, 21.0, 22.0, 33.0, 32.0, 30.0, 33.0, 37.0, 36.0, 41.0, 37.0, 50.0, 59.0, 30.0, 52.0, 40.0, 42.0, 44.0, 34.0, 30.0, 30.0, 22.0, 20.0, 27.0, 16.0, 19.0, 9.0, 13.0, 5.0, 10.0, 8.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.5078125, -8.2423095703125, -7.976806640625, -7.7113037109375, -7.44580078125, -7.1802978515625, -6.914794921875, -6.6492919921875, -6.3837890625, -6.1182861328125, -5.852783203125, -5.5872802734375, -5.32177734375, -5.0562744140625, -4.790771484375, -4.5252685546875, -4.259765625, -3.9942626953125, -3.728759765625, -3.4632568359375, -3.19775390625, -2.9322509765625, -2.666748046875, -2.4012451171875, -2.1357421875, -1.8702392578125, -1.604736328125, -1.3392333984375, -1.07373046875, -0.8082275390625, -0.542724609375, -0.2772216796875, -0.01171875, 0.2537841796875, 0.519287109375, 0.7847900390625, 1.05029296875, 1.3157958984375, 1.581298828125, 1.8468017578125, 2.1123046875, 2.3778076171875, 2.643310546875, 2.9088134765625, 3.17431640625, 3.4398193359375, 3.705322265625, 3.9708251953125, 4.236328125, 4.5018310546875, 4.767333984375, 5.0328369140625, 5.29833984375, 5.5638427734375, 5.829345703125, 6.0948486328125, 6.3603515625, 6.6258544921875, 6.891357421875, 7.1568603515625, 7.42236328125, 7.6878662109375, 7.953369140625, 8.2188720703125, 8.484375]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 5.0, 5.0, 5.0, 10.0, 9.0, 14.0, 29.0, 20.0, 20.0, 34.0, 50.0, 63.0, 74.0, 112.0, 169.0, 202.0, 384.0, 697.0, 1714.0, 6652.0, 41239.0, 572528.0, 384062.0, 31655.0, 5501.0, 1500.0, 606.0, 374.0, 207.0, 161.0, 122.0, 84.0, 53.0, 54.0, 32.0, 27.0, 23.0, 12.0, 9.0, 13.0, 9.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.71875, -15.2265625, -14.734375, -14.2421875, -13.75, -13.2578125, -12.765625, -12.2734375, -11.78125, -11.2890625, -10.796875, -10.3046875, -9.8125, -9.3203125, -8.828125, -8.3359375, -7.84375, -7.3515625, -6.859375, -6.3671875, -5.875, -5.3828125, -4.890625, -4.3984375, -3.90625, -3.4140625, -2.921875, -2.4296875, -1.9375, -1.4453125, -0.953125, -0.4609375, 0.03125, 0.5234375, 1.015625, 1.5078125, 2.0, 2.4921875, 2.984375, 3.4765625, 3.96875, 4.4609375, 4.953125, 5.4453125, 5.9375, 6.4296875, 6.921875, 7.4140625, 7.90625, 8.3984375, 8.890625, 9.3828125, 9.875, 10.3671875, 10.859375, 11.3515625, 11.84375, 12.3359375, 12.828125, 13.3203125, 13.8125, 14.3046875, 14.796875, 15.2890625, 15.78125]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 8.0, 1.0, 5.0, 3.0, 7.0, 8.0, 12.0, 9.0, 9.0, 8.0, 16.0, 21.0, 25.0, 16.0, 33.0, 32.0, 22.0, 33.0, 42.0, 44.0, 60.0, 145.0, 1560.0, 394.0, 105.0, 59.0, 41.0, 45.0, 42.0, 23.0, 25.0, 37.0, 24.0, 34.0, 18.0, 11.0, 14.0, 11.0, 9.0, 9.0, 10.0, 5.0, 8.0, 5.0, 2.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.390625, -24.513427734375, -23.63623046875, -22.759033203125, -21.8818359375, -21.004638671875, -20.12744140625, -19.250244140625, -18.373046875, -17.495849609375, -16.61865234375, -15.741455078125, -14.8642578125, -13.987060546875, -13.10986328125, -12.232666015625, -11.35546875, -10.478271484375, -9.60107421875, -8.723876953125, -7.8466796875, -6.969482421875, -6.09228515625, -5.215087890625, -4.337890625, -3.460693359375, -2.58349609375, -1.706298828125, -0.8291015625, 0.048095703125, 0.92529296875, 1.802490234375, 2.6796875, 3.556884765625, 4.43408203125, 5.311279296875, 6.1884765625, 7.065673828125, 7.94287109375, 8.820068359375, 9.697265625, 10.574462890625, 11.45166015625, 12.328857421875, 13.2060546875, 14.083251953125, 14.96044921875, 15.837646484375, 16.71484375, 17.592041015625, 18.46923828125, 19.346435546875, 20.2236328125, 21.100830078125, 21.97802734375, 22.855224609375, 23.732421875, 24.609619140625, 25.48681640625, 26.364013671875, 27.2412109375, 28.118408203125, 28.99560546875, 29.872802734375, 30.75]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 2.0, 3.0, 9.0, 8.0, 4.0, 8.0, 11.0, 10.0, 18.0, 15.0, 14.0, 32.0, 32.0, 49.0, 29.0, 43.0, 83.0, 112.0, 192.0, 310.0, 762.0, 7339.0, 3123340.0, 11504.0, 780.0, 356.0, 173.0, 113.0, 63.0, 46.0, 45.0, 39.0, 28.0, 23.0, 27.0, 10.0, 11.0, 15.0, 6.0, 15.0, 8.0, 3.0, 5.0, 6.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-90.875, -88.244140625, -85.61328125, -82.982421875, -80.3515625, -77.720703125, -75.08984375, -72.458984375, -69.828125, -67.197265625, -64.56640625, -61.935546875, -59.3046875, -56.673828125, -54.04296875, -51.412109375, -48.78125, -46.150390625, -43.51953125, -40.888671875, -38.2578125, -35.626953125, -32.99609375, -30.365234375, -27.734375, -25.103515625, -22.47265625, -19.841796875, -17.2109375, -14.580078125, -11.94921875, -9.318359375, -6.6875, -4.056640625, -1.42578125, 1.205078125, 3.8359375, 6.466796875, 9.09765625, 11.728515625, 14.359375, 16.990234375, 19.62109375, 22.251953125, 24.8828125, 27.513671875, 30.14453125, 32.775390625, 35.40625, 38.037109375, 40.66796875, 43.298828125, 45.9296875, 48.560546875, 51.19140625, 53.822265625, 56.453125, 59.083984375, 61.71484375, 64.345703125, 66.9765625, 69.607421875, 72.23828125, 74.869140625, 77.5]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 851.0, 161.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-112.76287078857422, -104.56771850585938, -96.37256622314453, -88.17741394042969, -79.98226928710938, -71.787109375, -63.59196472167969, -55.396812438964844, -47.20166015625, -39.006507873535156, -30.811357498168945, -22.616207122802734, -14.42105484008789, -6.225902557373047, 1.9692459106445312, 10.164398193359375, 18.35955047607422, 26.554702758789062, 34.749855041503906, 42.945003509521484, 51.14015579223633, 59.33530807495117, 67.53045654296875, 75.7256088256836, 83.92076110839844, 92.11591339111328, 100.31106567382812, 108.50621032714844, 116.70137023925781, 124.89651489257812, 133.0916748046875, 141.2868194580078, 149.48196411132812, 157.67710876464844, 165.8722686767578, 174.06741333007812, 182.2625732421875, 190.4577178955078, 198.65286254882812, 206.8480224609375, 215.04318237304688, 223.2383270263672, 231.43348693847656, 239.62863159179688, 247.82379150390625, 256.0189514160156, 264.2140808105469, 272.40924072265625, 280.6043701171875, 288.7995300292969, 296.9946594238281, 305.1898193359375, 313.3849792480469, 321.58013916015625, 329.7752685546875, 337.9704284667969, 346.16558837890625, 354.3607482910156, 362.5558776855469, 370.75103759765625, 378.9461975097656, 387.141357421875, 395.33648681640625, 403.5316467285156, 411.726806640625]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 6.0, 4.0, 4.0, 8.0, 6.0, 8.0, 14.0, 13.0, 16.0, 16.0, 16.0, 27.0, 30.0, 26.0, 35.0, 29.0, 42.0, 26.0, 38.0, 43.0, 38.0, 39.0, 49.0, 36.0, 56.0, 44.0, 38.0, 39.0, 30.0, 28.0, 25.0, 30.0, 24.0, 25.0, 17.0, 12.0, 10.0, 13.0, 10.0, 12.0, 5.0, 5.0, 4.0, 1.0, 3.0, 1.0, 4.0, 0.0, 1.0, 3.0], "bins": [-88.69593811035156, -86.2676010131836, -83.83926391601562, -81.41091918945312, -78.98258209228516, -76.55424499511719, -74.12590026855469, -71.69756317138672, -69.26922607421875, -66.84088897705078, -64.41255187988281, -61.98420715332031, -59.555870056152344, -57.127532958984375, -54.69919204711914, -52.270851135253906, -49.84251403808594, -47.41417694091797, -44.985836029052734, -42.5574951171875, -40.12915802001953, -37.70082092285156, -35.27248001098633, -32.844139099121094, -30.415802001953125, -27.987462997436523, -25.559123992919922, -23.13078498840332, -20.70244598388672, -18.274106979370117, -15.845767974853516, -13.417428970336914, -10.989089965820312, -8.560750961303711, -6.132411956787109, -3.704072952270508, -1.2757339477539062, 1.1526050567626953, 3.580944061279297, 6.009283065795898, 8.4376220703125, 10.865961074829102, 13.294300079345703, 15.722639083862305, 18.150978088378906, 20.579317092895508, 23.00765609741211, 25.43599510192871, 27.864334106445312, 30.292673110961914, 32.721012115478516, 35.14935302734375, 37.57769012451172, 40.00602722167969, 42.43436813354492, 44.862709045410156, 47.291046142578125, 49.719383239746094, 52.14772415161133, 54.57606506347656, 57.00440216064453, 59.4327392578125, 61.861080169677734, 64.28942108154297, 66.71775817871094]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 6.0, 6.0, 3.0, 13.0, 17.0, 12.0, 17.0, 14.0, 17.0, 14.0, 21.0, 33.0, 29.0, 36.0, 35.0, 47.0, 36.0, 42.0, 45.0, 40.0, 53.0, 40.0, 52.0, 43.0, 52.0, 40.0, 25.0, 33.0, 31.0, 29.0, 22.0, 21.0, 15.0, 12.0, 7.0, 11.0, 7.0, 6.0, 7.0, 3.0, 0.0, 1.0, 4.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.875, -8.5777587890625, -8.280517578125, -7.9832763671875, -7.68603515625, -7.3887939453125, -7.091552734375, -6.7943115234375, -6.4970703125, -6.1998291015625, -5.902587890625, -5.6053466796875, -5.30810546875, -5.0108642578125, -4.713623046875, -4.4163818359375, -4.119140625, -3.8218994140625, -3.524658203125, -3.2274169921875, -2.93017578125, -2.6329345703125, -2.335693359375, -2.0384521484375, -1.7412109375, -1.4439697265625, -1.146728515625, -0.8494873046875, -0.55224609375, -0.2550048828125, 0.042236328125, 0.3394775390625, 0.63671875, 0.9339599609375, 1.231201171875, 1.5284423828125, 1.82568359375, 2.1229248046875, 2.420166015625, 2.7174072265625, 3.0146484375, 3.3118896484375, 3.609130859375, 3.9063720703125, 4.20361328125, 4.5008544921875, 4.798095703125, 5.0953369140625, 5.392578125, 5.6898193359375, 5.987060546875, 6.2843017578125, 6.58154296875, 6.8787841796875, 7.176025390625, 7.4732666015625, 7.7705078125, 8.0677490234375, 8.364990234375, 8.6622314453125, 8.95947265625, 9.2567138671875, 9.553955078125, 9.8511962890625, 10.1484375]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 9.0, 8.0, 14.0, 10.0, 21.0, 22.0, 19.0, 19.0, 34.0, 30.0, 45.0, 73.0, 120.0, 195.0, 319.0, 554.0, 1404.0, 3646.0, 12227.0, 62790.0, 360508.0, 1381804.0, 1658204.0, 579490.0, 105865.0, 18630.0, 4816.0, 1657.0, 753.0, 349.0, 193.0, 117.0, 86.0, 51.0, 54.0, 32.0, 25.0, 17.0, 14.0, 14.0, 5.0, 11.0, 5.0, 8.0, 3.0, 7.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-12.2734375, -11.8916015625, -11.509765625, -11.1279296875, -10.74609375, -10.3642578125, -9.982421875, -9.6005859375, -9.21875, -8.8369140625, -8.455078125, -8.0732421875, -7.69140625, -7.3095703125, -6.927734375, -6.5458984375, -6.1640625, -5.7822265625, -5.400390625, -5.0185546875, -4.63671875, -4.2548828125, -3.873046875, -3.4912109375, -3.109375, -2.7275390625, -2.345703125, -1.9638671875, -1.58203125, -1.2001953125, -0.818359375, -0.4365234375, -0.0546875, 0.3271484375, 0.708984375, 1.0908203125, 1.47265625, 1.8544921875, 2.236328125, 2.6181640625, 3.0, 3.3818359375, 3.763671875, 4.1455078125, 4.52734375, 4.9091796875, 5.291015625, 5.6728515625, 6.0546875, 6.4365234375, 6.818359375, 7.2001953125, 7.58203125, 7.9638671875, 8.345703125, 8.7275390625, 9.109375, 9.4912109375, 9.873046875, 10.2548828125, 10.63671875, 11.0185546875, 11.400390625, 11.7822265625, 12.1640625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 9.0, 5.0, 9.0, 12.0, 17.0, 16.0, 34.0, 55.0, 67.0, 82.0, 113.0, 176.0, 225.0, 324.0, 395.0, 484.0, 481.0, 408.0, 312.0, 197.0, 177.0, 132.0, 111.0, 68.0, 46.0, 40.0, 25.0, 20.0, 9.0, 11.0, 8.0, 5.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.1875, -17.617919921875, -17.04833984375, -16.478759765625, -15.9091796875, -15.339599609375, -14.77001953125, -14.200439453125, -13.630859375, -13.061279296875, -12.49169921875, -11.922119140625, -11.3525390625, -10.782958984375, -10.21337890625, -9.643798828125, -9.07421875, -8.504638671875, -7.93505859375, -7.365478515625, -6.7958984375, -6.226318359375, -5.65673828125, -5.087158203125, -4.517578125, -3.947998046875, -3.37841796875, -2.808837890625, -2.2392578125, -1.669677734375, -1.10009765625, -0.530517578125, 0.0390625, 0.608642578125, 1.17822265625, 1.747802734375, 2.3173828125, 2.886962890625, 3.45654296875, 4.026123046875, 4.595703125, 5.165283203125, 5.73486328125, 6.304443359375, 6.8740234375, 7.443603515625, 8.01318359375, 8.582763671875, 9.15234375, 9.721923828125, 10.29150390625, 10.861083984375, 11.4306640625, 12.000244140625, 12.56982421875, 13.139404296875, 13.708984375, 14.278564453125, 14.84814453125, 15.417724609375, 15.9873046875, 16.556884765625, 17.12646484375, 17.696044921875, 18.265625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 0.0, 2.0, 6.0, 4.0, 12.0, 9.0, 18.0, 21.0, 23.0, 41.0, 43.0, 62.0, 87.0, 114.0, 145.0, 167.0, 218.0, 310.0, 418.0, 812.0, 2686.0, 149096.0, 4015268.0, 21087.0, 1562.0, 629.0, 362.0, 252.0, 204.0, 153.0, 137.0, 91.0, 59.0, 42.0, 32.0, 36.0, 22.0, 14.0, 7.0, 8.0, 9.0, 1.0, 6.0, 2.0, 2.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-68.0, -65.830078125, -63.66015625, -61.490234375, -59.3203125, -57.150390625, -54.98046875, -52.810546875, -50.640625, -48.470703125, -46.30078125, -44.130859375, -41.9609375, -39.791015625, -37.62109375, -35.451171875, -33.28125, -31.111328125, -28.94140625, -26.771484375, -24.6015625, -22.431640625, -20.26171875, -18.091796875, -15.921875, -13.751953125, -11.58203125, -9.412109375, -7.2421875, -5.072265625, -2.90234375, -0.732421875, 1.4375, 3.607421875, 5.77734375, 7.947265625, 10.1171875, 12.287109375, 14.45703125, 16.626953125, 18.796875, 20.966796875, 23.13671875, 25.306640625, 27.4765625, 29.646484375, 31.81640625, 33.986328125, 36.15625, 38.326171875, 40.49609375, 42.666015625, 44.8359375, 47.005859375, 49.17578125, 51.345703125, 53.515625, 55.685546875, 57.85546875, 60.025390625, 62.1953125, 64.365234375, 66.53515625, 68.705078125, 70.875]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 27.0, 233.0, 466.0, 251.0, 33.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-139.7758026123047, -132.19021606445312, -124.6046142578125, -117.01902770996094, -109.43342590332031, -101.84783935546875, -94.26224517822266, -86.67665100097656, -79.09105682373047, -71.50546264648438, -63.91986846923828, -56.33427810668945, -48.74868392944336, -41.163089752197266, -33.57749938964844, -25.991905212402344, -18.40631103515625, -10.820717811584473, -3.2351245880126953, 4.350467681884766, 11.93606185913086, 19.521656036376953, 27.10724639892578, 34.692840576171875, 42.27843475341797, 49.86402893066406, 57.449623107910156, 65.03521728515625, 72.62080383300781, 80.20640563964844, 87.7919921875, 95.3775863647461, 102.96316528320312, 110.54875946044922, 118.13435363769531, 125.71994018554688, 133.3055419921875, 140.89112854003906, 148.47671508789062, 156.06231689453125, 163.64791870117188, 171.23350524902344, 178.81910705566406, 186.40469360351562, 193.99029541015625, 201.5758819580078, 209.16146850585938, 216.7470703125, 224.33265686035156, 231.91824340820312, 239.50384521484375, 247.0894317626953, 254.67503356933594, 262.2606201171875, 269.8462219238281, 277.43182373046875, 285.01739501953125, 292.6029968261719, 300.1885681152344, 307.774169921875, 315.3597717285156, 322.94537353515625, 330.53094482421875, 338.1165466308594, 345.7021484375]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 1.0, 11.0, 6.0, 6.0, 5.0, 6.0, 17.0, 16.0, 14.0, 18.0, 14.0, 22.0, 17.0, 33.0, 24.0, 29.0, 48.0, 35.0, 41.0, 37.0, 36.0, 33.0, 36.0, 46.0, 42.0, 39.0, 33.0, 36.0, 29.0, 36.0, 22.0, 29.0, 28.0, 23.0, 27.0, 20.0, 19.0, 6.0, 12.0, 13.0, 13.0, 8.0, 7.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.94775390625, -55.20804977416992, -53.468345642089844, -51.72864532470703, -49.98894119262695, -48.249237060546875, -46.50953674316406, -44.769832611083984, -43.030128479003906, -41.29042434692383, -39.55072021484375, -37.81101989746094, -36.07131576538086, -34.33161163330078, -32.59191131591797, -30.85220718383789, -29.112503051757812, -27.372798919677734, -25.63309669494629, -23.893394470214844, -22.153690338134766, -20.413986206054688, -18.674283981323242, -16.934581756591797, -15.194877624511719, -13.455174446105957, -11.715471267700195, -9.975768089294434, -8.236064910888672, -6.49636173248291, -4.756658554077148, -3.0169553756713867, -1.277252197265625, 0.4624509811401367, 2.2021541595458984, 3.94185733795166, 5.681560516357422, 7.421263694763184, 9.160966873168945, 10.900670051574707, 12.640373229980469, 14.38007640838623, 16.119779586791992, 17.859481811523438, 19.599185943603516, 21.338890075683594, 23.07859230041504, 24.818294525146484, 26.557998657226562, 28.29770278930664, 30.037405014038086, 31.77710723876953, 33.51681137084961, 35.25651550292969, 36.9962158203125, 38.73591995239258, 40.475624084472656, 42.215328216552734, 43.95503234863281, 45.694732666015625, 47.4344367980957, 49.17414093017578, 50.913841247558594, 52.65354537963867, 54.39324951171875]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 0.0, 5.0, 4.0, 8.0, 11.0, 13.0, 10.0, 18.0, 17.0, 16.0, 26.0, 29.0, 24.0, 27.0, 22.0, 37.0, 46.0, 36.0, 35.0, 41.0, 36.0, 35.0, 36.0, 42.0, 48.0, 34.0, 52.0, 36.0, 37.0, 33.0, 29.0, 26.0, 17.0, 20.0, 20.0, 16.0, 15.0, 9.0, 11.0, 5.0, 2.0, 3.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.2109375, -7.943359375, -7.67578125, -7.408203125, -7.140625, -6.873046875, -6.60546875, -6.337890625, -6.0703125, -5.802734375, -5.53515625, -5.267578125, -5.0, -4.732421875, -4.46484375, -4.197265625, -3.9296875, -3.662109375, -3.39453125, -3.126953125, -2.859375, -2.591796875, -2.32421875, -2.056640625, -1.7890625, -1.521484375, -1.25390625, -0.986328125, -0.71875, -0.451171875, -0.18359375, 0.083984375, 0.3515625, 0.619140625, 0.88671875, 1.154296875, 1.421875, 1.689453125, 1.95703125, 2.224609375, 2.4921875, 2.759765625, 3.02734375, 3.294921875, 3.5625, 3.830078125, 4.09765625, 4.365234375, 4.6328125, 4.900390625, 5.16796875, 5.435546875, 5.703125, 5.970703125, 6.23828125, 6.505859375, 6.7734375, 7.041015625, 7.30859375, 7.576171875, 7.84375, 8.111328125, 8.37890625, 8.646484375, 8.9140625]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 4.0, 4.0, 7.0, 10.0, 14.0, 18.0, 37.0, 48.0, 69.0, 93.0, 155.0, 199.0, 270.0, 437.0, 620.0, 905.0, 1400.0, 1927.0, 2935.0, 4571.0, 7153.0, 10809.0, 16795.0, 26206.0, 40695.0, 63799.0, 98780.0, 153874.0, 198770.0, 149277.0, 95537.0, 61345.0, 39451.0, 25291.0, 16147.0, 10556.0, 6950.0, 4481.0, 2942.0, 1929.0, 1293.0, 862.0, 625.0, 428.0, 269.0, 167.0, 150.0, 87.0, 56.0, 43.0, 23.0, 15.0, 10.0, 11.0, 8.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.8427734375, -0.8159866333007812, -0.7891998291015625, -0.7624130249023438, -0.735626220703125, -0.7088394165039062, -0.6820526123046875, -0.6552658081054688, -0.62847900390625, -0.6016921997070312, -0.5749053955078125, -0.5481185913085938, -0.521331787109375, -0.49454498291015625, -0.4677581787109375, -0.44097137451171875, -0.4141845703125, -0.38739776611328125, -0.3606109619140625, -0.33382415771484375, -0.307037353515625, -0.28025054931640625, -0.2534637451171875, -0.22667694091796875, -0.19989013671875, -0.17310333251953125, -0.1463165283203125, -0.11952972412109375, -0.092742919921875, -0.06595611572265625, -0.0391693115234375, -0.01238250732421875, 0.014404296875, 0.04119110107421875, 0.0679779052734375, 0.09476470947265625, 0.121551513671875, 0.14833831787109375, 0.1751251220703125, 0.20191192626953125, 0.22869873046875, 0.25548553466796875, 0.2822723388671875, 0.30905914306640625, 0.335845947265625, 0.36263275146484375, 0.3894195556640625, 0.41620635986328125, 0.4429931640625, 0.46977996826171875, 0.4965667724609375, 0.5233535766601562, 0.550140380859375, 0.5769271850585938, 0.6037139892578125, 0.6305007934570312, 0.65728759765625, 0.6840744018554688, 0.7108612060546875, 0.7376480102539062, 0.764434814453125, 0.7912216186523438, 0.8180084228515625, 0.8447952270507812, 0.87158203125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 1.0, 0.0, 6.0, 8.0, 9.0, 12.0, 11.0, 9.0, 9.0, 22.0, 21.0, 17.0, 21.0, 20.0, 31.0, 29.0, 22.0, 27.0, 26.0, 41.0, 37.0, 32.0, 36.0, 1063.0, 50.0, 38.0, 33.0, 41.0, 46.0, 37.0, 28.0, 27.0, 28.0, 31.0, 23.0, 22.0, 20.0, 15.0, 9.0, 14.0, 8.0, 8.0, 7.0, 7.0, 4.0, 7.0, 1.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-5.015625, -4.8631591796875, -4.710693359375, -4.5582275390625, -4.40576171875, -4.2532958984375, -4.100830078125, -3.9483642578125, -3.7958984375, -3.6434326171875, -3.490966796875, -3.3385009765625, -3.18603515625, -3.0335693359375, -2.881103515625, -2.7286376953125, -2.576171875, -2.4237060546875, -2.271240234375, -2.1187744140625, -1.96630859375, -1.8138427734375, -1.661376953125, -1.5089111328125, -1.3564453125, -1.2039794921875, -1.051513671875, -0.8990478515625, -0.74658203125, -0.5941162109375, -0.441650390625, -0.2891845703125, -0.13671875, 0.0157470703125, 0.168212890625, 0.3206787109375, 0.47314453125, 0.6256103515625, 0.778076171875, 0.9305419921875, 1.0830078125, 1.2354736328125, 1.387939453125, 1.5404052734375, 1.69287109375, 1.8453369140625, 1.997802734375, 2.1502685546875, 2.302734375, 2.4552001953125, 2.607666015625, 2.7601318359375, 2.91259765625, 3.0650634765625, 3.217529296875, 3.3699951171875, 3.5224609375, 3.6749267578125, 3.827392578125, 3.9798583984375, 4.13232421875, 4.2847900390625, 4.437255859375, 4.5897216796875, 4.7421875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 7.0, 14.0, 20.0, 27.0, 38.0, 45.0, 83.0, 103.0, 158.0, 224.0, 305.0, 447.0, 664.0, 888.0, 1385.0, 2057.0, 3141.0, 4684.0, 6941.0, 10639.0, 16078.0, 24609.0, 38432.0, 59094.0, 93164.0, 148224.0, 1252844.0, 156729.0, 97778.0, 61723.0, 40112.0, 26048.0, 17139.0, 11069.0, 7324.0, 4888.0, 3116.0, 2180.0, 1543.0, 975.0, 672.0, 456.0, 353.0, 224.0, 132.0, 95.0, 86.0, 56.0, 44.0, 24.0, 19.0, 11.0, 11.0, 7.0, 5.0, 5.0], "bins": [-0.8779296875, -0.8525238037109375, -0.827117919921875, -0.8017120361328125, -0.77630615234375, -0.7509002685546875, -0.725494384765625, -0.7000885009765625, -0.6746826171875, -0.6492767333984375, -0.623870849609375, -0.5984649658203125, -0.57305908203125, -0.5476531982421875, -0.522247314453125, -0.4968414306640625, -0.471435546875, -0.4460296630859375, -0.420623779296875, -0.3952178955078125, -0.36981201171875, -0.3444061279296875, -0.319000244140625, -0.2935943603515625, -0.2681884765625, -0.2427825927734375, -0.217376708984375, -0.1919708251953125, -0.16656494140625, -0.1411590576171875, -0.115753173828125, -0.0903472900390625, -0.06494140625, -0.0395355224609375, -0.014129638671875, 0.0112762451171875, 0.03668212890625, 0.0620880126953125, 0.087493896484375, 0.1128997802734375, 0.1383056640625, 0.1637115478515625, 0.189117431640625, 0.2145233154296875, 0.23992919921875, 0.2653350830078125, 0.290740966796875, 0.3161468505859375, 0.341552734375, 0.3669586181640625, 0.392364501953125, 0.4177703857421875, 0.44317626953125, 0.4685821533203125, 0.493988037109375, 0.5193939208984375, 0.5447998046875, 0.5702056884765625, 0.595611572265625, 0.6210174560546875, 0.64642333984375, 0.6718292236328125, 0.697235107421875, 0.7226409912109375, 0.748046875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 3.0, 6.0, 4.0, 11.0, 4.0, 17.0, 17.0, 14.0, 24.0, 33.0, 42.0, 52.0, 57.0, 56.0, 63.0, 76.0, 76.0, 64.0, 55.0, 59.0, 48.0, 47.0, 33.0, 27.0, 22.0, 23.0, 13.0, 10.0, 13.0, 4.0, 3.0, 5.0, 6.0, 1.0, 4.0, 2.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0030765533447265625, -0.0029673874378204346, -0.0028582215309143066, -0.0027490556240081787, -0.0026398897171020508, -0.002530723810195923, -0.002421557903289795, -0.002312391996383667, -0.002203226089477539, -0.002094060182571411, -0.001984894275665283, -0.0018757283687591553, -0.0017665624618530273, -0.0016573965549468994, -0.0015482306480407715, -0.0014390647411346436, -0.0013298988342285156, -0.0012207329273223877, -0.0011115670204162598, -0.0010024011135101318, -0.0008932352066040039, -0.000784069299697876, -0.000674903392791748, -0.0005657374858856201, -0.0004565715789794922, -0.00034740567207336426, -0.00023823976516723633, -0.0001290738582611084, -1.990795135498047e-05, 8.925795555114746e-05, 0.0001984238624572754, 0.0003075897693634033, 0.00041675567626953125, 0.0005259215831756592, 0.0006350874900817871, 0.000744253396987915, 0.000853419303894043, 0.0009625852108001709, 0.0010717511177062988, 0.0011809170246124268, 0.0012900829315185547, 0.0013992488384246826, 0.0015084147453308105, 0.0016175806522369385, 0.0017267465591430664, 0.0018359124660491943, 0.0019450783729553223, 0.00205424427986145, 0.002163410186767578, 0.002272576093673706, 0.002381742000579834, 0.002490907907485962, 0.00260007381439209, 0.0027092397212982178, 0.0028184056282043457, 0.0029275715351104736, 0.0030367374420166016, 0.0031459033489227295, 0.0032550692558288574, 0.0033642351627349854, 0.0034734010696411133, 0.003582566976547241, 0.003691732883453369, 0.003800898790359497, 0.003910064697265625]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 6.0, 3.0, 5.0, 3.0, 5.0, 8.0, 15.0, 12.0, 20.0, 30.0, 26.0, 41.0, 50.0, 57.0, 89.0, 151.0, 242.0, 561.0, 5336.0, 1037430.0, 3273.0, 495.0, 214.0, 127.0, 104.0, 66.0, 40.0, 39.0, 23.0, 23.0, 11.0, 12.0, 9.0, 2.0, 6.0, 7.0, 3.0, 4.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.08380126953125, -0.08129596710205078, -0.07879066467285156, -0.07628536224365234, -0.07378005981445312, -0.0712747573852539, -0.06876945495605469, -0.06626415252685547, -0.06375885009765625, -0.06125354766845703, -0.05874824523925781, -0.056242942810058594, -0.053737640380859375, -0.051232337951660156, -0.04872703552246094, -0.04622173309326172, -0.0437164306640625, -0.04121112823486328, -0.03870582580566406, -0.036200523376464844, -0.033695220947265625, -0.031189918518066406, -0.028684616088867188, -0.02617931365966797, -0.02367401123046875, -0.02116870880126953, -0.018663406372070312, -0.016158103942871094, -0.013652801513671875, -0.011147499084472656, -0.008642196655273438, -0.006136894226074219, -0.003631591796875, -0.0011262893676757812, 0.0013790130615234375, 0.0038843154907226562, 0.006389617919921875, 0.008894920349121094, 0.011400222778320312, 0.013905525207519531, 0.01641082763671875, 0.01891613006591797, 0.021421432495117188, 0.023926734924316406, 0.026432037353515625, 0.028937339782714844, 0.03144264221191406, 0.03394794464111328, 0.0364532470703125, 0.03895854949951172, 0.04146385192871094, 0.043969154357910156, 0.046474456787109375, 0.048979759216308594, 0.05148506164550781, 0.05399036407470703, 0.05649566650390625, 0.05900096893310547, 0.06150627136230469, 0.0640115737915039, 0.06651687622070312, 0.06902217864990234, 0.07152748107910156, 0.07403278350830078, 0.0765380859375]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 8.0, 142.0, 674.0, 184.0, 8.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012034166138619184, -0.0008625187911093235, -0.0005216210265643895, -0.00018072326201945543, 0.00016017456073313951, 0.0005010723834857345, 0.0008419700898230076, 0.0011828679125756025, 0.0015237657353281975, 0.0018646635580807924, 0.0022055613808333874, 0.0025464589707553387, 0.0028873570263385773, 0.0032282546162605286, 0.0035691524390131235, 0.0039100502617657185, 0.004250948317348957, 0.004591845907270908, 0.004932743962854147, 0.005273641552776098, 0.005614539608359337, 0.005955437198281288, 0.0062963347882032394, 0.006637232843786478, 0.006978130433708429, 0.007319028023630381, 0.007659926079213619, 0.00800082366913557, 0.008341721259057522, 0.008682619780302048, 0.009023517370223999, 0.00936441496014595, 0.009705313481390476, 0.010046211071312428, 0.010387108661234379, 0.010728007182478905, 0.011068904772400856, 0.011409802362322807, 0.011750699952244759, 0.01209159754216671, 0.012432496063411236, 0.012773393653333187, 0.013114291243255138, 0.013455189764499664, 0.013796087354421616, 0.014136984944343567, 0.014477882534265518, 0.01481878012418747, 0.01515967771410942, 0.015500575304031372, 0.015841472893953323, 0.016182370483875275, 0.016523268073797226, 0.016864167526364326, 0.017205065116286278, 0.01754596270620823, 0.01788686029613018, 0.01822775788605213, 0.018568655475974083, 0.018909553065896034, 0.019250450655817986, 0.019591350108385086, 0.019932247698307037, 0.02027314528822899, 0.02061404287815094]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 4.0, 4.0, 3.0, 9.0, 7.0, 10.0, 7.0, 5.0, 12.0, 15.0, 14.0, 21.0, 19.0, 10.0, 23.0, 21.0, 24.0, 36.0, 27.0, 26.0, 31.0, 37.0, 35.0, 28.0, 26.0, 46.0, 34.0, 40.0, 32.0, 35.0, 25.0, 27.0, 18.0, 31.0, 25.0, 31.0, 32.0, 22.0, 21.0, 14.0, 16.0, 15.0, 7.0, 15.0, 11.0, 9.0, 8.0, 5.0, 11.0, 6.0, 4.0, 5.0, 2.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0], "bins": [-0.0013009309768676758, -0.0012572156265377998, -0.0012135002762079239, -0.001169784925878048, -0.001126069575548172, -0.001082354225218296, -0.00103863887488842, -0.0009949235245585442, -0.0009512081742286682, -0.0009074928238987923, -0.0008637774735689163, -0.0008200621232390404, -0.0007763467729091644, -0.0007326314225792885, -0.0006889160722494125, -0.0006452007219195366, -0.0006014853715896606, -0.0005577700212597847, -0.0005140546709299088, -0.0004703393206000328, -0.00042662397027015686, -0.0003829086199402809, -0.00033919326961040497, -0.000295477919280529, -0.0002517625689506531, -0.00020804721862077713, -0.00016433186829090118, -0.00012061651796102524, -7.690116763114929e-05, -3.3185817301273346e-05, 1.05295330286026e-05, 5.4244883358478546e-05, 9.796023368835449e-05, 0.00014167558401823044, 0.00018539093434810638, 0.00022910628467798233, 0.0002728216350078583, 0.0003165369853377342, 0.00036025233566761017, 0.0004039676859974861, 0.00044768303632736206, 0.000491398386657238, 0.000535113736987114, 0.0005788290873169899, 0.0006225444376468658, 0.0006662597879767418, 0.0007099751383066177, 0.0007536904886364937, 0.0007974058389663696, 0.0008411211892962456, 0.0008848365396261215, 0.0009285518899559975, 0.0009722672402858734, 0.0010159825906157494, 0.0010596979409456253, 0.0011034132912755013, 0.0011471286416053772, 0.0011908439919352531, 0.001234559342265129, 0.001278274692595005, 0.001321990042924881, 0.001365705393254757, 0.0014094207435846329, 0.0014531360939145088, 0.0014968514442443848]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 0.0, 5.0, 4.0, 8.0, 11.0, 13.0, 10.0, 18.0, 17.0, 16.0, 26.0, 29.0, 24.0, 27.0, 22.0, 37.0, 46.0, 36.0, 35.0, 41.0, 36.0, 35.0, 36.0, 42.0, 48.0, 34.0, 52.0, 36.0, 37.0, 33.0, 29.0, 26.0, 17.0, 19.0, 21.0, 16.0, 15.0, 9.0, 11.0, 5.0, 2.0, 3.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.2109375, -7.943359375, -7.67578125, -7.408203125, -7.140625, -6.873046875, -6.60546875, -6.337890625, -6.0703125, -5.802734375, -5.53515625, -5.267578125, -5.0, -4.732421875, -4.46484375, -4.197265625, -3.9296875, -3.662109375, -3.39453125, -3.126953125, -2.859375, -2.591796875, -2.32421875, -2.056640625, -1.7890625, -1.521484375, -1.25390625, -0.986328125, -0.71875, -0.451171875, -0.18359375, 0.083984375, 0.3515625, 0.619140625, 0.88671875, 1.154296875, 1.421875, 1.689453125, 1.95703125, 2.224609375, 2.4921875, 2.759765625, 3.02734375, 3.294921875, 3.5625, 3.830078125, 4.09765625, 4.365234375, 4.6328125, 4.900390625, 5.16796875, 5.435546875, 5.703125, 5.970703125, 6.23828125, 6.505859375, 6.7734375, 7.041015625, 7.30859375, 7.576171875, 7.84375, 8.111328125, 8.37890625, 8.646484375, 8.9140625]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 4.0, 5.0, 5.0, 9.0, 7.0, 15.0, 14.0, 22.0, 41.0, 39.0, 49.0, 62.0, 113.0, 147.0, 302.0, 533.0, 1044.0, 2149.0, 4501.0, 9358.0, 20075.0, 44755.0, 109159.0, 304671.0, 337067.0, 122406.0, 49525.0, 22241.0, 10498.0, 4893.0, 2304.0, 1149.0, 558.0, 318.0, 172.0, 94.0, 79.0, 38.0, 39.0, 21.0, 19.0, 20.0, 5.0, 8.0, 10.0, 5.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.16796875, -6.93719482421875, -6.7064208984375, -6.47564697265625, -6.244873046875, -6.01409912109375, -5.7833251953125, -5.55255126953125, -5.32177734375, -5.09100341796875, -4.8602294921875, -4.62945556640625, -4.398681640625, -4.16790771484375, -3.9371337890625, -3.70635986328125, -3.4755859375, -3.24481201171875, -3.0140380859375, -2.78326416015625, -2.552490234375, -2.32171630859375, -2.0909423828125, -1.86016845703125, -1.62939453125, -1.39862060546875, -1.1678466796875, -0.93707275390625, -0.706298828125, -0.47552490234375, -0.2447509765625, -0.01397705078125, 0.216796875, 0.44757080078125, 0.6783447265625, 0.90911865234375, 1.139892578125, 1.37066650390625, 1.6014404296875, 1.83221435546875, 2.06298828125, 2.29376220703125, 2.5245361328125, 2.75531005859375, 2.986083984375, 3.21685791015625, 3.4476318359375, 3.67840576171875, 3.9091796875, 4.13995361328125, 4.3707275390625, 4.60150146484375, 4.832275390625, 5.06304931640625, 5.2938232421875, 5.52459716796875, 5.75537109375, 5.98614501953125, 6.2169189453125, 6.44769287109375, 6.678466796875, 6.90924072265625, 7.1400146484375, 7.37078857421875, 7.6015625]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 5.0, 5.0, 6.0, 8.0, 6.0, 9.0, 8.0, 8.0, 13.0, 18.0, 15.0, 21.0, 28.0, 32.0, 20.0, 35.0, 26.0, 33.0, 41.0, 38.0, 51.0, 70.0, 192.0, 1552.0, 252.0, 112.0, 61.0, 49.0, 36.0, 42.0, 31.0, 23.0, 26.0, 18.0, 24.0, 20.0, 16.0, 16.0, 18.0, 10.0, 10.0, 2.0, 8.0, 3.0, 6.0, 5.0, 9.0, 2.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0], "bins": [-26.640625, -25.849609375, -25.05859375, -24.267578125, -23.4765625, -22.685546875, -21.89453125, -21.103515625, -20.3125, -19.521484375, -18.73046875, -17.939453125, -17.1484375, -16.357421875, -15.56640625, -14.775390625, -13.984375, -13.193359375, -12.40234375, -11.611328125, -10.8203125, -10.029296875, -9.23828125, -8.447265625, -7.65625, -6.865234375, -6.07421875, -5.283203125, -4.4921875, -3.701171875, -2.91015625, -2.119140625, -1.328125, -0.537109375, 0.25390625, 1.044921875, 1.8359375, 2.626953125, 3.41796875, 4.208984375, 5.0, 5.791015625, 6.58203125, 7.373046875, 8.1640625, 8.955078125, 9.74609375, 10.537109375, 11.328125, 12.119140625, 12.91015625, 13.701171875, 14.4921875, 15.283203125, 16.07421875, 16.865234375, 17.65625, 18.447265625, 19.23828125, 20.029296875, 20.8203125, 21.611328125, 22.40234375, 23.193359375, 23.984375]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 8.0, 10.0, 12.0, 15.0, 16.0, 27.0, 38.0, 51.0, 65.0, 103.0, 130.0, 187.0, 278.0, 639.0, 2576.0, 608920.0, 2526801.0, 4028.0, 704.0, 370.0, 206.0, 116.0, 126.0, 82.0, 57.0, 33.0, 19.0, 24.0, 17.0, 15.0, 13.0, 7.0, 10.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.375, -55.4013671875, -53.427734375, -51.4541015625, -49.48046875, -47.5068359375, -45.533203125, -43.5595703125, -41.5859375, -39.6123046875, -37.638671875, -35.6650390625, -33.69140625, -31.7177734375, -29.744140625, -27.7705078125, -25.796875, -23.8232421875, -21.849609375, -19.8759765625, -17.90234375, -15.9287109375, -13.955078125, -11.9814453125, -10.0078125, -8.0341796875, -6.060546875, -4.0869140625, -2.11328125, -0.1396484375, 1.833984375, 3.8076171875, 5.78125, 7.7548828125, 9.728515625, 11.7021484375, 13.67578125, 15.6494140625, 17.623046875, 19.5966796875, 21.5703125, 23.5439453125, 25.517578125, 27.4912109375, 29.46484375, 31.4384765625, 33.412109375, 35.3857421875, 37.359375, 39.3330078125, 41.306640625, 43.2802734375, 45.25390625, 47.2275390625, 49.201171875, 51.1748046875, 53.1484375, 55.1220703125, 57.095703125, 59.0693359375, 61.04296875, 63.0166015625, 64.990234375, 66.9638671875, 68.9375]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 99.0, 365.0, 415.0, 115.0, 16.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.56388854980469, -87.08901977539062, -83.61415100097656, -80.1392822265625, -76.66441345214844, -73.18954467773438, -69.71467590332031, -66.23979949951172, -62.764930725097656, -59.290061950683594, -55.81519317626953, -52.34032440185547, -48.86545181274414, -45.39058303833008, -41.915714263916016, -38.44084167480469, -34.96597671508789, -31.491107940673828, -28.016237258911133, -24.54136848449707, -21.066497802734375, -17.591629028320312, -14.11676025390625, -10.641889572143555, -7.167020797729492, -3.6921513080596924, -0.21728181838989258, 3.257587432861328, 6.732457160949707, 10.207326889038086, 13.682195663452148, 17.157066345214844, 20.631935119628906, 24.10680389404297, 27.581674575805664, 31.056543350219727, 34.53141403198242, 38.006282806396484, 41.48115158081055, 44.956024169921875, 48.43089294433594, 51.90576171875, 55.38063049316406, 58.855499267578125, 62.33037185668945, 65.80523681640625, 69.28010559082031, 72.7549819946289, 76.22984313964844, 79.7047119140625, 83.17958068847656, 86.65444946289062, 90.12931823730469, 93.60418701171875, 97.07905578613281, 100.5539321899414, 104.02880096435547, 107.50366973876953, 110.9785385131836, 114.45340728759766, 117.92827606201172, 121.40315246582031, 124.87802124023438, 128.35289001464844, 131.8277587890625]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 7.0, 8.0, 10.0, 8.0, 11.0, 15.0, 18.0, 21.0, 14.0, 35.0, 16.0, 37.0, 25.0, 39.0, 34.0, 38.0, 40.0, 47.0, 45.0, 38.0, 48.0, 38.0, 50.0, 47.0, 36.0, 30.0, 43.0, 41.0, 20.0, 22.0, 19.0, 10.0, 12.0, 13.0, 22.0, 8.0, 9.0, 11.0, 7.0, 4.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-83.93081665039062, -81.49693298339844, -79.06304931640625, -76.62915802001953, -74.19527435302734, -71.76139068603516, -69.32750701904297, -66.89362335205078, -64.45973205566406, -62.025848388671875, -59.59196090698242, -57.158077239990234, -54.72418975830078, -52.290306091308594, -49.856422424316406, -47.42253875732422, -44.98865509033203, -42.554771423339844, -40.12088394165039, -37.6870002746582, -35.25311279296875, -32.81922912597656, -30.385345458984375, -27.951459884643555, -25.517574310302734, -23.083688735961914, -20.649803161621094, -18.215919494628906, -15.782033920288086, -13.348148345947266, -10.914263725280762, -8.480379104614258, -6.046485900878906, -3.612600803375244, -1.178715705871582, 1.25516939163208, 3.689054489135742, 6.1229400634765625, 8.556824684143066, 10.99070930480957, 13.42459487915039, 15.858480453491211, 18.29236602783203, 20.72624969482422, 23.16013526916504, 25.59402084350586, 28.027904510498047, 30.461790084838867, 32.89567565917969, 35.329559326171875, 37.76344680786133, 40.197330474853516, 42.63121795654297, 45.065101623535156, 47.498985290527344, 49.93286895751953, 52.366756439208984, 54.80064010620117, 57.234527587890625, 59.66841125488281, 62.102294921875, 64.53617858886719, 66.9700698852539, 69.4039535522461, 71.83783721923828]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 5.0, 4.0, 2.0, 9.0, 9.0, 12.0, 11.0, 18.0, 8.0, 17.0, 20.0, 26.0, 27.0, 26.0, 30.0, 26.0, 33.0, 29.0, 38.0, 36.0, 46.0, 41.0, 37.0, 49.0, 33.0, 45.0, 44.0, 39.0, 34.0, 25.0, 31.0, 31.0, 23.0, 22.0, 18.0, 18.0, 10.0, 13.0, 11.0, 13.0, 11.0, 5.0, 5.0, 5.0, 2.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.203125, -7.935546875, -7.66796875, -7.400390625, -7.1328125, -6.865234375, -6.59765625, -6.330078125, -6.0625, -5.794921875, -5.52734375, -5.259765625, -4.9921875, -4.724609375, -4.45703125, -4.189453125, -3.921875, -3.654296875, -3.38671875, -3.119140625, -2.8515625, -2.583984375, -2.31640625, -2.048828125, -1.78125, -1.513671875, -1.24609375, -0.978515625, -0.7109375, -0.443359375, -0.17578125, 0.091796875, 0.359375, 0.626953125, 0.89453125, 1.162109375, 1.4296875, 1.697265625, 1.96484375, 2.232421875, 2.5, 2.767578125, 3.03515625, 3.302734375, 3.5703125, 3.837890625, 4.10546875, 4.373046875, 4.640625, 4.908203125, 5.17578125, 5.443359375, 5.7109375, 5.978515625, 6.24609375, 6.513671875, 6.78125, 7.048828125, 7.31640625, 7.583984375, 7.8515625, 8.119140625, 8.38671875, 8.654296875, 8.921875]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 6.0, 4.0, 2.0, 8.0, 11.0, 12.0, 15.0, 28.0, 20.0, 25.0, 29.0, 50.0, 49.0, 62.0, 89.0, 128.0, 269.0, 817.0, 5707.0, 226037.0, 3620373.0, 331796.0, 6997.0, 901.0, 278.0, 142.0, 80.0, 78.0, 50.0, 46.0, 34.0, 33.0, 25.0, 16.0, 15.0, 12.0, 10.0, 8.0, 5.0, 7.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.1875, -31.1669921875, -30.146484375, -29.1259765625, -28.10546875, -27.0849609375, -26.064453125, -25.0439453125, -24.0234375, -23.0029296875, -21.982421875, -20.9619140625, -19.94140625, -18.9208984375, -17.900390625, -16.8798828125, -15.859375, -14.8388671875, -13.818359375, -12.7978515625, -11.77734375, -10.7568359375, -9.736328125, -8.7158203125, -7.6953125, -6.6748046875, -5.654296875, -4.6337890625, -3.61328125, -2.5927734375, -1.572265625, -0.5517578125, 0.46875, 1.4892578125, 2.509765625, 3.5302734375, 4.55078125, 5.5712890625, 6.591796875, 7.6123046875, 8.6328125, 9.6533203125, 10.673828125, 11.6943359375, 12.71484375, 13.7353515625, 14.755859375, 15.7763671875, 16.796875, 17.8173828125, 18.837890625, 19.8583984375, 20.87890625, 21.8994140625, 22.919921875, 23.9404296875, 24.9609375, 25.9814453125, 27.001953125, 28.0224609375, 29.04296875, 30.0634765625, 31.083984375, 32.1044921875, 33.125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 8.0, 7.0, 10.0, 10.0, 16.0, 22.0, 34.0, 40.0, 48.0, 60.0, 100.0, 161.0, 163.0, 254.0, 324.0, 403.0, 460.0, 429.0, 377.0, 294.0, 208.0, 161.0, 158.0, 88.0, 75.0, 40.0, 38.0, 27.0, 14.0, 11.0, 10.0, 13.0, 8.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.8515625, -15.36962890625, -14.8876953125, -14.40576171875, -13.923828125, -13.44189453125, -12.9599609375, -12.47802734375, -11.99609375, -11.51416015625, -11.0322265625, -10.55029296875, -10.068359375, -9.58642578125, -9.1044921875, -8.62255859375, -8.140625, -7.65869140625, -7.1767578125, -6.69482421875, -6.212890625, -5.73095703125, -5.2490234375, -4.76708984375, -4.28515625, -3.80322265625, -3.3212890625, -2.83935546875, -2.357421875, -1.87548828125, -1.3935546875, -0.91162109375, -0.4296875, 0.05224609375, 0.5341796875, 1.01611328125, 1.498046875, 1.97998046875, 2.4619140625, 2.94384765625, 3.42578125, 3.90771484375, 4.3896484375, 4.87158203125, 5.353515625, 5.83544921875, 6.3173828125, 6.79931640625, 7.28125, 7.76318359375, 8.2451171875, 8.72705078125, 9.208984375, 9.69091796875, 10.1728515625, 10.65478515625, 11.13671875, 11.61865234375, 12.1005859375, 12.58251953125, 13.064453125, 13.54638671875, 14.0283203125, 14.51025390625, 14.9921875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 0.0, 4.0, 4.0, 4.0, 9.0, 12.0, 13.0, 25.0, 23.0, 37.0, 50.0, 40.0, 49.0, 86.0, 85.0, 125.0, 162.0, 260.0, 319.0, 550.0, 1964.0, 142613.0, 4021117.0, 23838.0, 1214.0, 475.0, 304.0, 205.0, 147.0, 138.0, 92.0, 73.0, 55.0, 50.0, 37.0, 20.0, 16.0, 17.0, 9.0, 12.0, 12.0, 4.0, 5.0, 5.0, 4.0, 0.0, 2.0, 2.0, 1.0], "bins": [-84.875, -82.6025390625, -80.330078125, -78.0576171875, -75.78515625, -73.5126953125, -71.240234375, -68.9677734375, -66.6953125, -64.4228515625, -62.150390625, -59.8779296875, -57.60546875, -55.3330078125, -53.060546875, -50.7880859375, -48.515625, -46.2431640625, -43.970703125, -41.6982421875, -39.42578125, -37.1533203125, -34.880859375, -32.6083984375, -30.3359375, -28.0634765625, -25.791015625, -23.5185546875, -21.24609375, -18.9736328125, -16.701171875, -14.4287109375, -12.15625, -9.8837890625, -7.611328125, -5.3388671875, -3.06640625, -0.7939453125, 1.478515625, 3.7509765625, 6.0234375, 8.2958984375, 10.568359375, 12.8408203125, 15.11328125, 17.3857421875, 19.658203125, 21.9306640625, 24.203125, 26.4755859375, 28.748046875, 31.0205078125, 33.29296875, 35.5654296875, 37.837890625, 40.1103515625, 42.3828125, 44.6552734375, 46.927734375, 49.2001953125, 51.47265625, 53.7451171875, 56.017578125, 58.2900390625, 60.5625]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 10.0, 41.0, 175.0, 381.0, 279.0, 112.0, 12.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-149.92269897460938, -144.72962951660156, -139.53656005859375, -134.343505859375, -129.1504364013672, -123.95736694335938, -118.7643051147461, -113.57124328613281, -108.378173828125, -103.18510437011719, -97.9920425415039, -92.79898071289062, -87.60591125488281, -82.412841796875, -77.21977996826172, -72.02671813964844, -66.83364868164062, -61.64058303833008, -56.44751739501953, -51.254451751708984, -46.06138610839844, -40.86832046508789, -35.675254821777344, -30.482189178466797, -25.28912353515625, -20.096057891845703, -14.902992248535156, -9.70992660522461, -4.5168609619140625, 0.6762046813964844, 5.869270324707031, 11.062335968017578, 16.255386352539062, 21.44845199584961, 26.641517639160156, 31.834583282470703, 37.02764892578125, 42.2207145690918, 47.413780212402344, 52.60684585571289, 57.79991149902344, 62.992977142333984, 68.18604278564453, 73.37910461425781, 78.57217407226562, 83.76524353027344, 88.95830535888672, 94.1513671875, 99.34443664550781, 104.53750610351562, 109.7305679321289, 114.92362976074219, 120.11669921875, 125.30976867675781, 130.50283813476562, 135.69589233398438, 140.8889617919922, 146.08203125, 151.27508544921875, 156.46815490722656, 161.66122436523438, 166.8542938232422, 172.04736328125, 177.24041748046875, 182.43348693847656]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 4.0, 9.0, 4.0, 9.0, 10.0, 13.0, 14.0, 13.0, 12.0, 32.0, 21.0, 18.0, 39.0, 23.0, 34.0, 32.0, 42.0, 37.0, 36.0, 49.0, 44.0, 35.0, 42.0, 47.0, 35.0, 42.0, 30.0, 41.0, 20.0, 25.0, 24.0, 17.0, 22.0, 24.0, 17.0, 18.0, 11.0, 13.0, 9.0, 9.0, 8.0, 5.0, 4.0, 5.0, 3.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-48.632110595703125, -47.00776672363281, -45.383426666259766, -43.75908279418945, -42.134742736816406, -40.510398864746094, -38.88605499267578, -37.261714935302734, -35.63737487792969, -34.013031005859375, -32.38869094848633, -30.764347076416016, -29.14000701904297, -27.515663146972656, -25.891321182250977, -24.266979217529297, -22.642635345458984, -21.018293380737305, -19.393951416015625, -17.769607543945312, -16.145267486572266, -14.52092456817627, -12.896581649780273, -11.272239685058594, -9.647897720336914, -8.023555755615234, -6.3992133140563965, -4.774870872497559, -3.150528907775879, -1.5261869430541992, 0.09815597534179688, 1.7224979400634766, 3.3468399047851562, 4.971181869506836, 6.595524311065674, 8.219866752624512, 9.844208717346191, 11.468550682067871, 13.092893600463867, 14.717235565185547, 16.341577529907227, 17.965919494628906, 19.590261459350586, 21.214603424072266, 22.838947296142578, 24.463287353515625, 26.087631225585938, 27.711973190307617, 29.336315155029297, 30.960657119750977, 32.584999084472656, 34.20934295654297, 35.833683013916016, 37.45802688598633, 39.082366943359375, 40.70671081542969, 42.3310546875, 43.95539855957031, 45.57973861694336, 47.20408248901367, 48.82842254638672, 50.45276641845703, 52.077110290527344, 53.70145034790039, 55.32579040527344]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 6.0, 4.0, 11.0, 9.0, 7.0, 12.0, 14.0, 24.0, 15.0, 27.0, 19.0, 28.0, 32.0, 34.0, 39.0, 45.0, 33.0, 51.0, 44.0, 46.0, 47.0, 48.0, 46.0, 44.0, 45.0, 24.0, 40.0, 26.0, 20.0, 27.0, 25.0, 17.0, 22.0, 21.0, 13.0, 9.0, 8.0, 5.0, 7.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3359375, -8.0372314453125, -7.738525390625, -7.4398193359375, -7.14111328125, -6.8424072265625, -6.543701171875, -6.2449951171875, -5.9462890625, -5.6475830078125, -5.348876953125, -5.0501708984375, -4.75146484375, -4.4527587890625, -4.154052734375, -3.8553466796875, -3.556640625, -3.2579345703125, -2.959228515625, -2.6605224609375, -2.36181640625, -2.0631103515625, -1.764404296875, -1.4656982421875, -1.1669921875, -0.8682861328125, -0.569580078125, -0.2708740234375, 0.02783203125, 0.3265380859375, 0.625244140625, 0.9239501953125, 1.22265625, 1.5213623046875, 1.820068359375, 2.1187744140625, 2.41748046875, 2.7161865234375, 3.014892578125, 3.3135986328125, 3.6123046875, 3.9110107421875, 4.209716796875, 4.5084228515625, 4.80712890625, 5.1058349609375, 5.404541015625, 5.7032470703125, 6.001953125, 6.3006591796875, 6.599365234375, 6.8980712890625, 7.19677734375, 7.4954833984375, 7.794189453125, 8.0928955078125, 8.3916015625, 8.6903076171875, 8.989013671875, 9.2877197265625, 9.58642578125, 9.8851318359375, 10.183837890625, 10.4825439453125, 10.78125]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 7.0, 13.0, 22.0, 30.0, 49.0, 73.0, 90.0, 203.0, 312.0, 466.0, 735.0, 1176.0, 1916.0, 2988.0, 4829.0, 7609.0, 12307.0, 20178.0, 33590.0, 56300.0, 95533.0, 165025.0, 229717.0, 169646.0, 98783.0, 57859.0, 34602.0, 20781.0, 12707.0, 7857.0, 4999.0, 3079.0, 1843.0, 1173.0, 764.0, 485.0, 310.0, 158.0, 104.0, 86.0, 60.0, 33.0, 23.0, 11.0, 11.0, 4.0, 6.0, 2.0, 3.0, 3.0, 1.0], "bins": [-1.1875, -1.1540756225585938, -1.1206512451171875, -1.0872268676757812, -1.053802490234375, -1.0203781127929688, -0.9869537353515625, -0.9535293579101562, -0.92010498046875, -0.8866806030273438, -0.8532562255859375, -0.8198318481445312, -0.786407470703125, -0.7529830932617188, -0.7195587158203125, -0.6861343383789062, -0.6527099609375, -0.6192855834960938, -0.5858612060546875, -0.5524368286132812, -0.519012451171875, -0.48558807373046875, -0.4521636962890625, -0.41873931884765625, -0.38531494140625, -0.35189056396484375, -0.3184661865234375, -0.28504180908203125, -0.251617431640625, -0.21819305419921875, -0.1847686767578125, -0.15134429931640625, -0.117919921875, -0.08449554443359375, -0.0510711669921875, -0.01764678955078125, 0.015777587890625, 0.04920196533203125, 0.0826263427734375, 0.11605072021484375, 0.14947509765625, 0.18289947509765625, 0.2163238525390625, 0.24974822998046875, 0.283172607421875, 0.31659698486328125, 0.3500213623046875, 0.38344573974609375, 0.4168701171875, 0.45029449462890625, 0.4837188720703125, 0.5171432495117188, 0.550567626953125, 0.5839920043945312, 0.6174163818359375, 0.6508407592773438, 0.68426513671875, 0.7176895141601562, 0.7511138916015625, 0.7845382690429688, 0.817962646484375, 0.8513870239257812, 0.8848114013671875, 0.9182357788085938, 0.95166015625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 6.0, 4.0, 4.0, 6.0, 6.0, 5.0, 12.0, 13.0, 18.0, 13.0, 10.0, 21.0, 13.0, 19.0, 17.0, 29.0, 36.0, 35.0, 36.0, 37.0, 46.0, 32.0, 33.0, 42.0, 1071.0, 37.0, 38.0, 33.0, 41.0, 31.0, 35.0, 23.0, 33.0, 29.0, 21.0, 21.0, 16.0, 17.0, 21.0, 9.0, 12.0, 15.0, 11.0, 8.0, 3.0, 4.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.609375, -4.44805908203125, -4.2867431640625, -4.12542724609375, -3.964111328125, -3.80279541015625, -3.6414794921875, -3.48016357421875, -3.31884765625, -3.15753173828125, -2.9962158203125, -2.83489990234375, -2.673583984375, -2.51226806640625, -2.3509521484375, -2.18963623046875, -2.0283203125, -1.86700439453125, -1.7056884765625, -1.54437255859375, -1.383056640625, -1.22174072265625, -1.0604248046875, -0.89910888671875, -0.73779296875, -0.57647705078125, -0.4151611328125, -0.25384521484375, -0.092529296875, 0.06878662109375, 0.2301025390625, 0.39141845703125, 0.552734375, 0.71405029296875, 0.8753662109375, 1.03668212890625, 1.197998046875, 1.35931396484375, 1.5206298828125, 1.68194580078125, 1.84326171875, 2.00457763671875, 2.1658935546875, 2.32720947265625, 2.488525390625, 2.64984130859375, 2.8111572265625, 2.97247314453125, 3.1337890625, 3.29510498046875, 3.4564208984375, 3.61773681640625, 3.779052734375, 3.94036865234375, 4.1016845703125, 4.26300048828125, 4.42431640625, 4.58563232421875, 4.7469482421875, 4.90826416015625, 5.069580078125, 5.23089599609375, 5.3922119140625, 5.55352783203125, 5.71484375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 4.0, 3.0, 12.0, 10.0, 9.0, 12.0, 19.0, 39.0, 54.0, 75.0, 109.0, 147.0, 254.0, 349.0, 457.0, 783.0, 1142.0, 1705.0, 2658.0, 3969.0, 6061.0, 9534.0, 14983.0, 24359.0, 39410.0, 64045.0, 102988.0, 165568.0, 1260509.0, 150382.0, 93265.0, 57693.0, 35612.0, 21991.0, 13801.0, 8771.0, 5566.0, 3681.0, 2283.0, 1584.0, 1114.0, 695.0, 456.0, 338.0, 229.0, 133.0, 76.0, 65.0, 55.0, 33.0, 23.0, 9.0, 7.0, 5.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.82666015625, -0.7985382080078125, -0.770416259765625, -0.7422943115234375, -0.71417236328125, -0.6860504150390625, -0.657928466796875, -0.6298065185546875, -0.6016845703125, -0.5735626220703125, -0.545440673828125, -0.5173187255859375, -0.48919677734375, -0.4610748291015625, -0.432952880859375, -0.4048309326171875, -0.376708984375, -0.3485870361328125, -0.320465087890625, -0.2923431396484375, -0.26422119140625, -0.2360992431640625, -0.207977294921875, -0.1798553466796875, -0.1517333984375, -0.1236114501953125, -0.095489501953125, -0.0673675537109375, -0.03924560546875, -0.0111236572265625, 0.016998291015625, 0.0451202392578125, 0.0732421875, 0.1013641357421875, 0.129486083984375, 0.1576080322265625, 0.18572998046875, 0.2138519287109375, 0.241973876953125, 0.2700958251953125, 0.2982177734375, 0.3263397216796875, 0.354461669921875, 0.3825836181640625, 0.41070556640625, 0.4388275146484375, 0.466949462890625, 0.4950714111328125, 0.523193359375, 0.5513153076171875, 0.579437255859375, 0.6075592041015625, 0.63568115234375, 0.6638031005859375, 0.691925048828125, 0.7200469970703125, 0.7481689453125, 0.7762908935546875, 0.804412841796875, 0.8325347900390625, 0.86065673828125, 0.8887786865234375, 0.916900634765625, 0.9450225830078125, 0.97314453125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 2.0, 1.0, 2.0, 8.0, 9.0, 9.0, 13.0, 10.0, 24.0, 23.0, 24.0, 35.0, 36.0, 53.0, 47.0, 75.0, 76.0, 71.0, 67.0, 63.0, 59.0, 45.0, 42.0, 31.0, 32.0, 21.0, 31.0, 20.0, 22.0, 12.0, 7.0, 6.0, 7.0, 2.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.003650665283203125, -0.003543555736541748, -0.003436446189880371, -0.003329336643218994, -0.003222227096557617, -0.0031151175498962402, -0.0030080080032348633, -0.0029008984565734863, -0.0027937889099121094, -0.0026866793632507324, -0.0025795698165893555, -0.0024724602699279785, -0.0023653507232666016, -0.0022582411766052246, -0.0021511316299438477, -0.0020440220832824707, -0.0019369125366210938, -0.0018298029899597168, -0.0017226934432983398, -0.0016155838966369629, -0.001508474349975586, -0.001401364803314209, -0.001294255256652832, -0.001187145709991455, -0.0010800361633300781, -0.0009729266166687012, -0.0008658170700073242, -0.0007587075233459473, -0.0006515979766845703, -0.0005444884300231934, -0.0004373788833618164, -0.00033026933670043945, -0.0002231597900390625, -0.00011605024337768555, -8.940696716308594e-06, 9.816884994506836e-05, 0.0002052783966064453, 0.00031238794326782227, 0.0004194974899291992, 0.0005266070365905762, 0.0006337165832519531, 0.0007408261299133301, 0.000847935676574707, 0.000955045223236084, 0.001062154769897461, 0.0011692643165588379, 0.0012763738632202148, 0.0013834834098815918, 0.0014905929565429688, 0.0015977025032043457, 0.0017048120498657227, 0.0018119215965270996, 0.0019190311431884766, 0.0020261406898498535, 0.0021332502365112305, 0.0022403597831726074, 0.0023474693298339844, 0.0024545788764953613, 0.0025616884231567383, 0.0026687979698181152, 0.002775907516479492, 0.002883017063140869, 0.002990126609802246, 0.003097236156463623, 0.003204345703125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 6.0, 4.0, 5.0, 9.0, 14.0, 14.0, 29.0, 32.0, 42.0, 60.0, 66.0, 81.0, 139.0, 276.0, 662.0, 9732.0, 1033627.0, 2475.0, 517.0, 251.0, 145.0, 90.0, 77.0, 50.0, 35.0, 29.0, 18.0, 13.0, 11.0, 14.0, 6.0, 3.0, 6.0, 4.0, 2.0, 0.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.07476806640625, -0.07222270965576172, -0.06967735290527344, -0.06713199615478516, -0.06458663940429688, -0.062041282653808594, -0.05949592590332031, -0.05695056915283203, -0.05440521240234375, -0.05185985565185547, -0.04931449890136719, -0.046769142150878906, -0.044223785400390625, -0.041678428649902344, -0.03913307189941406, -0.03658771514892578, -0.0340423583984375, -0.03149700164794922, -0.028951644897460938, -0.026406288146972656, -0.023860931396484375, -0.021315574645996094, -0.018770217895507812, -0.01622486114501953, -0.01367950439453125, -0.011134147644042969, -0.008588790893554688, -0.006043434143066406, -0.003498077392578125, -0.0009527206420898438, 0.0015926361083984375, 0.004137992858886719, 0.006683349609375, 0.009228706359863281, 0.011774063110351562, 0.014319419860839844, 0.016864776611328125, 0.019410133361816406, 0.021955490112304688, 0.02450084686279297, 0.02704620361328125, 0.02959156036376953, 0.03213691711425781, 0.034682273864746094, 0.037227630615234375, 0.039772987365722656, 0.04231834411621094, 0.04486370086669922, 0.0474090576171875, 0.04995441436767578, 0.05249977111816406, 0.055045127868652344, 0.057590484619140625, 0.060135841369628906, 0.06268119812011719, 0.06522655487060547, 0.06777191162109375, 0.07031726837158203, 0.07286262512207031, 0.0754079818725586, 0.07795333862304688, 0.08049869537353516, 0.08304405212402344, 0.08558940887451172, 0.088134765625]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 189.0, 778.0, 44.0], "bins": [-0.03071952611207962, -0.03022664412856102, -0.02973376400768757, -0.029240882024168968, -0.028748000040650368, -0.028255118057131767, -0.027762237936258316, -0.027269355952739716, -0.026776473969221115, -0.026283591985702515, -0.025790711864829063, -0.025297829881310463, -0.024804947897791862, -0.024312065914273262, -0.02381918579339981, -0.02332630380988121, -0.02283342182636261, -0.02234053984284401, -0.021847659721970558, -0.021354777738451958, -0.020861895754933357, -0.020369013771414757, -0.019876133650541306, -0.019383251667022705, -0.018890371546149254, -0.018397489562630653, -0.017904609441757202, -0.0174117274582386, -0.01691884547472, -0.0164259634912014, -0.01593308337032795, -0.015440201386809349, -0.014947318471968174, -0.014454437419772148, -0.013961555436253548, -0.013468674384057522, -0.012975792400538921, -0.012482911348342896, -0.011990029364824295, -0.01149714831262827, -0.011004267260432243, -0.010511386208236217, -0.010018504224717617, -0.009525623172521591, -0.00903274118900299, -0.008539860136806965, -0.008046979084610939, -0.0075540971010923386, -0.007061215117573738, -0.006568333599716425, -0.006075452081859112, -0.005582571029663086, -0.0050896890461444855, -0.00459680799394846, -0.0041039264760911465, -0.0036110449582338333, -0.00311816344037652, -0.002625281922519207, -0.002132400404661894, -0.0016395191196352243, -0.0011466376017779112, -0.000653756083920598, -0.00016087479889392853, 0.00033200671896338463, 0.0008248882368206978]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 6.0, 4.0, 9.0, 9.0, 8.0, 15.0, 16.0, 13.0, 20.0, 19.0, 28.0, 24.0, 27.0, 29.0, 34.0, 43.0, 24.0, 36.0, 41.0, 48.0, 46.0, 45.0, 40.0, 42.0, 27.0, 49.0, 25.0, 24.0, 22.0, 26.0, 32.0, 28.0, 30.0, 20.0, 19.0, 12.0, 14.0, 16.0, 5.0, 8.0, 3.0, 5.0, 3.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0016813278198242188, -0.0016288673505187035, -0.0015764068812131882, -0.0015239464119076729, -0.0014714859426021576, -0.0014190254732966423, -0.001366565003991127, -0.0013141045346856117, -0.0012616440653800964, -0.0012091835960745811, -0.0011567231267690659, -0.0011042626574635506, -0.0010518021881580353, -0.00099934171885252, -0.0009468812495470047, -0.0008944207802414894, -0.0008419603109359741, -0.0007894998416304588, -0.0007370393723249435, -0.0006845789030194283, -0.000632118433713913, -0.0005796579644083977, -0.0005271974951028824, -0.0004747370257973671, -0.0004222765564918518, -0.0003698160871863365, -0.00031735561788082123, -0.00026489514857530594, -0.00021243467926979065, -0.00015997420996427536, -0.00010751374065876007, -5.505327135324478e-05, -2.592802047729492e-06, 4.98676672577858e-05, 0.00010232813656330109, 0.00015478860586881638, 0.00020724907517433167, 0.00025970954447984695, 0.00031217001378536224, 0.00036463048309087753, 0.0004170909523963928, 0.0004695514217019081, 0.0005220118910074234, 0.0005744723603129387, 0.000626932829618454, 0.0006793932989239693, 0.0007318537682294846, 0.0007843142375349998, 0.0008367747068405151, 0.0008892351761460304, 0.0009416956454515457, 0.000994156114757061, 0.0010466165840625763, 0.0010990770533680916, 0.0011515375226736069, 0.0012039979919791222, 0.0012564584612846375, 0.0013089189305901527, 0.001361379399895668, 0.0014138398692011833, 0.0014663003385066986, 0.001518760807812214, 0.0015712212771177292, 0.0016236817464232445, 0.0016761422157287598]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 6.0, 4.0, 11.0, 9.0, 7.0, 12.0, 14.0, 24.0, 16.0, 26.0, 19.0, 28.0, 32.0, 34.0, 39.0, 45.0, 33.0, 51.0, 44.0, 46.0, 47.0, 48.0, 46.0, 44.0, 45.0, 24.0, 40.0, 26.0, 20.0, 27.0, 25.0, 17.0, 22.0, 21.0, 13.0, 9.0, 8.0, 5.0, 7.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3359375, -8.0372314453125, -7.738525390625, -7.4398193359375, -7.14111328125, -6.8424072265625, -6.543701171875, -6.2449951171875, -5.9462890625, -5.6475830078125, -5.348876953125, -5.0501708984375, -4.75146484375, -4.4527587890625, -4.154052734375, -3.8553466796875, -3.556640625, -3.2579345703125, -2.959228515625, -2.6605224609375, -2.36181640625, -2.0631103515625, -1.764404296875, -1.4656982421875, -1.1669921875, -0.8682861328125, -0.569580078125, -0.2708740234375, 0.02783203125, 0.3265380859375, 0.625244140625, 0.9239501953125, 1.22265625, 1.5213623046875, 1.820068359375, 2.1187744140625, 2.41748046875, 2.7161865234375, 3.014892578125, 3.3135986328125, 3.6123046875, 3.9110107421875, 4.209716796875, 4.5084228515625, 4.80712890625, 5.1058349609375, 5.404541015625, 5.7032470703125, 6.001953125, 6.3006591796875, 6.599365234375, 6.8980712890625, 7.19677734375, 7.4954833984375, 7.794189453125, 8.0928955078125, 8.3916015625, 8.6903076171875, 8.989013671875, 9.2877197265625, 9.58642578125, 9.8851318359375, 10.183837890625, 10.4825439453125, 10.78125]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 5.0, 5.0, 5.0, 14.0, 9.0, 9.0, 19.0, 15.0, 35.0, 32.0, 48.0, 67.0, 94.0, 142.0, 184.0, 299.0, 477.0, 1290.0, 6772.0, 59378.0, 639333.0, 304947.0, 29424.0, 3831.0, 837.0, 425.0, 231.0, 186.0, 113.0, 74.0, 60.0, 55.0, 27.0, 33.0, 22.0, 16.0, 11.0, 12.0, 6.0, 8.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.375, -15.786865234375, -15.19873046875, -14.610595703125, -14.0224609375, -13.434326171875, -12.84619140625, -12.258056640625, -11.669921875, -11.081787109375, -10.49365234375, -9.905517578125, -9.3173828125, -8.729248046875, -8.14111328125, -7.552978515625, -6.96484375, -6.376708984375, -5.78857421875, -5.200439453125, -4.6123046875, -4.024169921875, -3.43603515625, -2.847900390625, -2.259765625, -1.671630859375, -1.08349609375, -0.495361328125, 0.0927734375, 0.680908203125, 1.26904296875, 1.857177734375, 2.4453125, 3.033447265625, 3.62158203125, 4.209716796875, 4.7978515625, 5.385986328125, 5.97412109375, 6.562255859375, 7.150390625, 7.738525390625, 8.32666015625, 8.914794921875, 9.5029296875, 10.091064453125, 10.67919921875, 11.267333984375, 11.85546875, 12.443603515625, 13.03173828125, 13.619873046875, 14.2080078125, 14.796142578125, 15.38427734375, 15.972412109375, 16.560546875, 17.148681640625, 17.73681640625, 18.324951171875, 18.9130859375, 19.501220703125, 20.08935546875, 20.677490234375, 21.265625]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 7.0, 10.0, 9.0, 14.0, 7.0, 13.0, 13.0, 12.0, 23.0, 14.0, 22.0, 23.0, 34.0, 30.0, 37.0, 39.0, 50.0, 90.0, 130.0, 1542.0, 350.0, 113.0, 73.0, 53.0, 48.0, 31.0, 38.0, 32.0, 20.0, 20.0, 20.0, 13.0, 24.0, 19.0, 22.0, 11.0, 10.0, 5.0, 6.0, 5.0, 4.0, 4.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.546875, -27.679443359375, -26.81201171875, -25.944580078125, -25.0771484375, -24.209716796875, -23.34228515625, -22.474853515625, -21.607421875, -20.739990234375, -19.87255859375, -19.005126953125, -18.1376953125, -17.270263671875, -16.40283203125, -15.535400390625, -14.66796875, -13.800537109375, -12.93310546875, -12.065673828125, -11.1982421875, -10.330810546875, -9.46337890625, -8.595947265625, -7.728515625, -6.861083984375, -5.99365234375, -5.126220703125, -4.2587890625, -3.391357421875, -2.52392578125, -1.656494140625, -0.7890625, 0.078369140625, 0.94580078125, 1.813232421875, 2.6806640625, 3.548095703125, 4.41552734375, 5.282958984375, 6.150390625, 7.017822265625, 7.88525390625, 8.752685546875, 9.6201171875, 10.487548828125, 11.35498046875, 12.222412109375, 13.08984375, 13.957275390625, 14.82470703125, 15.692138671875, 16.5595703125, 17.427001953125, 18.29443359375, 19.161865234375, 20.029296875, 20.896728515625, 21.76416015625, 22.631591796875, 23.4990234375, 24.366455078125, 25.23388671875, 26.101318359375, 26.96875]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 5.0, 6.0, 5.0, 12.0, 9.0, 17.0, 18.0, 29.0, 34.0, 28.0, 32.0, 55.0, 77.0, 90.0, 129.0, 234.0, 450.0, 1396.0, 39759.0, 3090012.0, 11157.0, 1086.0, 378.0, 174.0, 137.0, 75.0, 68.0, 45.0, 34.0, 26.0, 23.0, 22.0, 23.0, 14.0, 11.0, 9.0, 7.0, 6.0, 4.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-70.8125, -68.69140625, -66.5703125, -64.44921875, -62.328125, -60.20703125, -58.0859375, -55.96484375, -53.84375, -51.72265625, -49.6015625, -47.48046875, -45.359375, -43.23828125, -41.1171875, -38.99609375, -36.875, -34.75390625, -32.6328125, -30.51171875, -28.390625, -26.26953125, -24.1484375, -22.02734375, -19.90625, -17.78515625, -15.6640625, -13.54296875, -11.421875, -9.30078125, -7.1796875, -5.05859375, -2.9375, -0.81640625, 1.3046875, 3.42578125, 5.546875, 7.66796875, 9.7890625, 11.91015625, 14.03125, 16.15234375, 18.2734375, 20.39453125, 22.515625, 24.63671875, 26.7578125, 28.87890625, 31.0, 33.12109375, 35.2421875, 37.36328125, 39.484375, 41.60546875, 43.7265625, 45.84765625, 47.96875, 50.08984375, 52.2109375, 54.33203125, 56.453125, 58.57421875, 60.6953125, 62.81640625, 64.9375]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 19.0, 120.0, 393.0, 349.0, 119.0, 15.0], "bins": [-187.45513916015625, -184.3767547607422, -181.29837036132812, -178.21998596191406, -175.1416015625, -172.063232421875, -168.98484802246094, -165.90646362304688, -162.8280792236328, -159.74969482421875, -156.6713104248047, -153.59292602539062, -150.51454162597656, -147.43617248535156, -144.3577880859375, -141.27940368652344, -138.20101928710938, -135.1226348876953, -132.04425048828125, -128.9658660888672, -125.88748931884766, -122.8091049194336, -119.73072052001953, -116.65234375, -113.5739517211914, -110.49556732177734, -107.41718292236328, -104.33880615234375, -101.26042175292969, -98.18203735351562, -95.10365295410156, -92.0252685546875, -88.9468994140625, -85.86851501464844, -82.79013061523438, -79.71175384521484, -76.63336944580078, -73.55498504638672, -70.47660064697266, -67.39822387695312, -64.31983947753906, -61.241455078125, -58.1630744934082, -55.08469009399414, -52.006309509277344, -48.92792510986328, -45.84954071044922, -42.77116012573242, -39.692771911621094, -36.61438751220703, -33.536006927490234, -30.457622528076172, -27.379241943359375, -24.300857543945312, -21.222475051879883, -18.144092559814453, -15.065711975097656, -11.987329483032227, -8.908946990966797, -5.830563545227051, -2.752181053161621, 0.3262014389038086, 3.4045848846435547, 6.482967376708984, 9.561349868774414]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 4.0, 2.0, 5.0, 4.0, 6.0, 4.0, 14.0, 11.0, 16.0, 19.0, 21.0, 17.0, 32.0, 30.0, 20.0, 32.0, 36.0, 31.0, 38.0, 40.0, 35.0, 50.0, 48.0, 55.0, 42.0, 35.0, 37.0, 45.0, 35.0, 26.0, 28.0, 24.0, 21.0, 29.0, 28.0, 16.0, 15.0, 13.0, 7.0, 4.0, 9.0, 11.0, 5.0, 5.0, 0.0, 0.0, 4.0, 0.0, 2.0], "bins": [-83.77754974365234, -81.57593536376953, -79.37432861328125, -77.17271423339844, -74.97110748291016, -72.76949310302734, -70.56788635253906, -68.36627197265625, -66.16465759277344, -63.96304702758789, -61.761436462402344, -59.5598258972168, -57.35821533203125, -55.15660095214844, -52.95499038696289, -50.753379821777344, -48.55177307128906, -46.350162506103516, -44.14855194091797, -41.94694137573242, -39.745330810546875, -37.54371643066406, -35.342105865478516, -33.14049530029297, -30.938884735107422, -28.737274169921875, -26.535663604736328, -24.33405113220215, -22.1324405670166, -19.930830001831055, -17.729217529296875, -15.527606964111328, -13.326004028320312, -11.124393463134766, -8.922781944274902, -6.721170902252197, -4.519559860229492, -2.3179492950439453, -0.11633777618408203, 2.0852737426757812, 4.286884307861328, 6.488495349884033, 8.690106391906738, 10.891717910766602, 13.093328475952148, 15.294939041137695, 17.496551513671875, 19.698162078857422, 21.89977264404297, 24.101383209228516, 26.302993774414062, 28.504606246948242, 30.70621681213379, 32.90782928466797, 35.109439849853516, 37.31105041503906, 39.51266098022461, 41.714271545410156, 43.9158821105957, 46.11749267578125, 48.31910705566406, 50.520713806152344, 52.722328186035156, 54.9239387512207, 57.12554931640625]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 4.0, 4.0, 8.0, 10.0, 12.0, 11.0, 14.0, 18.0, 14.0, 26.0, 26.0, 23.0, 33.0, 33.0, 24.0, 33.0, 42.0, 39.0, 52.0, 45.0, 46.0, 46.0, 43.0, 45.0, 48.0, 36.0, 33.0, 30.0, 31.0, 29.0, 19.0, 21.0, 23.0, 14.0, 14.0, 13.0, 8.0, 6.0, 10.0, 8.0, 5.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.34375, -8.040283203125, -7.73681640625, -7.433349609375, -7.1298828125, -6.826416015625, -6.52294921875, -6.219482421875, -5.916015625, -5.612548828125, -5.30908203125, -5.005615234375, -4.7021484375, -4.398681640625, -4.09521484375, -3.791748046875, -3.48828125, -3.184814453125, -2.88134765625, -2.577880859375, -2.2744140625, -1.970947265625, -1.66748046875, -1.364013671875, -1.060546875, -0.757080078125, -0.45361328125, -0.150146484375, 0.1533203125, 0.456787109375, 0.76025390625, 1.063720703125, 1.3671875, 1.670654296875, 1.97412109375, 2.277587890625, 2.5810546875, 2.884521484375, 3.18798828125, 3.491455078125, 3.794921875, 4.098388671875, 4.40185546875, 4.705322265625, 5.0087890625, 5.312255859375, 5.61572265625, 5.919189453125, 6.22265625, 6.526123046875, 6.82958984375, 7.133056640625, 7.4365234375, 7.739990234375, 8.04345703125, 8.346923828125, 8.650390625, 8.953857421875, 9.25732421875, 9.560791015625, 9.8642578125, 10.167724609375, 10.47119140625, 10.774658203125, 11.078125]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 5.0, 10.0, 9.0, 8.0, 10.0, 12.0, 25.0, 20.0, 10.0, 33.0, 37.0, 53.0, 53.0, 96.0, 145.0, 260.0, 602.0, 1978.0, 14070.0, 398748.0, 3253881.0, 503847.0, 16827.0, 2113.0, 637.0, 267.0, 133.0, 90.0, 53.0, 50.0, 42.0, 33.0, 27.0, 14.0, 15.0, 11.0, 13.0, 7.0, 7.0, 11.0, 7.0, 2.0, 8.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.8125, -24.967041015625, -24.12158203125, -23.276123046875, -22.4306640625, -21.585205078125, -20.73974609375, -19.894287109375, -19.048828125, -18.203369140625, -17.35791015625, -16.512451171875, -15.6669921875, -14.821533203125, -13.97607421875, -13.130615234375, -12.28515625, -11.439697265625, -10.59423828125, -9.748779296875, -8.9033203125, -8.057861328125, -7.21240234375, -6.366943359375, -5.521484375, -4.676025390625, -3.83056640625, -2.985107421875, -2.1396484375, -1.294189453125, -0.44873046875, 0.396728515625, 1.2421875, 2.087646484375, 2.93310546875, 3.778564453125, 4.6240234375, 5.469482421875, 6.31494140625, 7.160400390625, 8.005859375, 8.851318359375, 9.69677734375, 10.542236328125, 11.3876953125, 12.233154296875, 13.07861328125, 13.924072265625, 14.76953125, 15.614990234375, 16.46044921875, 17.305908203125, 18.1513671875, 18.996826171875, 19.84228515625, 20.687744140625, 21.533203125, 22.378662109375, 23.22412109375, 24.069580078125, 24.9150390625, 25.760498046875, 26.60595703125, 27.451416015625, 28.296875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 7.0, 3.0, 9.0, 11.0, 8.0, 20.0, 21.0, 21.0, 40.0, 41.0, 56.0, 82.0, 100.0, 122.0, 139.0, 203.0, 230.0, 310.0, 373.0, 380.0, 384.0, 334.0, 290.0, 221.0, 144.0, 121.0, 99.0, 74.0, 52.0, 38.0, 35.0, 18.0, 17.0, 21.0, 13.0, 9.0, 6.0, 8.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.8984375, -12.49072265625, -12.0830078125, -11.67529296875, -11.267578125, -10.85986328125, -10.4521484375, -10.04443359375, -9.63671875, -9.22900390625, -8.8212890625, -8.41357421875, -8.005859375, -7.59814453125, -7.1904296875, -6.78271484375, -6.375, -5.96728515625, -5.5595703125, -5.15185546875, -4.744140625, -4.33642578125, -3.9287109375, -3.52099609375, -3.11328125, -2.70556640625, -2.2978515625, -1.89013671875, -1.482421875, -1.07470703125, -0.6669921875, -0.25927734375, 0.1484375, 0.55615234375, 0.9638671875, 1.37158203125, 1.779296875, 2.18701171875, 2.5947265625, 3.00244140625, 3.41015625, 3.81787109375, 4.2255859375, 4.63330078125, 5.041015625, 5.44873046875, 5.8564453125, 6.26416015625, 6.671875, 7.07958984375, 7.4873046875, 7.89501953125, 8.302734375, 8.71044921875, 9.1181640625, 9.52587890625, 9.93359375, 10.34130859375, 10.7490234375, 11.15673828125, 11.564453125, 11.97216796875, 12.3798828125, 12.78759765625, 13.1953125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 11.0, 11.0, 11.0, 17.0, 24.0, 34.0, 40.0, 47.0, 69.0, 80.0, 125.0, 153.0, 217.0, 399.0, 862.0, 5425.0, 1136834.0, 3038251.0, 9328.0, 1018.0, 452.0, 244.0, 180.0, 110.0, 85.0, 64.0, 48.0, 26.0, 21.0, 28.0, 18.0, 18.0, 13.0, 10.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-66.375, -64.2392578125, -62.103515625, -59.9677734375, -57.83203125, -55.6962890625, -53.560546875, -51.4248046875, -49.2890625, -47.1533203125, -45.017578125, -42.8818359375, -40.74609375, -38.6103515625, -36.474609375, -34.3388671875, -32.203125, -30.0673828125, -27.931640625, -25.7958984375, -23.66015625, -21.5244140625, -19.388671875, -17.2529296875, -15.1171875, -12.9814453125, -10.845703125, -8.7099609375, -6.57421875, -4.4384765625, -2.302734375, -0.1669921875, 1.96875, 4.1044921875, 6.240234375, 8.3759765625, 10.51171875, 12.6474609375, 14.783203125, 16.9189453125, 19.0546875, 21.1904296875, 23.326171875, 25.4619140625, 27.59765625, 29.7333984375, 31.869140625, 34.0048828125, 36.140625, 38.2763671875, 40.412109375, 42.5478515625, 44.68359375, 46.8193359375, 48.955078125, 51.0908203125, 53.2265625, 55.3623046875, 57.498046875, 59.6337890625, 61.76953125, 63.9052734375, 66.041015625, 68.1767578125, 70.3125]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 74.0, 208.0, 416.0, 241.0, 57.0, 11.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-247.44393920898438, -241.774169921875, -236.10438537597656, -230.43460083007812, -224.76483154296875, -219.09506225585938, -213.42527770996094, -207.7554931640625, -202.08572387695312, -196.41595458984375, -190.7461700439453, -185.07638549804688, -179.4066162109375, -173.73684692382812, -168.0670623779297, -162.39727783203125, -156.72750854492188, -151.0577392578125, -145.38795471191406, -139.71817016601562, -134.04840087890625, -128.37863159179688, -122.70884704589844, -117.03907012939453, -111.36929321289062, -105.69951629638672, -100.02973937988281, -94.3599624633789, -88.690185546875, -83.0204086303711, -77.35063171386719, -71.68085479736328, -66.01107788085938, -60.34130096435547, -54.67152404785156, -49.001747131347656, -43.33197021484375, -37.662193298339844, -31.992416381835938, -26.32263946533203, -20.652862548828125, -14.983085632324219, -9.313308715820312, -3.6435317993164062, 2.0262451171875, 7.696022033691406, 13.365798950195312, 19.03557586669922, 24.705352783203125, 30.37512969970703, 36.04490661621094, 41.714683532714844, 47.38446044921875, 53.054237365722656, 58.72401428222656, 64.39379119873047, 70.06356811523438, 75.73334503173828, 81.40312194824219, 87.0728988647461, 92.74267578125, 98.4124526977539, 104.08222961425781, 109.75200653076172, 115.42178344726562]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 4.0, 9.0, 6.0, 5.0, 7.0, 11.0, 5.0, 7.0, 10.0, 20.0, 26.0, 24.0, 21.0, 29.0, 26.0, 33.0, 46.0, 35.0, 33.0, 29.0, 31.0, 48.0, 41.0, 50.0, 36.0, 37.0, 41.0, 35.0, 34.0, 28.0, 39.0, 27.0, 23.0, 24.0, 16.0, 17.0, 13.0, 19.0, 14.0, 11.0, 8.0, 7.0, 5.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-50.42236328125, -48.7014045715332, -46.980445861816406, -45.259490966796875, -43.53853225708008, -41.81757354736328, -40.09661865234375, -38.37565994262695, -36.654701232910156, -34.93374252319336, -33.21278381347656, -31.49182891845703, -29.770870208740234, -28.049911499023438, -26.328954696655273, -24.60799789428711, -22.887039184570312, -21.166080474853516, -19.44512367248535, -17.724166870117188, -16.00320816040039, -14.28225040435791, -12.56129264831543, -10.84033489227295, -9.119377136230469, -7.398419380187988, -5.677461624145508, -3.9565038681030273, -2.235546112060547, -0.5145883560180664, 1.206369400024414, 2.9273271560668945, 4.648284912109375, 6.3692426681518555, 8.090200424194336, 9.811158180236816, 11.532115936279297, 13.253073692321777, 14.974031448364258, 16.694988250732422, 18.41594696044922, 20.136905670166016, 21.85786247253418, 23.578819274902344, 25.29977798461914, 27.020736694335938, 28.7416934967041, 30.462650299072266, 32.18360900878906, 33.90456771850586, 35.625526428222656, 37.34648132324219, 39.067440032958984, 40.78839874267578, 42.50935363769531, 44.23031234741211, 45.951271057128906, 47.6722297668457, 49.3931884765625, 51.11414337158203, 52.83510208129883, 54.556060791015625, 56.277015686035156, 57.99797439575195, 59.71893310546875]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 4.0, 6.0, 6.0, 10.0, 6.0, 16.0, 16.0, 21.0, 16.0, 20.0, 26.0, 20.0, 25.0, 35.0, 38.0, 33.0, 43.0, 43.0, 35.0, 45.0, 44.0, 31.0, 41.0, 40.0, 37.0, 33.0, 38.0, 19.0, 42.0, 29.0, 32.0, 31.0, 19.0, 10.0, 16.0, 18.0, 11.0, 16.0, 12.0, 9.0, 5.0, 4.0, 6.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.65625, -8.358642578125, -8.06103515625, -7.763427734375, -7.4658203125, -7.168212890625, -6.87060546875, -6.572998046875, -6.275390625, -5.977783203125, -5.68017578125, -5.382568359375, -5.0849609375, -4.787353515625, -4.48974609375, -4.192138671875, -3.89453125, -3.596923828125, -3.29931640625, -3.001708984375, -2.7041015625, -2.406494140625, -2.10888671875, -1.811279296875, -1.513671875, -1.216064453125, -0.91845703125, -0.620849609375, -0.3232421875, -0.025634765625, 0.27197265625, 0.569580078125, 0.8671875, 1.164794921875, 1.46240234375, 1.760009765625, 2.0576171875, 2.355224609375, 2.65283203125, 2.950439453125, 3.248046875, 3.545654296875, 3.84326171875, 4.140869140625, 4.4384765625, 4.736083984375, 5.03369140625, 5.331298828125, 5.62890625, 5.926513671875, 6.22412109375, 6.521728515625, 6.8193359375, 7.116943359375, 7.41455078125, 7.712158203125, 8.009765625, 8.307373046875, 8.60498046875, 8.902587890625, 9.2001953125, 9.497802734375, 9.79541015625, 10.093017578125, 10.390625]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 5.0, 5.0, 10.0, 9.0, 17.0, 20.0, 32.0, 57.0, 76.0, 109.0, 154.0, 243.0, 382.0, 599.0, 962.0, 1606.0, 2384.0, 3835.0, 6256.0, 10492.0, 17159.0, 28506.0, 45417.0, 73002.0, 118741.0, 195694.0, 207894.0, 128317.0, 78955.0, 48977.0, 30704.0, 18572.0, 11231.0, 6789.0, 4118.0, 2600.0, 1603.0, 1055.0, 690.0, 467.0, 293.0, 182.0, 124.0, 88.0, 48.0, 33.0, 21.0, 10.0, 11.0, 4.0, 5.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0322265625, -0.9979095458984375, -0.963592529296875, -0.9292755126953125, -0.89495849609375, -0.8606414794921875, -0.826324462890625, -0.7920074462890625, -0.7576904296875, -0.7233734130859375, -0.689056396484375, -0.6547393798828125, -0.62042236328125, -0.5861053466796875, -0.551788330078125, -0.5174713134765625, -0.483154296875, -0.4488372802734375, -0.414520263671875, -0.3802032470703125, -0.34588623046875, -0.3115692138671875, -0.277252197265625, -0.2429351806640625, -0.2086181640625, -0.1743011474609375, -0.139984130859375, -0.1056671142578125, -0.07135009765625, -0.0370330810546875, -0.002716064453125, 0.0316009521484375, 0.06591796875, 0.1002349853515625, 0.134552001953125, 0.1688690185546875, 0.20318603515625, 0.2375030517578125, 0.271820068359375, 0.3061370849609375, 0.3404541015625, 0.3747711181640625, 0.409088134765625, 0.4434051513671875, 0.47772216796875, 0.5120391845703125, 0.546356201171875, 0.5806732177734375, 0.614990234375, 0.6493072509765625, 0.683624267578125, 0.7179412841796875, 0.75225830078125, 0.7865753173828125, 0.820892333984375, 0.8552093505859375, 0.8895263671875, 0.9238433837890625, 0.958160400390625, 0.9924774169921875, 1.02679443359375, 1.0611114501953125, 1.095428466796875, 1.1297454833984375, 1.1640625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 5.0, 9.0, 8.0, 13.0, 13.0, 9.0, 17.0, 14.0, 21.0, 17.0, 22.0, 42.0, 27.0, 23.0, 35.0, 47.0, 36.0, 40.0, 38.0, 40.0, 28.0, 1068.0, 35.0, 33.0, 34.0, 35.0, 32.0, 44.0, 31.0, 41.0, 22.0, 22.0, 17.0, 16.0, 14.0, 12.0, 9.0, 13.0, 14.0, 14.0, 8.0, 6.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-6.66015625, -6.4708251953125, -6.281494140625, -6.0921630859375, -5.90283203125, -5.7135009765625, -5.524169921875, -5.3348388671875, -5.1455078125, -4.9561767578125, -4.766845703125, -4.5775146484375, -4.38818359375, -4.1988525390625, -4.009521484375, -3.8201904296875, -3.630859375, -3.4415283203125, -3.252197265625, -3.0628662109375, -2.87353515625, -2.6842041015625, -2.494873046875, -2.3055419921875, -2.1162109375, -1.9268798828125, -1.737548828125, -1.5482177734375, -1.35888671875, -1.1695556640625, -0.980224609375, -0.7908935546875, -0.6015625, -0.4122314453125, -0.222900390625, -0.0335693359375, 0.15576171875, 0.3450927734375, 0.534423828125, 0.7237548828125, 0.9130859375, 1.1024169921875, 1.291748046875, 1.4810791015625, 1.67041015625, 1.8597412109375, 2.049072265625, 2.2384033203125, 2.427734375, 2.6170654296875, 2.806396484375, 2.9957275390625, 3.18505859375, 3.3743896484375, 3.563720703125, 3.7530517578125, 3.9423828125, 4.1317138671875, 4.321044921875, 4.5103759765625, 4.69970703125, 4.8890380859375, 5.078369140625, 5.2677001953125, 5.45703125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 8.0, 13.0, 20.0, 20.0, 45.0, 55.0, 105.0, 163.0, 234.0, 341.0, 548.0, 773.0, 1180.0, 1763.0, 2716.0, 3884.0, 6033.0, 9526.0, 14820.0, 23221.0, 36559.0, 58311.0, 93601.0, 148182.0, 1253723.0, 162021.0, 102453.0, 64652.0, 40577.0, 25373.0, 16246.0, 10412.0, 6635.0, 4489.0, 2812.0, 1876.0, 1186.0, 883.0, 546.0, 367.0, 263.0, 167.0, 110.0, 66.0, 71.0, 39.0, 19.0, 10.0, 8.0, 6.0, 1.0, 4.0, 2.0, 2.0], "bins": [-1.064453125, -1.03369140625, -1.0029296875, -0.97216796875, -0.94140625, -0.91064453125, -0.8798828125, -0.84912109375, -0.818359375, -0.78759765625, -0.7568359375, -0.72607421875, -0.6953125, -0.66455078125, -0.6337890625, -0.60302734375, -0.572265625, -0.54150390625, -0.5107421875, -0.47998046875, -0.44921875, -0.41845703125, -0.3876953125, -0.35693359375, -0.326171875, -0.29541015625, -0.2646484375, -0.23388671875, -0.203125, -0.17236328125, -0.1416015625, -0.11083984375, -0.080078125, -0.04931640625, -0.0185546875, 0.01220703125, 0.04296875, 0.07373046875, 0.1044921875, 0.13525390625, 0.166015625, 0.19677734375, 0.2275390625, 0.25830078125, 0.2890625, 0.31982421875, 0.3505859375, 0.38134765625, 0.412109375, 0.44287109375, 0.4736328125, 0.50439453125, 0.53515625, 0.56591796875, 0.5966796875, 0.62744140625, 0.658203125, 0.68896484375, 0.7197265625, 0.75048828125, 0.78125, 0.81201171875, 0.8427734375, 0.87353515625, 0.904296875]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 1.0, 4.0, 6.0, 4.0, 6.0, 5.0, 4.0, 8.0, 12.0, 13.0, 12.0, 18.0, 28.0, 27.0, 30.0, 27.0, 45.0, 35.0, 37.0, 54.0, 54.0, 64.0, 59.0, 59.0, 50.0, 55.0, 43.0, 33.0, 24.0, 45.0, 20.0, 19.0, 18.0, 15.0, 10.0, 11.0, 8.0, 6.0, 4.0, 6.0, 4.0, 2.0, 4.0, 4.0, 3.0, 2.0, 1.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0030670166015625, -0.0029675960540771484, -0.002868175506591797, -0.0027687549591064453, -0.0026693344116210938, -0.002569913864135742, -0.0024704933166503906, -0.002371072769165039, -0.0022716522216796875, -0.002172231674194336, -0.0020728111267089844, -0.001973390579223633, -0.0018739700317382812, -0.0017745494842529297, -0.0016751289367675781, -0.0015757083892822266, -0.001476287841796875, -0.0013768672943115234, -0.0012774467468261719, -0.0011780261993408203, -0.0010786056518554688, -0.0009791851043701172, -0.0008797645568847656, -0.0007803440093994141, -0.0006809234619140625, -0.0005815029144287109, -0.0004820823669433594, -0.0003826618194580078, -0.00028324127197265625, -0.0001838207244873047, -8.440017700195312e-05, 1.5020370483398438e-05, 0.00011444091796875, 0.00021386146545410156, 0.0003132820129394531, 0.0004127025604248047, 0.0005121231079101562, 0.0006115436553955078, 0.0007109642028808594, 0.0008103847503662109, 0.0009098052978515625, 0.001009225845336914, 0.0011086463928222656, 0.0012080669403076172, 0.0013074874877929688, 0.0014069080352783203, 0.0015063285827636719, 0.0016057491302490234, 0.001705169677734375, 0.0018045902252197266, 0.0019040107727050781, 0.0020034313201904297, 0.0021028518676757812, 0.002202272415161133, 0.0023016929626464844, 0.002401113510131836, 0.0025005340576171875, 0.002599954605102539, 0.0026993751525878906, 0.002798795700073242, 0.0028982162475585938, 0.0029976367950439453, 0.003097057342529297, 0.0031964778900146484, 0.0032958984375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 5.0, 8.0, 6.0, 5.0, 3.0, 10.0, 8.0, 9.0, 25.0, 26.0, 22.0, 47.0, 57.0, 93.0, 105.0, 190.0, 335.0, 690.0, 6993.0, 1035878.0, 2641.0, 589.0, 240.0, 173.0, 110.0, 78.0, 50.0, 35.0, 26.0, 24.0, 26.0, 8.0, 6.0, 11.0, 7.0, 6.0, 8.0, 4.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09405517578125, -0.09123897552490234, -0.08842277526855469, -0.08560657501220703, -0.08279037475585938, -0.07997417449951172, -0.07715797424316406, -0.0743417739868164, -0.07152557373046875, -0.0687093734741211, -0.06589317321777344, -0.06307697296142578, -0.060260772705078125, -0.05744457244873047, -0.05462837219238281, -0.051812171936035156, -0.0489959716796875, -0.046179771423339844, -0.04336357116699219, -0.04054737091064453, -0.037731170654296875, -0.03491497039794922, -0.03209877014160156, -0.029282569885253906, -0.02646636962890625, -0.023650169372558594, -0.020833969116210938, -0.01801776885986328, -0.015201568603515625, -0.012385368347167969, -0.009569168090820312, -0.006752967834472656, -0.003936767578125, -0.0011205673217773438, 0.0016956329345703125, 0.004511833190917969, 0.007328033447265625, 0.010144233703613281, 0.012960433959960938, 0.015776634216308594, 0.01859283447265625, 0.021409034729003906, 0.024225234985351562, 0.02704143524169922, 0.029857635498046875, 0.03267383575439453, 0.03549003601074219, 0.038306236267089844, 0.0411224365234375, 0.043938636779785156, 0.04675483703613281, 0.04957103729248047, 0.052387237548828125, 0.05520343780517578, 0.05801963806152344, 0.060835838317871094, 0.06365203857421875, 0.0664682388305664, 0.06928443908691406, 0.07210063934326172, 0.07491683959960938, 0.07773303985595703, 0.08054924011230469, 0.08336544036865234, 0.086181640625]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 14.0, 508.0, 478.0, 14.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015471485443413258, -0.014972181990742683, -0.014472877606749535, -0.013973573222756386, -0.013474269770085812, -0.012974966317415237, -0.012475661933422089, -0.01197635754942894, -0.011477054096758366, -0.010977750644087791, -0.010478446260094643, -0.009979141876101494, -0.00947983842343092, -0.008980534970760345, -0.008481230586767197, -0.007981926202774048, -0.007482622750103474, -0.006983318831771612, -0.006484014913439751, -0.005984710995107889, -0.005485407076776028, -0.004986103158444166, -0.004486799240112305, -0.003987495321780443, -0.0034881914034485817, -0.00298888748511672, -0.0024895835667848587, -0.001990279648452997, -0.0014909757301211357, -0.0009916718117892742, -0.0004923678934574127, 6.936024874448776e-06, 0.0005062390118837357, 0.0010055429302155972, 0.0015048468485474586, 0.00200415076687932, 0.0025034546852111816, 0.003002758603543043, 0.0035020625218749046, 0.004001366440206766, 0.004500670358538628, 0.004999974276870489, 0.005499278195202351, 0.005998582113534212, 0.006497886031866074, 0.006997189950197935, 0.007496493868529797, 0.00799579732120037, 0.00849510170519352, 0.008994406089186668, 0.009493709541857243, 0.009993012994527817, 0.010492317378520966, 0.010991621762514114, 0.011490925215184689, 0.011990228667855263, 0.012489533051848412, 0.01298883743584156, 0.013488140888512135, 0.013987444341182709, 0.014486748725175858, 0.014986053109169006, 0.01548535656183958, 0.015984660014510155, 0.016483964398503304]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 4.0, 7.0, 2.0, 4.0, 10.0, 11.0, 7.0, 15.0, 17.0, 19.0, 8.0, 26.0, 25.0, 33.0, 38.0, 41.0, 34.0, 33.0, 39.0, 44.0, 49.0, 38.0, 46.0, 43.0, 44.0, 46.0, 43.0, 27.0, 31.0, 33.0, 23.0, 23.0, 16.0, 15.0, 14.0, 21.0, 10.0, 12.0, 11.0, 7.0, 4.0, 9.0, 6.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0018306970596313477, -0.0017737457528710365, -0.0017167944461107254, -0.0016598431393504143, -0.0016028918325901031, -0.001545940525829792, -0.001488989219069481, -0.0014320379123091698, -0.0013750866055488586, -0.0013181352987885475, -0.0012611839920282364, -0.0012042326852679253, -0.0011472813785076141, -0.001090330071747303, -0.0010333787649869919, -0.0009764274582266808, -0.0009194761514663696, -0.0008625248447060585, -0.0008055735379457474, -0.0007486222311854362, -0.0006916709244251251, -0.000634719617664814, -0.0005777683109045029, -0.0005208170041441917, -0.0004638656973838806, -0.0004069143906235695, -0.00034996308386325836, -0.00029301177710294724, -0.0002360604703426361, -0.00017910916358232498, -0.00012215785682201385, -6.520655006170273e-05, -8.255243301391602e-06, 4.8696063458919525e-05, 0.00010564737021923065, 0.00016259867697954178, 0.0002195499837398529, 0.00027650129050016403, 0.00033345259726047516, 0.0003904039040207863, 0.0004473552107810974, 0.0005043065175414085, 0.0005612578243017197, 0.0006182091310620308, 0.0006751604378223419, 0.000732111744582653, 0.0007890630513429642, 0.0008460143581032753, 0.0009029656648635864, 0.0009599169716238976, 0.0010168682783842087, 0.0010738195851445198, 0.001130770891904831, 0.001187722198665142, 0.0012446735054254532, 0.0013016248121857643, 0.0013585761189460754, 0.0014155274257063866, 0.0014724787324666977, 0.0015294300392270088, 0.00158638134598732, 0.001643332652747631, 0.0017002839595079422, 0.0017572352662682533, 0.0018141865730285645]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 4.0, 6.0, 7.0, 10.0, 5.0, 16.0, 17.0, 20.0, 17.0, 19.0, 26.0, 21.0, 24.0, 36.0, 37.0, 34.0, 43.0, 42.0, 36.0, 46.0, 42.0, 32.0, 41.0, 41.0, 36.0, 32.0, 38.0, 20.0, 41.0, 29.0, 33.0, 30.0, 19.0, 11.0, 15.0, 18.0, 12.0, 15.0, 12.0, 9.0, 5.0, 4.0, 6.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6484375, -8.3509521484375, -8.053466796875, -7.7559814453125, -7.45849609375, -7.1610107421875, -6.863525390625, -6.5660400390625, -6.2685546875, -5.9710693359375, -5.673583984375, -5.3760986328125, -5.07861328125, -4.7811279296875, -4.483642578125, -4.1861572265625, -3.888671875, -3.5911865234375, -3.293701171875, -2.9962158203125, -2.69873046875, -2.4012451171875, -2.103759765625, -1.8062744140625, -1.5087890625, -1.2113037109375, -0.913818359375, -0.6163330078125, -0.31884765625, -0.0213623046875, 0.276123046875, 0.5736083984375, 0.87109375, 1.1685791015625, 1.466064453125, 1.7635498046875, 2.06103515625, 2.3585205078125, 2.656005859375, 2.9534912109375, 3.2509765625, 3.5484619140625, 3.845947265625, 4.1434326171875, 4.44091796875, 4.7384033203125, 5.035888671875, 5.3333740234375, 5.630859375, 5.9283447265625, 6.225830078125, 6.5233154296875, 6.82080078125, 7.1182861328125, 7.415771484375, 7.7132568359375, 8.0107421875, 8.3082275390625, 8.605712890625, 8.9031982421875, 9.20068359375, 9.4981689453125, 9.795654296875, 10.0931396484375, 10.390625]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 6.0, 1.0, 6.0, 11.0, 16.0, 15.0, 17.0, 27.0, 36.0, 51.0, 57.0, 75.0, 110.0, 135.0, 218.0, 298.0, 387.0, 478.0, 761.0, 1508.0, 5033.0, 26105.0, 354448.0, 614306.0, 33747.0, 6202.0, 1682.0, 745.0, 514.0, 374.0, 311.0, 235.0, 186.0, 115.0, 72.0, 48.0, 58.0, 48.0, 25.0, 30.0, 22.0, 14.0, 9.0, 6.0, 7.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.84375, -21.09228515625, -20.3408203125, -19.58935546875, -18.837890625, -18.08642578125, -17.3349609375, -16.58349609375, -15.83203125, -15.08056640625, -14.3291015625, -13.57763671875, -12.826171875, -12.07470703125, -11.3232421875, -10.57177734375, -9.8203125, -9.06884765625, -8.3173828125, -7.56591796875, -6.814453125, -6.06298828125, -5.3115234375, -4.56005859375, -3.80859375, -3.05712890625, -2.3056640625, -1.55419921875, -0.802734375, -0.05126953125, 0.7001953125, 1.45166015625, 2.203125, 2.95458984375, 3.7060546875, 4.45751953125, 5.208984375, 5.96044921875, 6.7119140625, 7.46337890625, 8.21484375, 8.96630859375, 9.7177734375, 10.46923828125, 11.220703125, 11.97216796875, 12.7236328125, 13.47509765625, 14.2265625, 14.97802734375, 15.7294921875, 16.48095703125, 17.232421875, 17.98388671875, 18.7353515625, 19.48681640625, 20.23828125, 20.98974609375, 21.7412109375, 22.49267578125, 23.244140625, 23.99560546875, 24.7470703125, 25.49853515625, 26.25]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 6.0, 6.0, 6.0, 7.0, 15.0, 10.0, 15.0, 19.0, 24.0, 21.0, 31.0, 29.0, 22.0, 22.0, 32.0, 46.0, 45.0, 46.0, 67.0, 102.0, 1597.0, 330.0, 88.0, 53.0, 56.0, 35.0, 50.0, 41.0, 34.0, 33.0, 31.0, 22.0, 24.0, 16.0, 21.0, 13.0, 6.0, 12.0, 5.0, 7.0, 1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 4.0], "bins": [-33.46875, -32.561767578125, -31.65478515625, -30.747802734375, -29.8408203125, -28.933837890625, -28.02685546875, -27.119873046875, -26.212890625, -25.305908203125, -24.39892578125, -23.491943359375, -22.5849609375, -21.677978515625, -20.77099609375, -19.864013671875, -18.95703125, -18.050048828125, -17.14306640625, -16.236083984375, -15.3291015625, -14.422119140625, -13.51513671875, -12.608154296875, -11.701171875, -10.794189453125, -9.88720703125, -8.980224609375, -8.0732421875, -7.166259765625, -6.25927734375, -5.352294921875, -4.4453125, -3.538330078125, -2.63134765625, -1.724365234375, -0.8173828125, 0.089599609375, 0.99658203125, 1.903564453125, 2.810546875, 3.717529296875, 4.62451171875, 5.531494140625, 6.4384765625, 7.345458984375, 8.25244140625, 9.159423828125, 10.06640625, 10.973388671875, 11.88037109375, 12.787353515625, 13.6943359375, 14.601318359375, 15.50830078125, 16.415283203125, 17.322265625, 18.229248046875, 19.13623046875, 20.043212890625, 20.9501953125, 21.857177734375, 22.76416015625, 23.671142578125, 24.578125]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 1.0, 6.0, 3.0, 4.0, 12.0, 11.0, 9.0, 14.0, 29.0, 31.0, 33.0, 42.0, 61.0, 85.0, 107.0, 123.0, 243.0, 559.0, 3331.0, 2989356.0, 148855.0, 1619.0, 443.0, 226.0, 117.0, 84.0, 49.0, 43.0, 40.0, 35.0, 30.0, 23.0, 21.0, 18.0, 14.0, 11.0, 4.0, 8.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.5625, -90.6259765625, -87.689453125, -84.7529296875, -81.81640625, -78.8798828125, -75.943359375, -73.0068359375, -70.0703125, -67.1337890625, -64.197265625, -61.2607421875, -58.32421875, -55.3876953125, -52.451171875, -49.5146484375, -46.578125, -43.6416015625, -40.705078125, -37.7685546875, -34.83203125, -31.8955078125, -28.958984375, -26.0224609375, -23.0859375, -20.1494140625, -17.212890625, -14.2763671875, -11.33984375, -8.4033203125, -5.466796875, -2.5302734375, 0.40625, 3.3427734375, 6.279296875, 9.2158203125, 12.15234375, 15.0888671875, 18.025390625, 20.9619140625, 23.8984375, 26.8349609375, 29.771484375, 32.7080078125, 35.64453125, 38.5810546875, 41.517578125, 44.4541015625, 47.390625, 50.3271484375, 53.263671875, 56.2001953125, 59.13671875, 62.0732421875, 65.009765625, 67.9462890625, 70.8828125, 73.8193359375, 76.755859375, 79.6923828125, 82.62890625, 85.5654296875, 88.501953125, 91.4384765625, 94.375]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 60.0, 724.0, 228.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-128.5131072998047, -122.61096954345703, -116.70883178710938, -110.80670166015625, -104.9045639038086, -99.00242614746094, -93.10029602050781, -87.19815826416016, -81.2960205078125, -75.39388275146484, -69.49174499511719, -63.58961486816406, -57.687477111816406, -51.78533935546875, -45.88320541381836, -39.98107147216797, -34.07893371582031, -28.17679786682129, -22.274662017822266, -16.372526168823242, -10.470390319824219, -4.568254470825195, 1.3338813781738281, 7.236015319824219, 13.138153076171875, 19.0402889251709, 24.942424774169922, 30.844560623168945, 36.74669647216797, 42.648834228515625, 48.550968170166016, 54.453102111816406, 60.355255126953125, 66.25739288330078, 72.15953063964844, 78.06166076660156, 83.96379852294922, 89.86593627929688, 95.76806640625, 101.67020416259766, 107.57234191894531, 113.47447967529297, 119.37661743164062, 125.27874755859375, 131.18087768554688, 137.08302307128906, 142.9851531982422, 148.88729858398438, 154.7894287109375, 160.69155883789062, 166.5937042236328, 172.49583435058594, 178.39797973632812, 184.30010986328125, 190.20223999023438, 196.1043701171875, 202.0065155029297, 207.9086456298828, 213.810791015625, 219.71292114257812, 225.61505126953125, 231.51719665527344, 237.41932678222656, 243.32147216796875, 249.22360229492188]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 10.0, 5.0, 8.0, 6.0, 12.0, 10.0, 9.0, 10.0, 19.0, 24.0, 14.0, 29.0, 33.0, 33.0, 39.0, 38.0, 37.0, 41.0, 45.0, 53.0, 52.0, 44.0, 53.0, 38.0, 44.0, 30.0, 36.0, 34.0, 39.0, 25.0, 19.0, 26.0, 21.0, 15.0, 18.0, 13.0, 7.0, 7.0, 7.0, 4.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.84489440917969, -78.44945526123047, -76.05401611328125, -73.6585693359375, -71.26313018798828, -68.86769104003906, -66.47225189208984, -64.07681274414062, -61.68136978149414, -59.28593063354492, -56.89048767089844, -54.49504852294922, -52.099609375, -49.704166412353516, -47.3087272644043, -44.91328430175781, -42.517845153808594, -40.122406005859375, -37.72696304321289, -35.33152389526367, -32.93608093261719, -30.54064178466797, -28.14520263671875, -25.7497615814209, -23.354320526123047, -20.958879470825195, -18.563438415527344, -16.167999267578125, -13.772558212280273, -11.377117156982422, -8.981677055358887, -6.586236953735352, -4.1907958984375, -1.7953553199768066, 0.6000852584838867, 2.99552583694458, 5.390966415405273, 7.786407470703125, 10.18184757232666, 12.577287673950195, 14.972728729248047, 17.3681697845459, 19.76361083984375, 22.15904998779297, 24.55449104309082, 26.949932098388672, 29.34537124633789, 31.740812301635742, 34.136253356933594, 36.53169250488281, 38.9271354675293, 41.322574615478516, 43.718017578125, 46.11345672607422, 48.50889587402344, 50.904335021972656, 53.29977798461914, 55.69521713256836, 58.090660095214844, 60.48609924316406, 62.88153839111328, 65.2769775390625, 67.67242431640625, 70.06786346435547, 72.46330261230469]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 5.0, 7.0, 6.0, 12.0, 6.0, 15.0, 9.0, 18.0, 21.0, 22.0, 23.0, 22.0, 28.0, 38.0, 32.0, 28.0, 43.0, 35.0, 30.0, 38.0, 23.0, 43.0, 48.0, 39.0, 37.0, 26.0, 39.0, 37.0, 21.0, 31.0, 36.0, 22.0, 18.0, 16.0, 17.0, 18.0, 18.0, 10.0, 15.0, 9.0, 11.0, 7.0, 9.0, 8.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.8125, -8.5247802734375, -8.237060546875, -7.9493408203125, -7.66162109375, -7.3739013671875, -7.086181640625, -6.7984619140625, -6.5107421875, -6.2230224609375, -5.935302734375, -5.6475830078125, -5.35986328125, -5.0721435546875, -4.784423828125, -4.4967041015625, -4.208984375, -3.9212646484375, -3.633544921875, -3.3458251953125, -3.05810546875, -2.7703857421875, -2.482666015625, -2.1949462890625, -1.9072265625, -1.6195068359375, -1.331787109375, -1.0440673828125, -0.75634765625, -0.4686279296875, -0.180908203125, 0.1068115234375, 0.39453125, 0.6822509765625, 0.969970703125, 1.2576904296875, 1.54541015625, 1.8331298828125, 2.120849609375, 2.4085693359375, 2.6962890625, 2.9840087890625, 3.271728515625, 3.5594482421875, 3.84716796875, 4.1348876953125, 4.422607421875, 4.7103271484375, 4.998046875, 5.2857666015625, 5.573486328125, 5.8612060546875, 6.14892578125, 6.4366455078125, 6.724365234375, 7.0120849609375, 7.2998046875, 7.5875244140625, 7.875244140625, 8.1629638671875, 8.45068359375, 8.7384033203125, 9.026123046875, 9.3138427734375, 9.6015625]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 6.0, 6.0, 5.0, 6.0, 6.0, 7.0, 16.0, 15.0, 19.0, 24.0, 25.0, 15.0, 43.0, 46.0, 60.0, 88.0, 101.0, 113.0, 139.0, 208.0, 273.0, 419.0, 793.0, 1722.0, 5207.0, 23070.0, 195483.0, 1587988.0, 2025038.0, 308131.0, 33084.0, 7174.0, 2206.0, 977.0, 455.0, 301.0, 220.0, 162.0, 124.0, 105.0, 88.0, 66.0, 46.0, 49.0, 40.0, 29.0, 22.0, 17.0, 14.0, 7.0, 6.0, 2.0, 9.0, 7.0, 8.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0], "bins": [-17.765625, -17.1943359375, -16.623046875, -16.0517578125, -15.48046875, -14.9091796875, -14.337890625, -13.7666015625, -13.1953125, -12.6240234375, -12.052734375, -11.4814453125, -10.91015625, -10.3388671875, -9.767578125, -9.1962890625, -8.625, -8.0537109375, -7.482421875, -6.9111328125, -6.33984375, -5.7685546875, -5.197265625, -4.6259765625, -4.0546875, -3.4833984375, -2.912109375, -2.3408203125, -1.76953125, -1.1982421875, -0.626953125, -0.0556640625, 0.515625, 1.0869140625, 1.658203125, 2.2294921875, 2.80078125, 3.3720703125, 3.943359375, 4.5146484375, 5.0859375, 5.6572265625, 6.228515625, 6.7998046875, 7.37109375, 7.9423828125, 8.513671875, 9.0849609375, 9.65625, 10.2275390625, 10.798828125, 11.3701171875, 11.94140625, 12.5126953125, 13.083984375, 13.6552734375, 14.2265625, 14.7978515625, 15.369140625, 15.9404296875, 16.51171875, 17.0830078125, 17.654296875, 18.2255859375, 18.796875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 8.0, 2.0, 15.0, 12.0, 17.0, 15.0, 32.0, 35.0, 65.0, 94.0, 147.0, 206.0, 286.0, 415.0, 512.0, 541.0, 403.0, 322.0, 275.0, 182.0, 140.0, 87.0, 60.0, 52.0, 35.0, 36.0, 17.0, 12.0, 10.0, 8.0, 14.0, 5.0, 2.0, 5.0, 2.0, 0.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.625, -13.084716796875, -12.54443359375, -12.004150390625, -11.4638671875, -10.923583984375, -10.38330078125, -9.843017578125, -9.302734375, -8.762451171875, -8.22216796875, -7.681884765625, -7.1416015625, -6.601318359375, -6.06103515625, -5.520751953125, -4.98046875, -4.440185546875, -3.89990234375, -3.359619140625, -2.8193359375, -2.279052734375, -1.73876953125, -1.198486328125, -0.658203125, -0.117919921875, 0.42236328125, 0.962646484375, 1.5029296875, 2.043212890625, 2.58349609375, 3.123779296875, 3.6640625, 4.204345703125, 4.74462890625, 5.284912109375, 5.8251953125, 6.365478515625, 6.90576171875, 7.446044921875, 7.986328125, 8.526611328125, 9.06689453125, 9.607177734375, 10.1474609375, 10.687744140625, 11.22802734375, 11.768310546875, 12.30859375, 12.848876953125, 13.38916015625, 13.929443359375, 14.4697265625, 15.010009765625, 15.55029296875, 16.090576171875, 16.630859375, 17.171142578125, 17.71142578125, 18.251708984375, 18.7919921875, 19.332275390625, 19.87255859375, 20.412841796875, 20.953125]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 6.0, 5.0, 2.0, 6.0, 6.0, 16.0, 14.0, 36.0, 36.0, 59.0, 65.0, 103.0, 122.0, 181.0, 272.0, 463.0, 1176.0, 6182.0, 297509.0, 3840866.0, 42773.0, 2674.0, 743.0, 356.0, 174.0, 124.0, 82.0, 58.0, 53.0, 42.0, 28.0, 20.0, 12.0, 9.0, 4.0, 4.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-67.5625, -65.59228515625, -63.6220703125, -61.65185546875, -59.681640625, -57.71142578125, -55.7412109375, -53.77099609375, -51.80078125, -49.83056640625, -47.8603515625, -45.89013671875, -43.919921875, -41.94970703125, -39.9794921875, -38.00927734375, -36.0390625, -34.06884765625, -32.0986328125, -30.12841796875, -28.158203125, -26.18798828125, -24.2177734375, -22.24755859375, -20.27734375, -18.30712890625, -16.3369140625, -14.36669921875, -12.396484375, -10.42626953125, -8.4560546875, -6.48583984375, -4.515625, -2.54541015625, -0.5751953125, 1.39501953125, 3.365234375, 5.33544921875, 7.3056640625, 9.27587890625, 11.24609375, 13.21630859375, 15.1865234375, 17.15673828125, 19.126953125, 21.09716796875, 23.0673828125, 25.03759765625, 27.0078125, 28.97802734375, 30.9482421875, 32.91845703125, 34.888671875, 36.85888671875, 38.8291015625, 40.79931640625, 42.76953125, 44.73974609375, 46.7099609375, 48.68017578125, 50.650390625, 52.62060546875, 54.5908203125, 56.56103515625, 58.53125]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 47.0, 928.0, 41.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-531.0335693359375, -508.3679504394531, -485.70233154296875, -463.0367431640625, -440.3711242675781, -417.70550537109375, -395.0399169921875, -372.3742980957031, -349.70867919921875, -327.0430603027344, -304.37744140625, -281.71185302734375, -259.0462341308594, -236.380615234375, -213.7150115966797, -191.04940795898438, -168.3837890625, -145.71817016601562, -123.05256652832031, -100.38695526123047, -77.72134399414062, -55.05573272705078, -32.39012145996094, -9.724517822265625, 12.94110107421875, 35.606712341308594, 58.27232360839844, 80.93793487548828, 103.60354614257812, 126.26915740966797, 148.9347686767578, 171.60037231445312, 194.26605224609375, 216.93167114257812, 239.59727478027344, 262.26287841796875, 284.9284973144531, 307.5941162109375, 330.25970458984375, 352.9253234863281, 375.5909423828125, 398.2565612792969, 420.92218017578125, 443.5877685546875, 466.2533874511719, 488.91900634765625, 511.5845947265625, 534.250244140625, 556.9158325195312, 579.5814208984375, 602.2470703125, 624.9126586914062, 647.5782470703125, 670.243896484375, 692.9094848632812, 715.5750732421875, 738.24072265625, 760.9063110351562, 783.5719604492188, 806.237548828125, 828.9031982421875, 851.5687866210938, 874.234375, 896.9000244140625, 919.5656127929688]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 5.0, 3.0, 2.0, 4.0, 8.0, 8.0, 11.0, 14.0, 10.0, 17.0, 17.0, 19.0, 26.0, 31.0, 35.0, 41.0, 36.0, 35.0, 41.0, 37.0, 38.0, 45.0, 49.0, 52.0, 43.0, 37.0, 39.0, 37.0, 35.0, 35.0, 39.0, 31.0, 19.0, 16.0, 19.0, 16.0, 11.0, 13.0, 7.0, 5.0, 11.0, 5.0, 2.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.62274169921875, -49.8785514831543, -48.13435745239258, -46.390167236328125, -44.645973205566406, -42.90178298950195, -41.1575927734375, -39.41339874267578, -37.66920471191406, -35.92501449584961, -34.18082046508789, -32.43663024902344, -30.69243621826172, -28.948246002197266, -27.20405387878418, -25.459861755371094, -23.71567153930664, -21.971479415893555, -20.22728729248047, -18.483097076416016, -16.738903045654297, -14.994711875915527, -13.250520706176758, -11.506328582763672, -9.762136459350586, -8.0179443359375, -6.273752689361572, -4.5295610427856445, -2.7853689193725586, -1.0411767959594727, 0.7030143737792969, 2.447206497192383, 4.191398620605469, 5.935590744018555, 7.679782390594482, 9.42397403717041, 11.168166160583496, 12.912358283996582, 14.656549453735352, 16.400741577148438, 18.144933700561523, 19.88912582397461, 21.633317947387695, 23.37751007080078, 25.121700286865234, 26.865894317626953, 28.610084533691406, 30.354276657104492, 32.09846878051758, 33.84265899658203, 35.58685302734375, 37.3310432434082, 39.07523727416992, 40.819427490234375, 42.563621520996094, 44.30781173706055, 46.052001953125, 47.79619216918945, 49.54038619995117, 51.284576416015625, 53.028770446777344, 54.7729606628418, 56.51715087890625, 58.26134490966797, 60.00553894042969]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 3.0, 7.0, 6.0, 5.0, 4.0, 8.0, 2.0, 13.0, 10.0, 13.0, 12.0, 26.0, 20.0, 21.0, 22.0, 39.0, 27.0, 34.0, 25.0, 21.0, 35.0, 32.0, 41.0, 30.0, 39.0, 33.0, 34.0, 43.0, 31.0, 32.0, 26.0, 32.0, 26.0, 32.0, 32.0, 15.0, 18.0, 21.0, 20.0, 17.0, 13.0, 12.0, 17.0, 9.0, 6.0, 8.0, 7.0, 7.0, 7.0, 4.0, 0.0, 3.0, 7.0, 4.0], "bins": [-9.5703125, -9.29888916015625, -9.0274658203125, -8.75604248046875, -8.484619140625, -8.21319580078125, -7.9417724609375, -7.67034912109375, -7.39892578125, -7.12750244140625, -6.8560791015625, -6.58465576171875, -6.313232421875, -6.04180908203125, -5.7703857421875, -5.49896240234375, -5.2275390625, -4.95611572265625, -4.6846923828125, -4.41326904296875, -4.141845703125, -3.87042236328125, -3.5989990234375, -3.32757568359375, -3.05615234375, -2.78472900390625, -2.5133056640625, -2.24188232421875, -1.970458984375, -1.69903564453125, -1.4276123046875, -1.15618896484375, -0.884765625, -0.61334228515625, -0.3419189453125, -0.07049560546875, 0.200927734375, 0.47235107421875, 0.7437744140625, 1.01519775390625, 1.28662109375, 1.55804443359375, 1.8294677734375, 2.10089111328125, 2.372314453125, 2.64373779296875, 2.9151611328125, 3.18658447265625, 3.4580078125, 3.72943115234375, 4.0008544921875, 4.27227783203125, 4.543701171875, 4.81512451171875, 5.0865478515625, 5.35797119140625, 5.62939453125, 5.90081787109375, 6.1722412109375, 6.44366455078125, 6.715087890625, 6.98651123046875, 7.2579345703125, 7.52935791015625, 7.80078125]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 9.0, 4.0, 9.0, 16.0, 17.0, 25.0, 48.0, 53.0, 96.0, 102.0, 176.0, 249.0, 410.0, 632.0, 888.0, 1123.0, 1766.0, 2505.0, 3623.0, 5030.0, 7395.0, 10577.0, 15502.0, 22659.0, 33136.0, 48809.0, 70807.0, 104779.0, 154553.0, 174007.0, 124163.0, 83194.0, 56934.0, 39174.0, 27002.0, 18095.0, 12526.0, 8751.0, 6097.0, 4152.0, 2880.0, 2015.0, 1407.0, 974.0, 683.0, 492.0, 321.0, 226.0, 147.0, 101.0, 73.0, 49.0, 44.0, 13.0, 18.0, 15.0, 7.0, 2.0, 6.0, 2.0], "bins": [-0.94091796875, -0.9125900268554688, -0.8842620849609375, -0.8559341430664062, -0.827606201171875, -0.7992782592773438, -0.7709503173828125, -0.7426223754882812, -0.71429443359375, -0.6859664916992188, -0.6576385498046875, -0.6293106079101562, -0.600982666015625, -0.5726547241210938, -0.5443267822265625, -0.5159988403320312, -0.4876708984375, -0.45934295654296875, -0.4310150146484375, -0.40268707275390625, -0.374359130859375, -0.34603118896484375, -0.3177032470703125, -0.28937530517578125, -0.26104736328125, -0.23271942138671875, -0.2043914794921875, -0.17606353759765625, -0.147735595703125, -0.11940765380859375, -0.0910797119140625, -0.06275177001953125, -0.034423828125, -0.00609588623046875, 0.0222320556640625, 0.05055999755859375, 0.078887939453125, 0.10721588134765625, 0.1355438232421875, 0.16387176513671875, 0.19219970703125, 0.22052764892578125, 0.2488555908203125, 0.27718353271484375, 0.305511474609375, 0.33383941650390625, 0.3621673583984375, 0.39049530029296875, 0.4188232421875, 0.44715118408203125, 0.4754791259765625, 0.5038070678710938, 0.532135009765625, 0.5604629516601562, 0.5887908935546875, 0.6171188354492188, 0.64544677734375, 0.6737747192382812, 0.7021026611328125, 0.7304306030273438, 0.758758544921875, 0.7870864868164062, 0.8154144287109375, 0.8437423706054688, 0.8720703125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 3.0, 2.0, 5.0, 7.0, 6.0, 19.0, 9.0, 18.0, 22.0, 26.0, 25.0, 27.0, 22.0, 26.0, 46.0, 42.0, 32.0, 37.0, 39.0, 39.0, 31.0, 1065.0, 50.0, 40.0, 37.0, 39.0, 29.0, 33.0, 41.0, 32.0, 20.0, 28.0, 27.0, 16.0, 21.0, 10.0, 11.0, 10.0, 12.0, 4.0, 4.0, 5.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.40234375, -6.2039794921875, -6.005615234375, -5.8072509765625, -5.60888671875, -5.4105224609375, -5.212158203125, -5.0137939453125, -4.8154296875, -4.6170654296875, -4.418701171875, -4.2203369140625, -4.02197265625, -3.8236083984375, -3.625244140625, -3.4268798828125, -3.228515625, -3.0301513671875, -2.831787109375, -2.6334228515625, -2.43505859375, -2.2366943359375, -2.038330078125, -1.8399658203125, -1.6416015625, -1.4432373046875, -1.244873046875, -1.0465087890625, -0.84814453125, -0.6497802734375, -0.451416015625, -0.2530517578125, -0.0546875, 0.1436767578125, 0.342041015625, 0.5404052734375, 0.73876953125, 0.9371337890625, 1.135498046875, 1.3338623046875, 1.5322265625, 1.7305908203125, 1.928955078125, 2.1273193359375, 2.32568359375, 2.5240478515625, 2.722412109375, 2.9207763671875, 3.119140625, 3.3175048828125, 3.515869140625, 3.7142333984375, 3.91259765625, 4.1109619140625, 4.309326171875, 4.5076904296875, 4.7060546875, 4.9044189453125, 5.102783203125, 5.3011474609375, 5.49951171875, 5.6978759765625, 5.896240234375, 6.0946044921875, 6.29296875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 10.0, 11.0, 24.0, 24.0, 35.0, 65.0, 83.0, 112.0, 149.0, 242.0, 383.0, 572.0, 787.0, 1162.0, 1768.0, 2675.0, 4100.0, 6554.0, 10130.0, 15993.0, 25685.0, 40703.0, 65122.0, 104659.0, 168644.0, 1259674.0, 145229.0, 90064.0, 56474.0, 35274.0, 21720.0, 13768.0, 8731.0, 5771.0, 3641.0, 2363.0, 1503.0, 1022.0, 656.0, 474.0, 335.0, 226.0, 163.0, 101.0, 79.0, 57.0, 37.0, 23.0, 16.0, 12.0, 16.0, 6.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0234375, -0.991790771484375, -0.96014404296875, -0.928497314453125, -0.8968505859375, -0.865203857421875, -0.83355712890625, -0.801910400390625, -0.770263671875, -0.738616943359375, -0.70697021484375, -0.675323486328125, -0.6436767578125, -0.612030029296875, -0.58038330078125, -0.548736572265625, -0.51708984375, -0.485443115234375, -0.45379638671875, -0.422149658203125, -0.3905029296875, -0.358856201171875, -0.32720947265625, -0.295562744140625, -0.263916015625, -0.232269287109375, -0.20062255859375, -0.168975830078125, -0.1373291015625, -0.105682373046875, -0.07403564453125, -0.042388916015625, -0.0107421875, 0.020904541015625, 0.05255126953125, 0.084197998046875, 0.1158447265625, 0.147491455078125, 0.17913818359375, 0.210784912109375, 0.242431640625, 0.274078369140625, 0.30572509765625, 0.337371826171875, 0.3690185546875, 0.400665283203125, 0.43231201171875, 0.463958740234375, 0.49560546875, 0.527252197265625, 0.55889892578125, 0.590545654296875, 0.6221923828125, 0.653839111328125, 0.68548583984375, 0.717132568359375, 0.748779296875, 0.780426025390625, 0.81207275390625, 0.843719482421875, 0.8753662109375, 0.907012939453125, 0.93865966796875, 0.970306396484375, 1.001953125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 3.0, 4.0, 3.0, 5.0, 6.0, 6.0, 8.0, 9.0, 20.0, 35.0, 47.0, 52.0, 59.0, 94.0, 85.0, 101.0, 76.0, 85.0, 74.0, 57.0, 51.0, 34.0, 23.0, 13.0, 14.0, 9.0, 9.0, 3.0, 4.0, 2.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0], "bins": [-0.00759124755859375, -0.007409811019897461, -0.007228374481201172, -0.007046937942504883, -0.006865501403808594, -0.006684064865112305, -0.006502628326416016, -0.0063211917877197266, -0.0061397552490234375, -0.0059583187103271484, -0.005776882171630859, -0.00559544563293457, -0.005414009094238281, -0.005232572555541992, -0.005051136016845703, -0.004869699478149414, -0.004688262939453125, -0.004506826400756836, -0.004325389862060547, -0.004143953323364258, -0.003962516784667969, -0.0037810802459716797, -0.0035996437072753906, -0.0034182071685791016, -0.0032367706298828125, -0.0030553340911865234, -0.0028738975524902344, -0.0026924610137939453, -0.0025110244750976562, -0.002329587936401367, -0.002148151397705078, -0.001966714859008789, -0.0017852783203125, -0.001603841781616211, -0.0014224052429199219, -0.0012409687042236328, -0.0010595321655273438, -0.0008780956268310547, -0.0006966590881347656, -0.0005152225494384766, -0.0003337860107421875, -0.00015234947204589844, 2.9087066650390625e-05, 0.0002105236053466797, 0.00039196014404296875, 0.0005733966827392578, 0.0007548332214355469, 0.0009362697601318359, 0.001117706298828125, 0.001299142837524414, 0.0014805793762207031, 0.0016620159149169922, 0.0018434524536132812, 0.0020248889923095703, 0.0022063255310058594, 0.0023877620697021484, 0.0025691986083984375, 0.0027506351470947266, 0.0029320716857910156, 0.0031135082244873047, 0.0032949447631835938, 0.003476381301879883, 0.003657817840576172, 0.003839254379272461, 0.00402069091796875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 5.0, 5.0, 9.0, 5.0, 12.0, 19.0, 9.0, 31.0, 43.0, 56.0, 78.0, 128.0, 209.0, 390.0, 949.0, 192913.0, 851409.0, 1163.0, 425.0, 228.0, 152.0, 90.0, 67.0, 42.0, 30.0, 16.0, 19.0, 13.0, 7.0, 7.0, 5.0, 7.0, 7.0, 3.0, 1.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08697509765625, -0.08336162567138672, -0.07974815368652344, -0.07613468170166016, -0.07252120971679688, -0.0689077377319336, -0.06529426574707031, -0.06168079376220703, -0.05806732177734375, -0.05445384979248047, -0.05084037780761719, -0.047226905822753906, -0.043613433837890625, -0.039999961853027344, -0.03638648986816406, -0.03277301788330078, -0.0291595458984375, -0.02554607391357422, -0.021932601928710938, -0.018319129943847656, -0.014705657958984375, -0.011092185974121094, -0.0074787139892578125, -0.0038652420043945312, -0.00025177001953125, 0.0033617019653320312, 0.0069751739501953125, 0.010588645935058594, 0.014202117919921875, 0.017815589904785156, 0.021429061889648438, 0.02504253387451172, 0.028656005859375, 0.03226947784423828, 0.03588294982910156, 0.039496421813964844, 0.043109893798828125, 0.046723365783691406, 0.05033683776855469, 0.05395030975341797, 0.05756378173828125, 0.06117725372314453, 0.06479072570800781, 0.0684041976928711, 0.07201766967773438, 0.07563114166259766, 0.07924461364746094, 0.08285808563232422, 0.0864715576171875, 0.09008502960205078, 0.09369850158691406, 0.09731197357177734, 0.10092544555664062, 0.1045389175415039, 0.10815238952636719, 0.11176586151123047, 0.11537933349609375, 0.11899280548095703, 0.12260627746582031, 0.1262197494506836, 0.12983322143554688, 0.13344669342041016, 0.13706016540527344, 0.14067363739013672, 0.144287109375]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 17.0, 133.0, 534.0, 297.0, 29.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0036790852900594473, -0.0033646856900304556, -0.0030502863228321075, -0.002735886722803116, -0.002421487122774124, -0.002107087755575776, -0.0017926881555467844, -0.0014782887883484364, -0.0011638891883194447, -0.0008494897047057748, -0.000535090162884444, -0.0002206906210631132, 9.370886255055666e-05, 0.00040810834616422653, 0.0007225079461932182, 0.0010369073133915663, 0.001351306913420558, 0.0016657063970342278, 0.0019801058806478977, 0.0022945054806768894, 0.002608905080705881, 0.002923304447904229, 0.003237704047933221, 0.003552103415131569, 0.0038665030151605606, 0.004180902615189552, 0.004495302215218544, 0.004809701815247536, 0.00512410094961524, 0.005438500549644232, 0.0057529001496732235, 0.006067299284040928, 0.00638169888406992, 0.006696098484098911, 0.007010498084127903, 0.007324897684156895, 0.007639296818524599, 0.007953695952892303, 0.008268095552921295, 0.008582495152950287, 0.008896894752979279, 0.00921129435300827, 0.009525693953037262, 0.009840093553066254, 0.010154493153095245, 0.010468892753124237, 0.010783292353153229, 0.011097691021859646, 0.011412091553211212, 0.011726491153240204, 0.012040890753269196, 0.012355290353298187, 0.012669689953327179, 0.01298408955335617, 0.013298489153385162, 0.01361288782209158, 0.013927287422120571, 0.014241687022149563, 0.014556086622178555, 0.014870486222207546, 0.015184885822236538, 0.015499284490942955, 0.015813684090971947, 0.01612808369100094, 0.01644248329102993]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 2.0, 3.0, 5.0, 5.0, 9.0, 9.0, 14.0, 9.0, 24.0, 25.0, 21.0, 23.0, 29.0, 26.0, 27.0, 34.0, 37.0, 54.0, 51.0, 45.0, 51.0, 54.0, 34.0, 38.0, 32.0, 45.0, 34.0, 36.0, 25.0, 35.0, 30.0, 20.0, 30.0, 12.0, 12.0, 13.0, 14.0, 9.0, 10.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0021241307258605957, -0.002050674520432949, -0.0019772183150053024, -0.0019037621095776558, -0.0018303059041500092, -0.0017568496987223625, -0.0016833934932947159, -0.0016099372878670692, -0.0015364810824394226, -0.001463024877011776, -0.0013895686715841293, -0.0013161124661564827, -0.001242656260728836, -0.0011692000553011894, -0.0010957438498735428, -0.0010222876444458961, -0.0009488314390182495, -0.0008753752335906029, -0.0008019190281629562, -0.0007284628227353096, -0.000655006617307663, -0.0005815504118800163, -0.0005080942064523697, -0.00043463800102472305, -0.0003611817955970764, -0.0002877255901694298, -0.00021426938474178314, -0.0001408131793141365, -6.735697388648987e-05, 6.099231541156769e-06, 7.95554369688034e-05, 0.00015301164239645004, 0.00022646784782409668, 0.0002999240532517433, 0.00037338025867938995, 0.0004468364641070366, 0.0005202926695346832, 0.0005937488749623299, 0.0006672050803899765, 0.0007406612858176231, 0.0008141174912452698, 0.0008875736966729164, 0.000961029902100563, 0.0010344861075282097, 0.0011079423129558563, 0.001181398518383503, 0.0012548547238111496, 0.0013283109292387962, 0.0014017671346664429, 0.0014752233400940895, 0.0015486795455217361, 0.0016221357509493828, 0.0016955919563770294, 0.001769048161804676, 0.0018425043672323227, 0.0019159605726599693, 0.001989416778087616, 0.0020628729835152626, 0.0021363291889429092, 0.002209785394370556, 0.0022832415997982025, 0.002356697805225849, 0.002430154010653496, 0.0025036102160811424, 0.002577066421508789]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 3.0, 7.0, 6.0, 5.0, 4.0, 8.0, 2.0, 14.0, 9.0, 13.0, 12.0, 26.0, 20.0, 21.0, 22.0, 39.0, 28.0, 33.0, 25.0, 22.0, 34.0, 34.0, 39.0, 31.0, 38.0, 33.0, 35.0, 43.0, 31.0, 31.0, 26.0, 33.0, 25.0, 34.0, 30.0, 15.0, 18.0, 21.0, 20.0, 17.0, 13.0, 12.0, 17.0, 9.0, 6.0, 8.0, 7.0, 7.0, 7.0, 4.0, 0.0, 3.0, 7.0, 4.0], "bins": [-9.5625, -9.29119873046875, -9.0198974609375, -8.74859619140625, -8.477294921875, -8.20599365234375, -7.9346923828125, -7.66339111328125, -7.39208984375, -7.12078857421875, -6.8494873046875, -6.57818603515625, -6.306884765625, -6.03558349609375, -5.7642822265625, -5.49298095703125, -5.2216796875, -4.95037841796875, -4.6790771484375, -4.40777587890625, -4.136474609375, -3.86517333984375, -3.5938720703125, -3.32257080078125, -3.05126953125, -2.77996826171875, -2.5086669921875, -2.23736572265625, -1.966064453125, -1.69476318359375, -1.4234619140625, -1.15216064453125, -0.880859375, -0.60955810546875, -0.3382568359375, -0.06695556640625, 0.204345703125, 0.47564697265625, 0.7469482421875, 1.01824951171875, 1.28955078125, 1.56085205078125, 1.8321533203125, 2.10345458984375, 2.374755859375, 2.64605712890625, 2.9173583984375, 3.18865966796875, 3.4599609375, 3.73126220703125, 4.0025634765625, 4.27386474609375, 4.545166015625, 4.81646728515625, 5.0877685546875, 5.35906982421875, 5.63037109375, 5.90167236328125, 6.1729736328125, 6.44427490234375, 6.715576171875, 6.98687744140625, 7.2581787109375, 7.52947998046875, 7.80078125]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 4.0, 3.0, 6.0, 10.0, 13.0, 11.0, 18.0, 23.0, 20.0, 27.0, 41.0, 52.0, 67.0, 93.0, 117.0, 171.0, 268.0, 415.0, 700.0, 1358.0, 2668.0, 6013.0, 14702.0, 38713.0, 117688.0, 415833.0, 310929.0, 86890.0, 29932.0, 11626.0, 4880.0, 2301.0, 1149.0, 610.0, 352.0, 199.0, 132.0, 131.0, 86.0, 68.0, 43.0, 43.0, 36.0, 31.0, 23.0, 19.0, 18.0, 14.0, 4.0, 2.0, 7.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.34375, -11.96826171875, -11.5927734375, -11.21728515625, -10.841796875, -10.46630859375, -10.0908203125, -9.71533203125, -9.33984375, -8.96435546875, -8.5888671875, -8.21337890625, -7.837890625, -7.46240234375, -7.0869140625, -6.71142578125, -6.3359375, -5.96044921875, -5.5849609375, -5.20947265625, -4.833984375, -4.45849609375, -4.0830078125, -3.70751953125, -3.33203125, -2.95654296875, -2.5810546875, -2.20556640625, -1.830078125, -1.45458984375, -1.0791015625, -0.70361328125, -0.328125, 0.04736328125, 0.4228515625, 0.79833984375, 1.173828125, 1.54931640625, 1.9248046875, 2.30029296875, 2.67578125, 3.05126953125, 3.4267578125, 3.80224609375, 4.177734375, 4.55322265625, 4.9287109375, 5.30419921875, 5.6796875, 6.05517578125, 6.4306640625, 6.80615234375, 7.181640625, 7.55712890625, 7.9326171875, 8.30810546875, 8.68359375, 9.05908203125, 9.4345703125, 9.81005859375, 10.185546875, 10.56103515625, 10.9365234375, 11.31201171875, 11.6875]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 3.0, 4.0, 8.0, 8.0, 7.0, 5.0, 9.0, 9.0, 11.0, 14.0, 17.0, 20.0, 27.0, 22.0, 24.0, 31.0, 32.0, 39.0, 43.0, 48.0, 63.0, 110.0, 269.0, 1566.0, 163.0, 90.0, 75.0, 38.0, 43.0, 36.0, 35.0, 24.0, 27.0, 21.0, 14.0, 18.0, 21.0, 15.0, 7.0, 10.0, 5.0, 4.0, 4.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-28.125, -27.253173828125, -26.38134765625, -25.509521484375, -24.6376953125, -23.765869140625, -22.89404296875, -22.022216796875, -21.150390625, -20.278564453125, -19.40673828125, -18.534912109375, -17.6630859375, -16.791259765625, -15.91943359375, -15.047607421875, -14.17578125, -13.303955078125, -12.43212890625, -11.560302734375, -10.6884765625, -9.816650390625, -8.94482421875, -8.072998046875, -7.201171875, -6.329345703125, -5.45751953125, -4.585693359375, -3.7138671875, -2.842041015625, -1.97021484375, -1.098388671875, -0.2265625, 0.645263671875, 1.51708984375, 2.388916015625, 3.2607421875, 4.132568359375, 5.00439453125, 5.876220703125, 6.748046875, 7.619873046875, 8.49169921875, 9.363525390625, 10.2353515625, 11.107177734375, 11.97900390625, 12.850830078125, 13.72265625, 14.594482421875, 15.46630859375, 16.338134765625, 17.2099609375, 18.081787109375, 18.95361328125, 19.825439453125, 20.697265625, 21.569091796875, 22.44091796875, 23.312744140625, 24.1845703125, 25.056396484375, 25.92822265625, 26.800048828125, 27.671875]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 1.0, 1.0, 1.0, 0.0, 6.0, 6.0, 5.0, 9.0, 11.0, 17.0, 26.0, 30.0, 48.0, 67.0, 102.0, 156.0, 233.0, 417.0, 898.0, 9505.0, 2056837.0, 1067644.0, 7700.0, 887.0, 381.0, 242.0, 142.0, 88.0, 76.0, 60.0, 31.0, 24.0, 16.0, 16.0, 11.0, 6.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-59.0, -57.26318359375, -55.5263671875, -53.78955078125, -52.052734375, -50.31591796875, -48.5791015625, -46.84228515625, -45.10546875, -43.36865234375, -41.6318359375, -39.89501953125, -38.158203125, -36.42138671875, -34.6845703125, -32.94775390625, -31.2109375, -29.47412109375, -27.7373046875, -26.00048828125, -24.263671875, -22.52685546875, -20.7900390625, -19.05322265625, -17.31640625, -15.57958984375, -13.8427734375, -12.10595703125, -10.369140625, -8.63232421875, -6.8955078125, -5.15869140625, -3.421875, -1.68505859375, 0.0517578125, 1.78857421875, 3.525390625, 5.26220703125, 6.9990234375, 8.73583984375, 10.47265625, 12.20947265625, 13.9462890625, 15.68310546875, 17.419921875, 19.15673828125, 20.8935546875, 22.63037109375, 24.3671875, 26.10400390625, 27.8408203125, 29.57763671875, 31.314453125, 33.05126953125, 34.7880859375, 36.52490234375, 38.26171875, 39.99853515625, 41.7353515625, 43.47216796875, 45.208984375, 46.94580078125, 48.6826171875, 50.41943359375, 52.15625]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 56.0, 854.0, 106.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.98699188232422, -83.28472900390625, -73.58247375488281, -63.88021469116211, -54.177955627441406, -44.4756965637207, -34.7734375, -25.07117462158203, -15.368919372558594, -5.666660308837891, 4.0355987548828125, 13.737857818603516, 23.44011688232422, 33.14237594604492, 42.844635009765625, 52.546897888183594, 62.24915313720703, 71.951416015625, 81.65367126464844, 91.35592651367188, 101.05818939208984, 110.76045227050781, 120.46270751953125, 130.16497802734375, 139.86721801757812, 149.56947326660156, 159.271728515625, 168.9739990234375, 178.67625427246094, 188.37850952148438, 198.08078002929688, 207.7830352783203, 217.48529052734375, 227.1875457763672, 236.88980102539062, 246.59207153320312, 256.2943115234375, 265.99658203125, 275.6988525390625, 285.401123046875, 295.1033630371094, 304.8056335449219, 314.50787353515625, 324.21014404296875, 333.91241455078125, 343.6146545410156, 353.3169250488281, 363.0191650390625, 372.721435546875, 382.4237060546875, 392.1259460449219, 401.8282165527344, 411.53045654296875, 421.23272705078125, 430.93499755859375, 440.63726806640625, 450.3395080566406, 460.0417785644531, 469.7440185546875, 479.4462890625, 489.1485595703125, 498.8507995605469, 508.5530700683594, 518.2553100585938, 527.9575805664062]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 6.0, 0.0, 1.0, 7.0, 9.0, 8.0, 9.0, 15.0, 14.0, 19.0, 14.0, 23.0, 21.0, 24.0, 21.0, 26.0, 29.0, 30.0, 32.0, 35.0, 34.0, 38.0, 54.0, 42.0, 42.0, 31.0, 43.0, 45.0, 39.0, 33.0, 32.0, 32.0, 35.0, 19.0, 18.0, 16.0, 15.0, 22.0, 8.0, 17.0, 15.0, 7.0, 4.0, 4.0, 6.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-67.82904815673828, -65.82946014404297, -63.82986831665039, -61.83027648925781, -59.8306884765625, -57.83109664916992, -55.831504821777344, -53.83191680908203, -51.83232498168945, -49.832733154296875, -47.83314514160156, -45.833553314208984, -43.83396530151367, -41.834373474121094, -39.83478546142578, -37.8351936340332, -35.835601806640625, -33.83600997924805, -31.836421966552734, -29.836830139160156, -27.83724021911621, -25.837650299072266, -23.83806037902832, -21.838470458984375, -19.838882446289062, -17.839292526245117, -15.839701652526855, -13.84011173248291, -11.840520858764648, -9.840930938720703, -7.841341018676758, -5.841750144958496, -3.8421592712402344, -1.8425689935684204, 0.15702128410339355, 2.156611442565918, 4.1562018394470215, 6.155792236328125, 8.15538215637207, 10.154973030090332, 12.154562950134277, 14.154152870178223, 16.153743743896484, 18.15333366394043, 20.152923583984375, 22.152515411376953, 24.152103424072266, 26.151695251464844, 28.15128517150879, 30.150875091552734, 32.15046691894531, 34.150054931640625, 36.1496467590332, 38.14923858642578, 40.148826599121094, 42.14841842651367, 44.148006439208984, 46.14759826660156, 48.147186279296875, 50.14677810668945, 52.146366119384766, 54.145957946777344, 56.145545959472656, 58.145137786865234, 60.14472961425781]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 7.0, 2.0, 6.0, 3.0, 4.0, 9.0, 8.0, 13.0, 13.0, 11.0, 20.0, 20.0, 18.0, 19.0, 37.0, 24.0, 34.0, 27.0, 31.0, 33.0, 30.0, 36.0, 39.0, 40.0, 33.0, 29.0, 36.0, 31.0, 39.0, 35.0, 28.0, 34.0, 27.0, 19.0, 19.0, 26.0, 28.0, 18.0, 17.0, 21.0, 13.0, 10.0, 3.0, 6.0, 9.0, 10.0, 9.0, 4.0, 2.0, 3.0, 2.0, 3.0, 6.0, 0.0, 1.0, 2.0], "bins": [-9.2421875, -8.9586181640625, -8.675048828125, -8.3914794921875, -8.10791015625, -7.8243408203125, -7.540771484375, -7.2572021484375, -6.9736328125, -6.6900634765625, -6.406494140625, -6.1229248046875, -5.83935546875, -5.5557861328125, -5.272216796875, -4.9886474609375, -4.705078125, -4.4215087890625, -4.137939453125, -3.8543701171875, -3.57080078125, -3.2872314453125, -3.003662109375, -2.7200927734375, -2.4365234375, -2.1529541015625, -1.869384765625, -1.5858154296875, -1.30224609375, -1.0186767578125, -0.735107421875, -0.4515380859375, -0.16796875, 0.1156005859375, 0.399169921875, 0.6827392578125, 0.96630859375, 1.2498779296875, 1.533447265625, 1.8170166015625, 2.1005859375, 2.3841552734375, 2.667724609375, 2.9512939453125, 3.23486328125, 3.5184326171875, 3.802001953125, 4.0855712890625, 4.369140625, 4.6527099609375, 4.936279296875, 5.2198486328125, 5.50341796875, 5.7869873046875, 6.070556640625, 6.3541259765625, 6.6376953125, 6.9212646484375, 7.204833984375, 7.4884033203125, 7.77197265625, 8.0555419921875, 8.339111328125, 8.6226806640625, 8.90625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 4.0, 9.0, 4.0, 3.0, 8.0, 6.0, 9.0, 15.0, 8.0, 21.0, 18.0, 24.0, 29.0, 35.0, 42.0, 68.0, 118.0, 224.0, 544.0, 2185.0, 14153.0, 324939.0, 3101916.0, 719320.0, 25810.0, 3256.0, 799.0, 271.0, 134.0, 53.0, 33.0, 41.0, 26.0, 25.0, 23.0, 16.0, 24.0, 21.0, 8.0, 7.0, 9.0, 7.0, 4.0, 3.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-26.625, -25.75537109375, -24.8857421875, -24.01611328125, -23.146484375, -22.27685546875, -21.4072265625, -20.53759765625, -19.66796875, -18.79833984375, -17.9287109375, -17.05908203125, -16.189453125, -15.31982421875, -14.4501953125, -13.58056640625, -12.7109375, -11.84130859375, -10.9716796875, -10.10205078125, -9.232421875, -8.36279296875, -7.4931640625, -6.62353515625, -5.75390625, -4.88427734375, -4.0146484375, -3.14501953125, -2.275390625, -1.40576171875, -0.5361328125, 0.33349609375, 1.203125, 2.07275390625, 2.9423828125, 3.81201171875, 4.681640625, 5.55126953125, 6.4208984375, 7.29052734375, 8.16015625, 9.02978515625, 9.8994140625, 10.76904296875, 11.638671875, 12.50830078125, 13.3779296875, 14.24755859375, 15.1171875, 15.98681640625, 16.8564453125, 17.72607421875, 18.595703125, 19.46533203125, 20.3349609375, 21.20458984375, 22.07421875, 22.94384765625, 23.8134765625, 24.68310546875, 25.552734375, 26.42236328125, 27.2919921875, 28.16162109375, 29.03125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 5.0, 6.0, 3.0, 4.0, 6.0, 7.0, 14.0, 15.0, 16.0, 24.0, 28.0, 33.0, 41.0, 54.0, 87.0, 93.0, 154.0, 235.0, 304.0, 386.0, 486.0, 458.0, 409.0, 320.0, 220.0, 158.0, 126.0, 103.0, 78.0, 51.0, 35.0, 16.0, 20.0, 17.0, 8.0, 20.0, 9.0, 3.0, 9.0, 6.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.484375, -14.0574951171875, -13.630615234375, -13.2037353515625, -12.77685546875, -12.3499755859375, -11.923095703125, -11.4962158203125, -11.0693359375, -10.6424560546875, -10.215576171875, -9.7886962890625, -9.36181640625, -8.9349365234375, -8.508056640625, -8.0811767578125, -7.654296875, -7.2274169921875, -6.800537109375, -6.3736572265625, -5.94677734375, -5.5198974609375, -5.093017578125, -4.6661376953125, -4.2392578125, -3.8123779296875, -3.385498046875, -2.9586181640625, -2.53173828125, -2.1048583984375, -1.677978515625, -1.2510986328125, -0.82421875, -0.3973388671875, 0.029541015625, 0.4564208984375, 0.88330078125, 1.3101806640625, 1.737060546875, 2.1639404296875, 2.5908203125, 3.0177001953125, 3.444580078125, 3.8714599609375, 4.29833984375, 4.7252197265625, 5.152099609375, 5.5789794921875, 6.005859375, 6.4327392578125, 6.859619140625, 7.2864990234375, 7.71337890625, 8.1402587890625, 8.567138671875, 8.9940185546875, 9.4208984375, 9.8477783203125, 10.274658203125, 10.7015380859375, 11.12841796875, 11.5552978515625, 11.982177734375, 12.4090576171875, 12.8359375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 8.0, 12.0, 11.0, 19.0, 28.0, 49.0, 51.0, 88.0, 133.0, 254.0, 557.0, 1741.0, 9826.0, 110694.0, 3292774.0, 739626.0, 32739.0, 3878.0, 927.0, 342.0, 174.0, 105.0, 89.0, 39.0, 37.0, 26.0, 18.0, 14.0, 3.0, 3.0, 6.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-42.8125, -41.648193359375, -40.48388671875, -39.319580078125, -38.1552734375, -36.990966796875, -35.82666015625, -34.662353515625, -33.498046875, -32.333740234375, -31.16943359375, -30.005126953125, -28.8408203125, -27.676513671875, -26.51220703125, -25.347900390625, -24.18359375, -23.019287109375, -21.85498046875, -20.690673828125, -19.5263671875, -18.362060546875, -17.19775390625, -16.033447265625, -14.869140625, -13.704833984375, -12.54052734375, -11.376220703125, -10.2119140625, -9.047607421875, -7.88330078125, -6.718994140625, -5.5546875, -4.390380859375, -3.22607421875, -2.061767578125, -0.8974609375, 0.266845703125, 1.43115234375, 2.595458984375, 3.759765625, 4.924072265625, 6.08837890625, 7.252685546875, 8.4169921875, 9.581298828125, 10.74560546875, 11.909912109375, 13.07421875, 14.238525390625, 15.40283203125, 16.567138671875, 17.7314453125, 18.895751953125, 20.06005859375, 21.224365234375, 22.388671875, 23.552978515625, 24.71728515625, 25.881591796875, 27.0458984375, 28.210205078125, 29.37451171875, 30.538818359375, 31.703125]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 87.0, 730.0, 195.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-721.9892578125, -709.2320556640625, -696.4747924804688, -683.7175903320312, -670.9603271484375, -658.203125, -645.4459228515625, -632.6886596679688, -619.9314575195312, -607.1742553710938, -594.4169921875, -581.6597900390625, -568.9025268554688, -556.1453247070312, -543.3880615234375, -530.630859375, -517.8736572265625, -505.1164245605469, -492.35919189453125, -479.60198974609375, -466.8447570800781, -454.0875244140625, -441.3302917480469, -428.57305908203125, -415.8157958984375, -403.0585632324219, -390.30133056640625, -377.54412841796875, -364.7868957519531, -352.0296630859375, -339.2724304199219, -326.51519775390625, -313.75799560546875, -301.0007629394531, -288.2435302734375, -275.486328125, -262.7290954589844, -249.97186279296875, -237.21463012695312, -224.4573974609375, -211.7001953125, -198.94296264648438, -186.1857452392578, -173.4285125732422, -160.67129516601562, -147.9140625, -135.15682983398438, -122.39960479736328, -109.64237213134766, -96.88514709472656, -84.12791442871094, -71.37068939208984, -58.61346435546875, -45.856239318847656, -33.09900665283203, -20.341781616210938, -7.584556579589844, 5.172670364379883, 17.92989730834961, 30.68712615966797, 43.44435119628906, 56.201576232910156, 68.95880889892578, 81.71603393554688, 94.47325897216797]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 5.0, 2.0, 4.0, 8.0, 12.0, 8.0, 9.0, 19.0, 14.0, 19.0, 24.0, 21.0, 22.0, 23.0, 24.0, 29.0, 30.0, 35.0, 38.0, 39.0, 37.0, 40.0, 29.0, 28.0, 22.0, 40.0, 35.0, 33.0, 23.0, 34.0, 33.0, 37.0, 30.0, 25.0, 22.0, 24.0, 23.0, 16.0, 13.0, 14.0, 9.0, 9.0, 10.0, 8.0, 7.0, 6.0, 8.0, 0.0, 3.0, 2.0, 3.0, 2.0], "bins": [-57.26423645019531, -55.65049362182617, -54.03675079345703, -52.42300796508789, -50.80926513671875, -49.19552230834961, -47.58177947998047, -45.96803283691406, -44.35429382324219, -42.74055099487305, -41.126808166503906, -39.513065338134766, -37.899322509765625, -36.285579681396484, -34.671836853027344, -33.05809020996094, -31.444347381591797, -29.830604553222656, -28.216861724853516, -26.603118896484375, -24.989376068115234, -23.375633239746094, -21.76188850402832, -20.14814567565918, -18.53440284729004, -16.9206600189209, -15.306917190551758, -13.6931734085083, -12.07943058013916, -10.46568775177002, -8.851943969726562, -7.238201141357422, -5.624458312988281, -4.010715484619141, -2.396972179412842, -0.783228874206543, 0.8305139541625977, 2.4442567825317383, 4.058000564575195, 5.671743392944336, 7.285486221313477, 8.899229049682617, 10.512971878051758, 12.126715660095215, 13.740458488464355, 15.354201316833496, 16.967945098876953, 18.581687927246094, 20.195430755615234, 21.809173583984375, 23.422916412353516, 25.036659240722656, 26.650402069091797, 28.264144897460938, 29.87788963317871, 31.49163246154785, 33.105377197265625, 34.719120025634766, 36.332862854003906, 37.94660568237305, 39.56034851074219, 41.17409133911133, 42.78783416748047, 44.401580810546875, 46.01531982421875]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 4.0, 7.0, 9.0, 5.0, 10.0, 9.0, 10.0, 9.0, 15.0, 14.0, 21.0, 21.0, 41.0, 17.0, 32.0, 31.0, 32.0, 37.0, 37.0, 41.0, 51.0, 31.0, 36.0, 48.0, 44.0, 33.0, 43.0, 31.0, 25.0, 30.0, 30.0, 22.0, 30.0, 21.0, 17.0, 19.0, 17.0, 11.0, 12.0, 10.0, 8.0, 6.0, 6.0, 7.0, 2.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-10.3984375, -10.0870361328125, -9.775634765625, -9.4642333984375, -9.15283203125, -8.8414306640625, -8.530029296875, -8.2186279296875, -7.9072265625, -7.5958251953125, -7.284423828125, -6.9730224609375, -6.66162109375, -6.3502197265625, -6.038818359375, -5.7274169921875, -5.416015625, -5.1046142578125, -4.793212890625, -4.4818115234375, -4.17041015625, -3.8590087890625, -3.547607421875, -3.2362060546875, -2.9248046875, -2.6134033203125, -2.302001953125, -1.9906005859375, -1.67919921875, -1.3677978515625, -1.056396484375, -0.7449951171875, -0.43359375, -0.1221923828125, 0.189208984375, 0.5006103515625, 0.81201171875, 1.1234130859375, 1.434814453125, 1.7462158203125, 2.0576171875, 2.3690185546875, 2.680419921875, 2.9918212890625, 3.30322265625, 3.6146240234375, 3.926025390625, 4.2374267578125, 4.548828125, 4.8602294921875, 5.171630859375, 5.4830322265625, 5.79443359375, 6.1058349609375, 6.417236328125, 6.7286376953125, 7.0400390625, 7.3514404296875, 7.662841796875, 7.9742431640625, 8.28564453125, 8.5970458984375, 8.908447265625, 9.2198486328125, 9.53125]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 6.0, 10.0, 7.0, 11.0, 15.0, 18.0, 43.0, 62.0, 79.0, 152.0, 226.0, 296.0, 436.0, 666.0, 957.0, 1353.0, 2193.0, 3205.0, 4821.0, 7306.0, 11318.0, 17568.0, 27031.0, 41922.0, 65601.0, 103405.0, 159820.0, 196100.0, 144582.0, 92313.0, 58853.0, 37778.0, 24394.0, 15742.0, 10386.0, 6659.0, 4361.0, 2967.0, 1871.0, 1362.0, 882.0, 571.0, 394.0, 241.0, 209.0, 130.0, 83.0, 56.0, 36.0, 25.0, 12.0, 14.0, 8.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.0166015625, -0.9831390380859375, -0.949676513671875, -0.9162139892578125, -0.88275146484375, -0.8492889404296875, -0.815826416015625, -0.7823638916015625, -0.7489013671875, -0.7154388427734375, -0.681976318359375, -0.6485137939453125, -0.61505126953125, -0.5815887451171875, -0.548126220703125, -0.5146636962890625, -0.481201171875, -0.4477386474609375, -0.414276123046875, -0.3808135986328125, -0.34735107421875, -0.3138885498046875, -0.280426025390625, -0.2469635009765625, -0.2135009765625, -0.1800384521484375, -0.146575927734375, -0.1131134033203125, -0.07965087890625, -0.0461883544921875, -0.012725830078125, 0.0207366943359375, 0.05419921875, 0.0876617431640625, 0.121124267578125, 0.1545867919921875, 0.18804931640625, 0.2215118408203125, 0.254974365234375, 0.2884368896484375, 0.3218994140625, 0.3553619384765625, 0.388824462890625, 0.4222869873046875, 0.45574951171875, 0.4892120361328125, 0.522674560546875, 0.5561370849609375, 0.589599609375, 0.6230621337890625, 0.656524658203125, 0.6899871826171875, 0.72344970703125, 0.7569122314453125, 0.790374755859375, 0.8238372802734375, 0.8572998046875, 0.8907623291015625, 0.924224853515625, 0.9576873779296875, 0.99114990234375, 1.0246124267578125, 1.058074951171875, 1.0915374755859375, 1.125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 9.0, 3.0, 9.0, 12.0, 11.0, 13.0, 9.0, 20.0, 28.0, 27.0, 24.0, 36.0, 42.0, 30.0, 50.0, 55.0, 43.0, 48.0, 41.0, 1076.0, 47.0, 50.0, 45.0, 50.0, 40.0, 27.0, 26.0, 24.0, 18.0, 20.0, 21.0, 18.0, 10.0, 8.0, 11.0, 5.0, 7.0, 4.0, 1.0, 5.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.75390625, -7.5125732421875, -7.271240234375, -7.0299072265625, -6.78857421875, -6.5472412109375, -6.305908203125, -6.0645751953125, -5.8232421875, -5.5819091796875, -5.340576171875, -5.0992431640625, -4.85791015625, -4.6165771484375, -4.375244140625, -4.1339111328125, -3.892578125, -3.6512451171875, -3.409912109375, -3.1685791015625, -2.92724609375, -2.6859130859375, -2.444580078125, -2.2032470703125, -1.9619140625, -1.7205810546875, -1.479248046875, -1.2379150390625, -0.99658203125, -0.7552490234375, -0.513916015625, -0.2725830078125, -0.03125, 0.2100830078125, 0.451416015625, 0.6927490234375, 0.93408203125, 1.1754150390625, 1.416748046875, 1.6580810546875, 1.8994140625, 2.1407470703125, 2.382080078125, 2.6234130859375, 2.86474609375, 3.1060791015625, 3.347412109375, 3.5887451171875, 3.830078125, 4.0714111328125, 4.312744140625, 4.5540771484375, 4.79541015625, 5.0367431640625, 5.278076171875, 5.5194091796875, 5.7607421875, 6.0020751953125, 6.243408203125, 6.4847412109375, 6.72607421875, 6.9674072265625, 7.208740234375, 7.4500732421875, 7.69140625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 7.0, 9.0, 18.0, 28.0, 57.0, 59.0, 94.0, 122.0, 202.0, 246.0, 392.0, 562.0, 842.0, 1309.0, 1980.0, 3021.0, 4746.0, 7560.0, 12215.0, 20122.0, 33634.0, 56480.0, 95779.0, 165772.0, 1286425.0, 165230.0, 96153.0, 56695.0, 33660.0, 19985.0, 12169.0, 7747.0, 4762.0, 3096.0, 2006.0, 1315.0, 816.0, 610.0, 399.0, 249.0, 175.0, 125.0, 85.0, 42.0, 39.0, 20.0, 22.0, 22.0, 10.0, 13.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.232421875, -1.1945037841796875, -1.156585693359375, -1.1186676025390625, -1.08074951171875, -1.0428314208984375, -1.004913330078125, -0.9669952392578125, -0.9290771484375, -0.8911590576171875, -0.853240966796875, -0.8153228759765625, -0.77740478515625, -0.7394866943359375, -0.701568603515625, -0.6636505126953125, -0.625732421875, -0.5878143310546875, -0.549896240234375, -0.5119781494140625, -0.47406005859375, -0.4361419677734375, -0.398223876953125, -0.3603057861328125, -0.3223876953125, -0.2844696044921875, -0.246551513671875, -0.2086334228515625, -0.17071533203125, -0.1327972412109375, -0.094879150390625, -0.0569610595703125, -0.01904296875, 0.0188751220703125, 0.056793212890625, 0.0947113037109375, 0.13262939453125, 0.1705474853515625, 0.208465576171875, 0.2463836669921875, 0.2843017578125, 0.3222198486328125, 0.360137939453125, 0.3980560302734375, 0.43597412109375, 0.4738922119140625, 0.511810302734375, 0.5497283935546875, 0.587646484375, 0.6255645751953125, 0.663482666015625, 0.7014007568359375, 0.73931884765625, 0.7772369384765625, 0.815155029296875, 0.8530731201171875, 0.8909912109375, 0.9289093017578125, 0.966827392578125, 1.0047454833984375, 1.04266357421875, 1.0805816650390625, 1.118499755859375, 1.1564178466796875, 1.1943359375]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 6.0, 5.0, 15.0, 11.0, 23.0, 22.0, 32.0, 30.0, 60.0, 66.0, 80.0, 74.0, 71.0, 72.0, 91.0, 61.0, 53.0, 45.0, 29.0, 37.0, 23.0, 20.0, 13.0, 18.0, 7.0, 9.0, 5.0, 1.0, 2.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.005878448486328125, -0.005696475505828857, -0.00551450252532959, -0.005332529544830322, -0.005150556564331055, -0.004968583583831787, -0.0047866106033325195, -0.004604637622833252, -0.004422664642333984, -0.004240691661834717, -0.004058718681335449, -0.0038767457008361816, -0.003694772720336914, -0.0035127997398376465, -0.003330826759338379, -0.0031488537788391113, -0.0029668807983398438, -0.002784907817840576, -0.0026029348373413086, -0.002420961856842041, -0.0022389888763427734, -0.002057015895843506, -0.0018750429153442383, -0.0016930699348449707, -0.0015110969543457031, -0.0013291239738464355, -0.001147150993347168, -0.0009651780128479004, -0.0007832050323486328, -0.0006012320518493652, -0.00041925907135009766, -0.00023728609085083008, -5.53131103515625e-05, 0.00012665987014770508, 0.00030863285064697266, 0.0004906058311462402, 0.0006725788116455078, 0.0008545517921447754, 0.001036524772644043, 0.0012184977531433105, 0.0014004707336425781, 0.0015824437141418457, 0.0017644166946411133, 0.0019463896751403809, 0.0021283626556396484, 0.002310335636138916, 0.0024923086166381836, 0.002674281597137451, 0.0028562545776367188, 0.0030382275581359863, 0.003220200538635254, 0.0034021735191345215, 0.003584146499633789, 0.0037661194801330566, 0.003948092460632324, 0.004130065441131592, 0.004312038421630859, 0.004494011402130127, 0.0046759843826293945, 0.004857957363128662, 0.00503993034362793, 0.005221903324127197, 0.005403876304626465, 0.005585849285125732, 0.005767822265625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 1.0, 6.0, 3.0, 5.0, 5.0, 7.0, 11.0, 14.0, 15.0, 12.0, 35.0, 31.0, 58.0, 77.0, 110.0, 180.0, 279.0, 731.0, 15154.0, 1029061.0, 1493.0, 500.0, 261.0, 150.0, 97.0, 86.0, 44.0, 42.0, 24.0, 18.0, 11.0, 9.0, 9.0, 8.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.123779296875, -0.11981964111328125, -0.1158599853515625, -0.11190032958984375, -0.107940673828125, -0.10398101806640625, -0.1000213623046875, -0.09606170654296875, -0.09210205078125, -0.08814239501953125, -0.0841827392578125, -0.08022308349609375, -0.076263427734375, -0.07230377197265625, -0.0683441162109375, -0.06438446044921875, -0.0604248046875, -0.05646514892578125, -0.0525054931640625, -0.04854583740234375, -0.044586181640625, -0.04062652587890625, -0.0366668701171875, -0.03270721435546875, -0.02874755859375, -0.02478790283203125, -0.0208282470703125, -0.01686859130859375, -0.012908935546875, -0.00894927978515625, -0.0049896240234375, -0.00102996826171875, 0.0029296875, 0.00688934326171875, 0.0108489990234375, 0.01480865478515625, 0.018768310546875, 0.02272796630859375, 0.0266876220703125, 0.03064727783203125, 0.03460693359375, 0.03856658935546875, 0.0425262451171875, 0.04648590087890625, 0.050445556640625, 0.05440521240234375, 0.0583648681640625, 0.06232452392578125, 0.0662841796875, 0.07024383544921875, 0.0742034912109375, 0.07816314697265625, 0.082122802734375, 0.08608245849609375, 0.0900421142578125, 0.09400177001953125, 0.09796142578125, 0.10192108154296875, 0.1058807373046875, 0.10984039306640625, 0.113800048828125, 0.11775970458984375, 0.1217193603515625, 0.12567901611328125, 0.129638671875]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 113.0, 855.0, 47.0, 1.0, 0.0, 1.0], "bins": [-0.04218907281756401, -0.04147898405790329, -0.04076889529824257, -0.04005880653858185, -0.03934871777892113, -0.038638629019260406, -0.03792853653430939, -0.037218447774648666, -0.036508359014987946, -0.035798270255327225, -0.035088181495666504, -0.03437809273600578, -0.03366800397634506, -0.03295791149139404, -0.03224782645702362, -0.0315377339720726, -0.03082764707505703, -0.03011755831539631, -0.029407469555735588, -0.028697378933429718, -0.027987290173768997, -0.027277201414108276, -0.026567112654447556, -0.025857023894786835, -0.025146935135126114, -0.024436846375465393, -0.023726757615804672, -0.02301666885614395, -0.02230657823383808, -0.02159648947417736, -0.02088640071451664, -0.02017631195485592, -0.019466223195195198, -0.018756134435534477, -0.018046045675873756, -0.017335955053567886, -0.016625866293907166, -0.015915777534246445, -0.015205688774585724, -0.014495600014925003, -0.013785510323941708, -0.013075421564280987, -0.012365331873297691, -0.01165524311363697, -0.01094515435397625, -0.010235064662992954, -0.009524975903332233, -0.008814886212348938, -0.008104797452688217, -0.007394708227366209, -0.006684619002044201, -0.00597453024238348, -0.005264441017061472, -0.004554351791739464, -0.003844263032078743, -0.003134173806756735, -0.0024240845814347267, -0.0017139954725280404, -0.001003906363621354, -0.0002938173711299896, 0.0004162718541920185, 0.0011263610795140266, 0.0018364498391747475, 0.0025465390644967556, 0.0032566282898187637]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 5.0, 3.0, 8.0, 9.0, 7.0, 9.0, 3.0, 13.0, 14.0, 18.0, 16.0, 26.0, 31.0, 31.0, 34.0, 49.0, 32.0, 40.0, 46.0, 39.0, 39.0, 49.0, 49.0, 41.0, 38.0, 33.0, 32.0, 30.0, 32.0, 33.0, 21.0, 28.0, 23.0, 22.0, 28.0, 18.0, 16.0, 6.0, 8.0, 8.0, 3.0, 1.0, 4.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.002894580364227295, -0.0028132395818829536, -0.0027318987995386124, -0.002650558017194271, -0.00256921723484993, -0.0024878764525055885, -0.0024065356701612473, -0.002325194887816906, -0.0022438541054725647, -0.0021625133231282234, -0.002081172540783882, -0.001999831758439541, -0.0019184909760951996, -0.0018371501937508583, -0.001755809411406517, -0.0016744686290621758, -0.0015931278467178345, -0.0015117870643734932, -0.001430446282029152, -0.0013491054996848106, -0.0012677647173404694, -0.001186423934996128, -0.0011050831526517868, -0.0010237423703074455, -0.0009424015879631042, -0.000861060805618763, -0.0007797200232744217, -0.0006983792409300804, -0.0006170384585857391, -0.0005356976762413979, -0.0004543568938970566, -0.0003730161115527153, -0.000291675329208374, -0.00021033454686403275, -0.00012899376451969147, -4.765298217535019e-05, 3.368780016899109e-05, 0.00011502858251333237, 0.00019636936485767365, 0.0002777101472020149, 0.0003590509295463562, 0.0004403917118906975, 0.0005217324942350388, 0.00060307327657938, 0.0006844140589237213, 0.0007657548412680626, 0.0008470956236124039, 0.0009284364059567451, 0.0010097771883010864, 0.0010911179706454277, 0.001172458752989769, 0.0012537995353341103, 0.0013351403176784515, 0.0014164811000227928, 0.001497821882367134, 0.0015791626647114754, 0.0016605034470558167, 0.001741844229400158, 0.0018231850117444992, 0.0019045257940888405, 0.0019858665764331818, 0.002067207358777523, 0.0021485481411218643, 0.0022298889234662056, 0.002311229705810547]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 4.0, 7.0, 9.0, 5.0, 10.0, 9.0, 10.0, 9.0, 15.0, 14.0, 21.0, 21.0, 39.0, 20.0, 32.0, 30.0, 32.0, 37.0, 37.0, 41.0, 51.0, 31.0, 36.0, 48.0, 44.0, 33.0, 43.0, 31.0, 25.0, 30.0, 30.0, 22.0, 30.0, 21.0, 17.0, 19.0, 17.0, 11.0, 12.0, 10.0, 8.0, 6.0, 6.0, 7.0, 2.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-10.3984375, -10.0870361328125, -9.775634765625, -9.4642333984375, -9.15283203125, -8.8414306640625, -8.530029296875, -8.2186279296875, -7.9072265625, -7.5958251953125, -7.284423828125, -6.9730224609375, -6.66162109375, -6.3502197265625, -6.038818359375, -5.7274169921875, -5.416015625, -5.1046142578125, -4.793212890625, -4.4818115234375, -4.17041015625, -3.8590087890625, -3.547607421875, -3.2362060546875, -2.9248046875, -2.6134033203125, -2.302001953125, -1.9906005859375, -1.67919921875, -1.3677978515625, -1.056396484375, -0.7449951171875, -0.43359375, -0.1221923828125, 0.189208984375, 0.5006103515625, 0.81201171875, 1.1234130859375, 1.434814453125, 1.7462158203125, 2.0576171875, 2.3690185546875, 2.680419921875, 2.9918212890625, 3.30322265625, 3.6146240234375, 3.926025390625, 4.2374267578125, 4.548828125, 4.8602294921875, 5.171630859375, 5.4830322265625, 5.79443359375, 6.1058349609375, 6.417236328125, 6.7286376953125, 7.0400390625, 7.3514404296875, 7.662841796875, 7.9742431640625, 8.28564453125, 8.5970458984375, 8.908447265625, 9.2198486328125, 9.53125]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 3.0, 3.0, 5.0, 6.0, 9.0, 9.0, 12.0, 16.0, 27.0, 22.0, 42.0, 48.0, 77.0, 97.0, 101.0, 158.0, 205.0, 274.0, 366.0, 581.0, 887.0, 1581.0, 2934.0, 6302.0, 15934.0, 45524.0, 146340.0, 426818.0, 274111.0, 80023.0, 26191.0, 9768.0, 4311.0, 2180.0, 1144.0, 659.0, 451.0, 354.0, 250.0, 175.0, 142.0, 102.0, 77.0, 51.0, 50.0, 33.0, 32.0, 26.0, 16.0, 14.0, 6.0, 6.0, 5.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-11.5234375, -11.148681640625, -10.77392578125, -10.399169921875, -10.0244140625, -9.649658203125, -9.27490234375, -8.900146484375, -8.525390625, -8.150634765625, -7.77587890625, -7.401123046875, -7.0263671875, -6.651611328125, -6.27685546875, -5.902099609375, -5.52734375, -5.152587890625, -4.77783203125, -4.403076171875, -4.0283203125, -3.653564453125, -3.27880859375, -2.904052734375, -2.529296875, -2.154541015625, -1.77978515625, -1.405029296875, -1.0302734375, -0.655517578125, -0.28076171875, 0.093994140625, 0.46875, 0.843505859375, 1.21826171875, 1.593017578125, 1.9677734375, 2.342529296875, 2.71728515625, 3.092041015625, 3.466796875, 3.841552734375, 4.21630859375, 4.591064453125, 4.9658203125, 5.340576171875, 5.71533203125, 6.090087890625, 6.46484375, 6.839599609375, 7.21435546875, 7.589111328125, 7.9638671875, 8.338623046875, 8.71337890625, 9.088134765625, 9.462890625, 9.837646484375, 10.21240234375, 10.587158203125, 10.9619140625, 11.336669921875, 11.71142578125, 12.086181640625, 12.4609375]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 2.0, 5.0, 3.0, 3.0, 8.0, 5.0, 10.0, 13.0, 12.0, 10.0, 14.0, 24.0, 25.0, 30.0, 19.0, 31.0, 48.0, 43.0, 51.0, 53.0, 76.0, 118.0, 281.0, 1423.0, 211.0, 81.0, 69.0, 55.0, 44.0, 37.0, 31.0, 31.0, 25.0, 25.0, 26.0, 23.0, 16.0, 12.0, 8.0, 11.0, 14.0, 6.0, 2.0, 8.0, 1.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-27.0, -26.18798828125, -25.3759765625, -24.56396484375, -23.751953125, -22.93994140625, -22.1279296875, -21.31591796875, -20.50390625, -19.69189453125, -18.8798828125, -18.06787109375, -17.255859375, -16.44384765625, -15.6318359375, -14.81982421875, -14.0078125, -13.19580078125, -12.3837890625, -11.57177734375, -10.759765625, -9.94775390625, -9.1357421875, -8.32373046875, -7.51171875, -6.69970703125, -5.8876953125, -5.07568359375, -4.263671875, -3.45166015625, -2.6396484375, -1.82763671875, -1.015625, -0.20361328125, 0.6083984375, 1.42041015625, 2.232421875, 3.04443359375, 3.8564453125, 4.66845703125, 5.48046875, 6.29248046875, 7.1044921875, 7.91650390625, 8.728515625, 9.54052734375, 10.3525390625, 11.16455078125, 11.9765625, 12.78857421875, 13.6005859375, 14.41259765625, 15.224609375, 16.03662109375, 16.8486328125, 17.66064453125, 18.47265625, 19.28466796875, 20.0966796875, 20.90869140625, 21.720703125, 22.53271484375, 23.3447265625, 24.15673828125, 24.96875]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 8.0, 4.0, 9.0, 14.0, 12.0, 17.0, 24.0, 55.0, 51.0, 76.0, 117.0, 186.0, 271.0, 431.0, 1022.0, 7544.0, 1523304.0, 1602757.0, 7512.0, 1012.0, 425.0, 241.0, 174.0, 125.0, 84.0, 65.0, 37.0, 34.0, 20.0, 19.0, 11.0, 9.0, 7.0, 7.0, 5.0, 5.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-61.3125, -59.50927734375, -57.7060546875, -55.90283203125, -54.099609375, -52.29638671875, -50.4931640625, -48.68994140625, -46.88671875, -45.08349609375, -43.2802734375, -41.47705078125, -39.673828125, -37.87060546875, -36.0673828125, -34.26416015625, -32.4609375, -30.65771484375, -28.8544921875, -27.05126953125, -25.248046875, -23.44482421875, -21.6416015625, -19.83837890625, -18.03515625, -16.23193359375, -14.4287109375, -12.62548828125, -10.822265625, -9.01904296875, -7.2158203125, -5.41259765625, -3.609375, -1.80615234375, -0.0029296875, 1.80029296875, 3.603515625, 5.40673828125, 7.2099609375, 9.01318359375, 10.81640625, 12.61962890625, 14.4228515625, 16.22607421875, 18.029296875, 19.83251953125, 21.6357421875, 23.43896484375, 25.2421875, 27.04541015625, 28.8486328125, 30.65185546875, 32.455078125, 34.25830078125, 36.0615234375, 37.86474609375, 39.66796875, 41.47119140625, 43.2744140625, 45.07763671875, 46.880859375, 48.68408203125, 50.4873046875, 52.29052734375, 54.09375]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 27.0, 879.0, 108.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-401.6973876953125, -390.73602294921875, -379.7746276855469, -368.8132629394531, -357.85186767578125, -346.8905029296875, -335.92913818359375, -324.9677429199219, -314.00634765625, -303.04498291015625, -292.0835876464844, -281.1222229003906, -270.16082763671875, -259.199462890625, -248.2380828857422, -237.27670288085938, -226.31533813476562, -215.3539581298828, -204.392578125, -193.43121337890625, -182.46981811523438, -171.50845336914062, -160.5470733642578, -149.585693359375, -138.6243133544922, -127.66293334960938, -116.70155334472656, -105.74018096923828, -94.77880096435547, -83.81742095947266, -72.85604858398438, -61.89466857910156, -50.93328857421875, -39.97190856933594, -29.01053237915039, -18.049156188964844, -7.087776184082031, 3.8736038208007812, 14.834976196289062, 25.796356201171875, 36.75773620605469, 47.7191162109375, 58.68049240112305, 69.6418685913086, 80.6032485961914, 91.56462860107422, 102.5260009765625, 113.48738098144531, 124.44876098632812, 135.41014099121094, 146.37152099609375, 157.3328857421875, 168.29428100585938, 179.25564575195312, 190.21702575683594, 201.17840576171875, 212.13978576660156, 223.10116577148438, 234.0625457763672, 245.02392578125, 255.98529052734375, 266.9466857910156, 277.9080505371094, 288.86944580078125, 299.830810546875]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 6.0, 3.0, 4.0, 2.0, 9.0, 9.0, 10.0, 13.0, 10.0, 22.0, 21.0, 24.0, 28.0, 29.0, 36.0, 27.0, 44.0, 45.0, 41.0, 33.0, 38.0, 52.0, 45.0, 36.0, 45.0, 41.0, 39.0, 46.0, 37.0, 29.0, 31.0, 29.0, 21.0, 18.0, 15.0, 18.0, 8.0, 17.0, 8.0, 2.0, 7.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-67.79914855957031, -65.72964477539062, -63.660133361816406, -61.59062576293945, -59.5211181640625, -57.45161437988281, -55.38210678100586, -53.312599182128906, -51.24309158325195, -49.173583984375, -47.10407638549805, -45.034568786621094, -42.965065002441406, -40.89555358886719, -38.8260498046875, -36.75654220581055, -34.687034606933594, -32.61752700805664, -30.548019409179688, -28.478513717651367, -26.409006118774414, -24.33949851989746, -22.26999282836914, -20.200485229492188, -18.130977630615234, -16.06147003173828, -13.991963386535645, -11.922456741333008, -9.852949142456055, -7.783441543579102, -5.713934898376465, -3.644428253173828, -1.574920654296875, 0.4945864677429199, 2.564093589782715, 4.63360071182251, 6.703107833862305, 8.772615432739258, 10.842122077941895, 12.911628723144531, 14.981136322021484, 17.050643920898438, 19.12015151977539, 21.18965721130371, 23.259164810180664, 25.328672409057617, 27.398178100585938, 29.46768569946289, 31.537193298339844, 33.6067008972168, 35.67620849609375, 37.7457160949707, 39.815223693847656, 41.884727478027344, 43.9542350769043, 46.02374267578125, 48.0932502746582, 50.162757873535156, 52.23226547241211, 54.30177307128906, 56.37127685546875, 58.44078826904297, 60.510292053222656, 62.57979965209961, 64.64930725097656]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 6.0, 7.0, 11.0, 8.0, 7.0, 7.0, 15.0, 16.0, 15.0, 18.0, 24.0, 22.0, 30.0, 35.0, 31.0, 39.0, 40.0, 43.0, 42.0, 33.0, 49.0, 44.0, 43.0, 51.0, 32.0, 26.0, 29.0, 20.0, 30.0, 27.0, 33.0, 22.0, 22.0, 15.0, 18.0, 14.0, 14.0, 14.0, 9.0, 9.0, 6.0, 8.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0], "bins": [-10.2109375, -9.893798828125, -9.57666015625, -9.259521484375, -8.9423828125, -8.625244140625, -8.30810546875, -7.990966796875, -7.673828125, -7.356689453125, -7.03955078125, -6.722412109375, -6.4052734375, -6.088134765625, -5.77099609375, -5.453857421875, -5.13671875, -4.819580078125, -4.50244140625, -4.185302734375, -3.8681640625, -3.551025390625, -3.23388671875, -2.916748046875, -2.599609375, -2.282470703125, -1.96533203125, -1.648193359375, -1.3310546875, -1.013916015625, -0.69677734375, -0.379638671875, -0.0625, 0.254638671875, 0.57177734375, 0.888916015625, 1.2060546875, 1.523193359375, 1.84033203125, 2.157470703125, 2.474609375, 2.791748046875, 3.10888671875, 3.426025390625, 3.7431640625, 4.060302734375, 4.37744140625, 4.694580078125, 5.01171875, 5.328857421875, 5.64599609375, 5.963134765625, 6.2802734375, 6.597412109375, 6.91455078125, 7.231689453125, 7.548828125, 7.865966796875, 8.18310546875, 8.500244140625, 8.8173828125, 9.134521484375, 9.45166015625, 9.768798828125, 10.0859375]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 3.0, 9.0, 5.0, 6.0, 5.0, 11.0, 16.0, 18.0, 20.0, 35.0, 34.0, 35.0, 59.0, 85.0, 122.0, 123.0, 195.0, 263.0, 361.0, 448.0, 1104.0, 4185242.0, 4092.0, 474.0, 338.0, 297.0, 224.0, 161.0, 108.0, 78.0, 70.0, 41.0, 47.0, 34.0, 25.0, 23.0, 17.0, 10.0, 12.0, 8.0, 7.0, 6.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-239.625, -232.056640625, -224.48828125, -216.919921875, -209.3515625, -201.783203125, -194.21484375, -186.646484375, -179.078125, -171.509765625, -163.94140625, -156.373046875, -148.8046875, -141.236328125, -133.66796875, -126.099609375, -118.53125, -110.962890625, -103.39453125, -95.826171875, -88.2578125, -80.689453125, -73.12109375, -65.552734375, -57.984375, -50.416015625, -42.84765625, -35.279296875, -27.7109375, -20.142578125, -12.57421875, -5.005859375, 2.5625, 10.130859375, 17.69921875, 25.267578125, 32.8359375, 40.404296875, 47.97265625, 55.541015625, 63.109375, 70.677734375, 78.24609375, 85.814453125, 93.3828125, 100.951171875, 108.51953125, 116.087890625, 123.65625, 131.224609375, 138.79296875, 146.361328125, 153.9296875, 161.498046875, 169.06640625, 176.634765625, 184.203125, 191.771484375, 199.33984375, 206.908203125, 214.4765625, 222.044921875, 229.61328125, 237.181640625, 244.75]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 11.0, 5.0, 10.0, 13.0, 26.0, 28.0, 39.0, 53.0, 52.0, 91.0, 143.0, 196.0, 304.0, 532.0, 657.0, 607.0, 450.0, 285.0, 165.0, 112.0, 69.0, 68.0, 45.0, 24.0, 23.0, 18.0, 9.0, 7.0, 17.0, 5.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-22.296875, -21.69140625, -21.0859375, -20.48046875, -19.875, -19.26953125, -18.6640625, -18.05859375, -17.453125, -16.84765625, -16.2421875, -15.63671875, -15.03125, -14.42578125, -13.8203125, -13.21484375, -12.609375, -12.00390625, -11.3984375, -10.79296875, -10.1875, -9.58203125, -8.9765625, -8.37109375, -7.765625, -7.16015625, -6.5546875, -5.94921875, -5.34375, -4.73828125, -4.1328125, -3.52734375, -2.921875, -2.31640625, -1.7109375, -1.10546875, -0.5, 0.10546875, 0.7109375, 1.31640625, 1.921875, 2.52734375, 3.1328125, 3.73828125, 4.34375, 4.94921875, 5.5546875, 6.16015625, 6.765625, 7.37109375, 7.9765625, 8.58203125, 9.1875, 9.79296875, 10.3984375, 11.00390625, 11.609375, 12.21484375, 12.8203125, 13.42578125, 14.03125, 14.63671875, 15.2421875, 15.84765625, 16.453125]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 5.0, 7.0, 7.0, 11.0, 10.0, 9.0, 16.0, 21.0, 21.0, 30.0, 35.0, 37.0, 60.0, 75.0, 97.0, 224.0, 1590.0, 3980504.0, 210292.0, 683.0, 186.0, 75.0, 55.0, 49.0, 31.0, 35.0, 29.0, 22.0, 23.0, 10.0, 7.0, 6.0, 7.0, 3.0, 8.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-158.875, -154.31640625, -149.7578125, -145.19921875, -140.640625, -136.08203125, -131.5234375, -126.96484375, -122.40625, -117.84765625, -113.2890625, -108.73046875, -104.171875, -99.61328125, -95.0546875, -90.49609375, -85.9375, -81.37890625, -76.8203125, -72.26171875, -67.703125, -63.14453125, -58.5859375, -54.02734375, -49.46875, -44.91015625, -40.3515625, -35.79296875, -31.234375, -26.67578125, -22.1171875, -17.55859375, -13.0, -8.44140625, -3.8828125, 0.67578125, 5.234375, 9.79296875, 14.3515625, 18.91015625, 23.46875, 28.02734375, 32.5859375, 37.14453125, 41.703125, 46.26171875, 50.8203125, 55.37890625, 59.9375, 64.49609375, 69.0546875, 73.61328125, 78.171875, 82.73046875, 87.2890625, 91.84765625, 96.40625, 100.96484375, 105.5234375, 110.08203125, 114.640625, 119.19921875, 123.7578125, 128.31640625, 132.875]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [2.0, 1.0, 12.0, 449.0, 542.0, 12.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.8243522644043, -44.18359375, -29.54283905029297, -14.902080535888672, -0.2613258361816406, 14.37942886352539, 29.020191192626953, 43.660945892333984, 58.301700592041016, 72.94245910644531, 87.58321380615234, 102.22396850585938, 116.86473083496094, 131.50547790527344, 146.146240234375, 160.78700256347656, 175.42774963378906, 190.06851196289062, 204.70925903320312, 219.3500213623047, 233.99078369140625, 248.63153076171875, 263.27227783203125, 277.9130554199219, 292.5538024902344, 307.1945495605469, 321.8353271484375, 336.47607421875, 351.1168212890625, 365.757568359375, 380.3983459472656, 395.0390930175781, 409.67987060546875, 424.32061767578125, 438.9613952636719, 453.6021423339844, 468.2428894042969, 482.8836669921875, 497.5244140625, 512.1651611328125, 526.805908203125, 541.4466552734375, 556.08740234375, 570.7281494140625, 585.3689575195312, 600.0097045898438, 614.6504516601562, 629.2911987304688, 643.9320068359375, 658.57275390625, 673.2135009765625, 687.854248046875, 702.4950561523438, 717.1358032226562, 731.7765502929688, 746.4172973632812, 761.0580444335938, 775.6987915039062, 790.3395385742188, 804.9803466796875, 819.62109375, 834.2618408203125, 848.902587890625, 863.5433349609375, 878.18408203125]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 6.0, 2.0, 3.0, 9.0, 11.0, 8.0, 14.0, 12.0, 15.0, 18.0, 23.0, 15.0, 18.0, 24.0, 25.0, 33.0, 36.0, 34.0, 38.0, 40.0, 28.0, 44.0, 37.0, 35.0, 48.0, 40.0, 50.0, 41.0, 35.0, 38.0, 23.0, 34.0, 23.0, 26.0, 17.0, 17.0, 17.0, 12.0, 14.0, 9.0, 10.0, 5.0, 2.0, 6.0, 6.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.87939453125, -53.015987396240234, -51.15258026123047, -49.2891731262207, -47.42576599121094, -45.562355041503906, -43.69894790649414, -41.835540771484375, -39.97213363647461, -38.108726501464844, -36.24531936645508, -34.38191223144531, -32.51850128173828, -30.65509605407715, -28.79168701171875, -26.928279876708984, -25.06487274169922, -23.201465606689453, -21.338058471679688, -19.47464942932129, -17.611242294311523, -15.747835159301758, -13.884427070617676, -12.021018981933594, -10.157611846923828, -8.294204711914062, -6.4307966232299805, -4.567389011383057, -2.703981399536133, -0.8405742645263672, 1.0228338241577148, 2.886241912841797, 4.7496490478515625, 6.613056659698486, 8.47646427154541, 10.339872360229492, 12.203279495239258, 14.066686630249023, 15.930094718933105, 17.793502807617188, 19.656909942626953, 21.52031707763672, 23.383724212646484, 25.247133255004883, 27.11054039001465, 28.973947525024414, 30.837356567382812, 32.70076370239258, 34.564170837402344, 36.42757797241211, 38.290985107421875, 40.15439224243164, 42.017799377441406, 43.88121032714844, 45.7446174621582, 47.60802459716797, 49.471431732177734, 51.3348388671875, 53.198246002197266, 55.06165313720703, 56.92506408691406, 58.78846740722656, 60.651878356933594, 62.51528549194336, 64.37869262695312]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 0.0, 3.0, 5.0, 3.0, 4.0, 6.0, 15.0, 15.0, 6.0, 18.0, 12.0, 18.0, 16.0, 27.0, 19.0, 23.0, 25.0, 33.0, 32.0, 36.0, 32.0, 48.0, 35.0, 37.0, 39.0, 39.0, 35.0, 38.0, 38.0, 33.0, 34.0, 33.0, 33.0, 34.0, 26.0, 17.0, 18.0, 21.0, 19.0, 14.0, 13.0, 6.0, 10.0, 8.0, 3.0, 6.0, 4.0, 6.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-9.8515625, -9.551513671875, -9.25146484375, -8.951416015625, -8.6513671875, -8.351318359375, -8.05126953125, -7.751220703125, -7.451171875, -7.151123046875, -6.85107421875, -6.551025390625, -6.2509765625, -5.950927734375, -5.65087890625, -5.350830078125, -5.05078125, -4.750732421875, -4.45068359375, -4.150634765625, -3.8505859375, -3.550537109375, -3.25048828125, -2.950439453125, -2.650390625, -2.350341796875, -2.05029296875, -1.750244140625, -1.4501953125, -1.150146484375, -0.85009765625, -0.550048828125, -0.25, 0.050048828125, 0.35009765625, 0.650146484375, 0.9501953125, 1.250244140625, 1.55029296875, 1.850341796875, 2.150390625, 2.450439453125, 2.75048828125, 3.050537109375, 3.3505859375, 3.650634765625, 3.95068359375, 4.250732421875, 4.55078125, 4.850830078125, 5.15087890625, 5.450927734375, 5.7509765625, 6.051025390625, 6.35107421875, 6.651123046875, 6.951171875, 7.251220703125, 7.55126953125, 7.851318359375, 8.1513671875, 8.451416015625, 8.75146484375, 9.051513671875, 9.3515625]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 7.0, 9.0, 10.0, 19.0, 24.0, 27.0, 44.0, 86.0, 102.0, 126.0, 165.0, 250.0, 322.0, 433.0, 591.0, 850.0, 1228.0, 1692.0, 2403.0, 3246.0, 4720.0, 6771.0, 9842.0, 14283.0, 20475.0, 30203.0, 44253.0, 66644.0, 99612.0, 147423.0, 177011.0, 134514.0, 90432.0, 60537.0, 40543.0, 27380.0, 19000.0, 13014.0, 8900.0, 6164.0, 4287.0, 3136.0, 2254.0, 1495.0, 1183.0, 796.0, 551.0, 409.0, 344.0, 223.0, 130.0, 118.0, 83.0, 59.0, 41.0, 30.0, 25.0, 16.0, 12.0, 9.0, 10.0, 3.0, 3.0], "bins": [-0.9169921875, -0.8877716064453125, -0.858551025390625, -0.8293304443359375, -0.80010986328125, -0.7708892822265625, -0.741668701171875, -0.7124481201171875, -0.6832275390625, -0.6540069580078125, -0.624786376953125, -0.5955657958984375, -0.56634521484375, -0.5371246337890625, -0.507904052734375, -0.4786834716796875, -0.449462890625, -0.4202423095703125, -0.391021728515625, -0.3618011474609375, -0.33258056640625, -0.3033599853515625, -0.274139404296875, -0.2449188232421875, -0.2156982421875, -0.1864776611328125, -0.157257080078125, -0.1280364990234375, -0.09881591796875, -0.0695953369140625, -0.040374755859375, -0.0111541748046875, 0.01806640625, 0.0472869873046875, 0.076507568359375, 0.1057281494140625, 0.13494873046875, 0.1641693115234375, 0.193389892578125, 0.2226104736328125, 0.2518310546875, 0.2810516357421875, 0.310272216796875, 0.3394927978515625, 0.36871337890625, 0.3979339599609375, 0.427154541015625, 0.4563751220703125, 0.485595703125, 0.5148162841796875, 0.544036865234375, 0.5732574462890625, 0.60247802734375, 0.6316986083984375, 0.660919189453125, 0.6901397705078125, 0.7193603515625, 0.7485809326171875, 0.777801513671875, 0.8070220947265625, 0.83624267578125, 0.8654632568359375, 0.894683837890625, 0.9239044189453125, 0.953125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 9.0, 9.0, 15.0, 11.0, 19.0, 21.0, 28.0, 26.0, 29.0, 33.0, 32.0, 34.0, 38.0, 50.0, 42.0, 46.0, 31.0, 1060.0, 25.0, 48.0, 54.0, 29.0, 33.0, 48.0, 27.0, 39.0, 27.0, 29.0, 19.0, 11.0, 13.0, 15.0, 9.0, 15.0, 7.0, 2.0, 7.0, 4.0, 6.0, 4.0, 2.0, 4.0, 4.0, 1.0, 2.0, 2.0], "bins": [-7.17578125, -6.97509765625, -6.7744140625, -6.57373046875, -6.373046875, -6.17236328125, -5.9716796875, -5.77099609375, -5.5703125, -5.36962890625, -5.1689453125, -4.96826171875, -4.767578125, -4.56689453125, -4.3662109375, -4.16552734375, -3.96484375, -3.76416015625, -3.5634765625, -3.36279296875, -3.162109375, -2.96142578125, -2.7607421875, -2.56005859375, -2.359375, -2.15869140625, -1.9580078125, -1.75732421875, -1.556640625, -1.35595703125, -1.1552734375, -0.95458984375, -0.75390625, -0.55322265625, -0.3525390625, -0.15185546875, 0.048828125, 0.24951171875, 0.4501953125, 0.65087890625, 0.8515625, 1.05224609375, 1.2529296875, 1.45361328125, 1.654296875, 1.85498046875, 2.0556640625, 2.25634765625, 2.45703125, 2.65771484375, 2.8583984375, 3.05908203125, 3.259765625, 3.46044921875, 3.6611328125, 3.86181640625, 4.0625, 4.26318359375, 4.4638671875, 4.66455078125, 4.865234375, 5.06591796875, 5.2666015625, 5.46728515625, 5.66796875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 6.0, 3.0, 10.0, 17.0, 25.0, 31.0, 67.0, 100.0, 114.0, 188.0, 228.0, 403.0, 600.0, 794.0, 1291.0, 1791.0, 2751.0, 4095.0, 6328.0, 10040.0, 16163.0, 25515.0, 40563.0, 64816.0, 103923.0, 163809.0, 1254447.0, 146797.0, 93626.0, 58252.0, 36629.0, 22927.0, 14419.0, 9226.0, 5831.0, 3748.0, 2521.0, 1589.0, 1117.0, 732.0, 482.0, 349.0, 235.0, 180.0, 112.0, 72.0, 48.0, 49.0, 25.0, 16.0, 17.0, 9.0, 6.0, 5.0, 0.0, 1.0], "bins": [-1.1123046875, -1.0799560546875, -1.047607421875, -1.0152587890625, -0.98291015625, -0.9505615234375, -0.918212890625, -0.8858642578125, -0.853515625, -0.8211669921875, -0.788818359375, -0.7564697265625, -0.72412109375, -0.6917724609375, -0.659423828125, -0.6270751953125, -0.5947265625, -0.5623779296875, -0.530029296875, -0.4976806640625, -0.46533203125, -0.4329833984375, -0.400634765625, -0.3682861328125, -0.3359375, -0.3035888671875, -0.271240234375, -0.2388916015625, -0.20654296875, -0.1741943359375, -0.141845703125, -0.1094970703125, -0.0771484375, -0.0447998046875, -0.012451171875, 0.0198974609375, 0.05224609375, 0.0845947265625, 0.116943359375, 0.1492919921875, 0.181640625, 0.2139892578125, 0.246337890625, 0.2786865234375, 0.31103515625, 0.3433837890625, 0.375732421875, 0.4080810546875, 0.4404296875, 0.4727783203125, 0.505126953125, 0.5374755859375, 0.56982421875, 0.6021728515625, 0.634521484375, 0.6668701171875, 0.69921875, 0.7315673828125, 0.763916015625, 0.7962646484375, 0.82861328125, 0.8609619140625, 0.893310546875, 0.9256591796875, 0.9580078125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 4.0, 8.0, 9.0, 12.0, 14.0, 15.0, 25.0, 25.0, 45.0, 60.0, 53.0, 81.0, 81.0, 91.0, 92.0, 74.0, 78.0, 65.0, 40.0, 45.0, 25.0, 19.0, 16.0, 10.0, 7.0, 7.0, 4.0, 0.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00656890869140625, -0.006390750408172607, -0.006212592124938965, -0.006034433841705322, -0.00585627555847168, -0.005678117275238037, -0.0054999589920043945, -0.005321800708770752, -0.005143642425537109, -0.004965484142303467, -0.004787325859069824, -0.004609167575836182, -0.004431009292602539, -0.0042528510093688965, -0.004074692726135254, -0.0038965344429016113, -0.0037183761596679688, -0.003540217876434326, -0.0033620595932006836, -0.003183901309967041, -0.0030057430267333984, -0.002827584743499756, -0.0026494264602661133, -0.0024712681770324707, -0.002293109893798828, -0.0021149516105651855, -0.001936793327331543, -0.0017586350440979004, -0.0015804767608642578, -0.0014023184776306152, -0.0012241601943969727, -0.00104600191116333, -0.0008678436279296875, -0.0006896853446960449, -0.0005115270614624023, -0.00033336877822875977, -0.0001552104949951172, 2.294778823852539e-05, 0.00020110607147216797, 0.00037926435470581055, 0.0005574226379394531, 0.0007355809211730957, 0.0009137392044067383, 0.0010918974876403809, 0.0012700557708740234, 0.001448214054107666, 0.0016263723373413086, 0.0018045306205749512, 0.0019826889038085938, 0.0021608471870422363, 0.002339005470275879, 0.0025171637535095215, 0.002695322036743164, 0.0028734803199768066, 0.0030516386032104492, 0.003229796886444092, 0.0034079551696777344, 0.003586113452911377, 0.0037642717361450195, 0.003942430019378662, 0.004120588302612305, 0.004298746585845947, 0.00447690486907959, 0.004655063152313232, 0.004833221435546875]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 7.0, 4.0, 12.0, 20.0, 19.0, 24.0, 28.0, 46.0, 91.0, 107.0, 206.0, 327.0, 639.0, 1800.0, 1035797.0, 7482.0, 858.0, 392.0, 217.0, 164.0, 93.0, 58.0, 47.0, 39.0, 25.0, 18.0, 12.0, 13.0, 6.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09039306640625, -0.08712577819824219, -0.08385848999023438, -0.08059120178222656, -0.07732391357421875, -0.07405662536621094, -0.07078933715820312, -0.06752204895019531, -0.0642547607421875, -0.06098747253417969, -0.057720184326171875, -0.05445289611816406, -0.05118560791015625, -0.04791831970214844, -0.044651031494140625, -0.04138374328613281, -0.038116455078125, -0.03484916687011719, -0.031581878662109375, -0.028314590454101562, -0.02504730224609375, -0.021780014038085938, -0.018512725830078125, -0.015245437622070312, -0.0119781494140625, -0.008710861206054688, -0.005443572998046875, -0.0021762847900390625, 0.00109100341796875, 0.0043582916259765625, 0.007625579833984375, 0.010892868041992188, 0.01416015625, 0.017427444458007812, 0.020694732666015625, 0.023962020874023438, 0.02722930908203125, 0.030496597290039062, 0.033763885498046875, 0.03703117370605469, 0.0402984619140625, 0.04356575012207031, 0.046833038330078125, 0.05010032653808594, 0.05336761474609375, 0.05663490295410156, 0.059902191162109375, 0.06316947937011719, 0.066436767578125, 0.06970405578613281, 0.07297134399414062, 0.07623863220214844, 0.07950592041015625, 0.08277320861816406, 0.08604049682617188, 0.08930778503417969, 0.0925750732421875, 0.09584236145019531, 0.09910964965820312, 0.10237693786621094, 0.10564422607421875, 0.10891151428222656, 0.11217880249023438, 0.11544609069824219, 0.11871337890625]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 10.0, 18.0, 59.0, 131.0, 194.0, 237.0, 189.0, 98.0, 42.0, 14.0, 10.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.001381204230710864, -0.001268543885089457, -0.00115588353946805, -0.0010432233102619648, -0.0009305629646405578, -0.0008179026190191507, -0.0007052423316054046, -0.0005925820441916585, -0.00047992169857025146, -0.0003672613820526749, -0.0002546010655350983, -0.00014194074901752174, -2.9280432499945164e-05, 8.337991312146187e-05, 0.000196040200535208, 0.0003087004879489541, 0.00042136083357036114, 0.0005340211791917682, 0.0006466814666055143, 0.0007593417540192604, 0.0008720020996406674, 0.0009846624452620745, 0.0010973226744681597, 0.0012099830200895667, 0.0013226433657109737, 0.0014353037113323808, 0.0015479640569537878, 0.001660624286159873, 0.00177328463178128, 0.001885944977402687, 0.0019986052066087723, 0.0021112654358148575, 0.00222392613068223, 0.002336586359888315, 0.002449246821925044, 0.0025619070511311293, 0.002674567513167858, 0.0027872277423739433, 0.0028998879715800285, 0.0030125482007861137, 0.0031252086628228426, 0.003237868892028928, 0.0033505293540656567, 0.003463189583271742, 0.003575849812477827, 0.003688510274514556, 0.003801170503720641, 0.00391383096575737, 0.004026491194963455, 0.00413915142416954, 0.004251811653375626, 0.004364472348242998, 0.004477132577449083, 0.0045897928066551685, 0.004702453035861254, 0.004815113265067339, 0.0049277739599347115, 0.005040434189140797, 0.005153094418346882, 0.005265755113214254, 0.00537841534242034, 0.005491075571626425, 0.00560373580083251, 0.005716396030038595, 0.00582905625924468]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 9.0, 8.0, 7.0, 12.0, 19.0, 7.0, 19.0, 13.0, 17.0, 22.0, 33.0, 22.0, 28.0, 31.0, 38.0, 40.0, 39.0, 48.0, 36.0, 39.0, 37.0, 39.0, 29.0, 43.0, 40.0, 33.0, 28.0, 25.0, 42.0, 33.0, 24.0, 26.0, 18.0, 15.0, 17.0, 12.0, 9.0, 5.0, 10.0, 6.0, 10.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.002001047134399414, -0.0019390583038330078, -0.0018770694732666016, -0.0018150806427001953, -0.001753091812133789, -0.0016911029815673828, -0.0016291141510009766, -0.0015671253204345703, -0.001505136489868164, -0.0014431476593017578, -0.0013811588287353516, -0.0013191699981689453, -0.001257181167602539, -0.0011951923370361328, -0.0011332035064697266, -0.0010712146759033203, -0.001009225845336914, -0.0009472370147705078, -0.0008852481842041016, -0.0008232593536376953, -0.0007612705230712891, -0.0006992816925048828, -0.0006372928619384766, -0.0005753040313720703, -0.0005133152008056641, -0.0004513263702392578, -0.00038933753967285156, -0.0003273487091064453, -0.00026535987854003906, -0.0002033710479736328, -0.00014138221740722656, -7.939338684082031e-05, -1.7404556274414062e-05, 4.458427429199219e-05, 0.00010657310485839844, 0.0001685619354248047, 0.00023055076599121094, 0.0002925395965576172, 0.00035452842712402344, 0.0004165172576904297, 0.00047850608825683594, 0.0005404949188232422, 0.0006024837493896484, 0.0006644725799560547, 0.0007264614105224609, 0.0007884502410888672, 0.0008504390716552734, 0.0009124279022216797, 0.0009744167327880859, 0.0010364055633544922, 0.0010983943939208984, 0.0011603832244873047, 0.001222372055053711, 0.0012843608856201172, 0.0013463497161865234, 0.0014083385467529297, 0.001470327377319336, 0.0015323162078857422, 0.0015943050384521484, 0.0016562938690185547, 0.001718282699584961, 0.0017802715301513672, 0.0018422603607177734, 0.0019042491912841797, 0.001966238021850586]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 0.0, 3.0, 5.0, 3.0, 4.0, 6.0, 15.0, 15.0, 6.0, 18.0, 12.0, 18.0, 16.0, 27.0, 19.0, 23.0, 25.0, 33.0, 32.0, 36.0, 32.0, 48.0, 35.0, 37.0, 39.0, 39.0, 35.0, 38.0, 38.0, 33.0, 34.0, 33.0, 33.0, 34.0, 26.0, 17.0, 18.0, 21.0, 19.0, 14.0, 13.0, 6.0, 10.0, 8.0, 3.0, 6.0, 4.0, 6.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-9.8515625, -9.551513671875, -9.25146484375, -8.951416015625, -8.6513671875, -8.351318359375, -8.05126953125, -7.751220703125, -7.451171875, -7.151123046875, -6.85107421875, -6.551025390625, -6.2509765625, -5.950927734375, -5.65087890625, -5.350830078125, -5.05078125, -4.750732421875, -4.45068359375, -4.150634765625, -3.8505859375, -3.550537109375, -3.25048828125, -2.950439453125, -2.650390625, -2.350341796875, -2.05029296875, -1.750244140625, -1.4501953125, -1.150146484375, -0.85009765625, -0.550048828125, -0.25, 0.050048828125, 0.35009765625, 0.650146484375, 0.9501953125, 1.250244140625, 1.55029296875, 1.850341796875, 2.150390625, 2.450439453125, 2.75048828125, 3.050537109375, 3.3505859375, 3.650634765625, 3.95068359375, 4.250732421875, 4.55078125, 4.850830078125, 5.15087890625, 5.450927734375, 5.7509765625, 6.051025390625, 6.35107421875, 6.651123046875, 6.951171875, 7.251220703125, 7.55126953125, 7.851318359375, 8.1513671875, 8.451416015625, 8.75146484375, 9.051513671875, 9.3515625]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 5.0, 3.0, 7.0, 8.0, 3.0, 16.0, 10.0, 28.0, 27.0, 45.0, 52.0, 56.0, 76.0, 102.0, 147.0, 195.0, 222.0, 251.0, 347.0, 456.0, 516.0, 716.0, 963.0, 1370.0, 2226.0, 5323.0, 19559.0, 91695.0, 414957.0, 393444.0, 84770.0, 18211.0, 5137.0, 2087.0, 1339.0, 929.0, 724.0, 528.0, 410.0, 350.0, 280.0, 237.0, 190.0, 117.0, 92.0, 74.0, 71.0, 46.0, 44.0, 23.0, 18.0, 16.0, 10.0, 9.0, 6.0, 6.0, 7.0, 9.0, 2.0, 1.0, 1.0], "bins": [-15.515625, -15.0303955078125, -14.545166015625, -14.0599365234375, -13.57470703125, -13.0894775390625, -12.604248046875, -12.1190185546875, -11.6337890625, -11.1485595703125, -10.663330078125, -10.1781005859375, -9.69287109375, -9.2076416015625, -8.722412109375, -8.2371826171875, -7.751953125, -7.2667236328125, -6.781494140625, -6.2962646484375, -5.81103515625, -5.3258056640625, -4.840576171875, -4.3553466796875, -3.8701171875, -3.3848876953125, -2.899658203125, -2.4144287109375, -1.92919921875, -1.4439697265625, -0.958740234375, -0.4735107421875, 0.01171875, 0.4969482421875, 0.982177734375, 1.4674072265625, 1.95263671875, 2.4378662109375, 2.923095703125, 3.4083251953125, 3.8935546875, 4.3787841796875, 4.864013671875, 5.3492431640625, 5.83447265625, 6.3197021484375, 6.804931640625, 7.2901611328125, 7.775390625, 8.2606201171875, 8.745849609375, 9.2310791015625, 9.71630859375, 10.2015380859375, 10.686767578125, 11.1719970703125, 11.6572265625, 12.1424560546875, 12.627685546875, 13.1129150390625, 13.59814453125, 14.0833740234375, 14.568603515625, 15.0538330078125, 15.5390625]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 4.0, 3.0, 8.0, 7.0, 10.0, 10.0, 10.0, 11.0, 17.0, 20.0, 18.0, 27.0, 41.0, 32.0, 44.0, 47.0, 43.0, 66.0, 94.0, 209.0, 1457.0, 293.0, 132.0, 70.0, 50.0, 44.0, 42.0, 32.0, 35.0, 34.0, 17.0, 18.0, 21.0, 16.0, 9.0, 13.0, 15.0, 3.0, 7.0, 9.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.75, -22.923828125, -22.09765625, -21.271484375, -20.4453125, -19.619140625, -18.79296875, -17.966796875, -17.140625, -16.314453125, -15.48828125, -14.662109375, -13.8359375, -13.009765625, -12.18359375, -11.357421875, -10.53125, -9.705078125, -8.87890625, -8.052734375, -7.2265625, -6.400390625, -5.57421875, -4.748046875, -3.921875, -3.095703125, -2.26953125, -1.443359375, -0.6171875, 0.208984375, 1.03515625, 1.861328125, 2.6875, 3.513671875, 4.33984375, 5.166015625, 5.9921875, 6.818359375, 7.64453125, 8.470703125, 9.296875, 10.123046875, 10.94921875, 11.775390625, 12.6015625, 13.427734375, 14.25390625, 15.080078125, 15.90625, 16.732421875, 17.55859375, 18.384765625, 19.2109375, 20.037109375, 20.86328125, 21.689453125, 22.515625, 23.341796875, 24.16796875, 24.994140625, 25.8203125, 26.646484375, 27.47265625, 28.298828125, 29.125]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 2.0, 6.0, 5.0, 5.0, 9.0, 8.0, 6.0, 11.0, 19.0, 25.0, 25.0, 35.0, 45.0, 54.0, 85.0, 122.0, 178.0, 310.0, 544.0, 1316.0, 19745.0, 3115913.0, 4798.0, 1074.0, 482.0, 284.0, 173.0, 113.0, 69.0, 55.0, 52.0, 37.0, 22.0, 22.0, 16.0, 12.0, 11.0, 5.0, 8.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-78.4375, -75.6728515625, -72.908203125, -70.1435546875, -67.37890625, -64.6142578125, -61.849609375, -59.0849609375, -56.3203125, -53.5556640625, -50.791015625, -48.0263671875, -45.26171875, -42.4970703125, -39.732421875, -36.9677734375, -34.203125, -31.4384765625, -28.673828125, -25.9091796875, -23.14453125, -20.3798828125, -17.615234375, -14.8505859375, -12.0859375, -9.3212890625, -6.556640625, -3.7919921875, -1.02734375, 1.7373046875, 4.501953125, 7.2666015625, 10.03125, 12.7958984375, 15.560546875, 18.3251953125, 21.08984375, 23.8544921875, 26.619140625, 29.3837890625, 32.1484375, 34.9130859375, 37.677734375, 40.4423828125, 43.20703125, 45.9716796875, 48.736328125, 51.5009765625, 54.265625, 57.0302734375, 59.794921875, 62.5595703125, 65.32421875, 68.0888671875, 70.853515625, 73.6181640625, 76.3828125, 79.1474609375, 81.912109375, 84.6767578125, 87.44140625, 90.2060546875, 92.970703125, 95.7353515625, 98.5]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 338.0, 671.0, 8.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-332.6045837402344, -318.2112121582031, -303.81781005859375, -289.4244384765625, -275.03106689453125, -260.6376953125, -246.2443084716797, -231.85092163085938, -217.45755004882812, -203.06417846679688, -188.67079162597656, -174.27740478515625, -159.884033203125, -145.49066162109375, -131.09727478027344, -116.70389556884766, -102.31051635742188, -87.9171371459961, -73.52375793457031, -59.13037872314453, -44.73699951171875, -30.34362030029297, -15.950241088867188, -1.5568618774414062, 12.836517333984375, 27.229896545410156, 41.62327575683594, 56.01665496826172, 70.4100341796875, 84.80341339111328, 99.19679260253906, 113.59017181396484, 127.98358154296875, 142.376953125, 156.7703399658203, 171.16372680664062, 185.55709838867188, 199.95046997070312, 214.34385681152344, 228.73724365234375, 243.130615234375, 257.52398681640625, 271.9173583984375, 286.3107604980469, 300.7041320800781, 315.0975036621094, 329.49090576171875, 343.88427734375, 358.27764892578125, 372.6710205078125, 387.06439208984375, 401.4577941894531, 415.8511657714844, 430.2445373535156, 444.637939453125, 459.03131103515625, 473.4246826171875, 487.81805419921875, 502.21142578125, 516.6047973632812, 530.9981689453125, 545.3916015625, 559.7849731445312, 574.1783447265625, 588.5717163085938]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 8.0, 4.0, 10.0, 8.0, 9.0, 8.0, 9.0, 23.0, 17.0, 20.0, 22.0, 28.0, 27.0, 34.0, 30.0, 34.0, 35.0, 39.0, 38.0, 35.0, 38.0, 36.0, 41.0, 40.0, 38.0, 37.0, 37.0, 42.0, 40.0, 25.0, 23.0, 26.0, 18.0, 24.0, 14.0, 15.0, 15.0, 8.0, 8.0, 5.0, 8.0, 3.0, 5.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-69.458740234375, -67.30242919921875, -65.1461181640625, -62.98979949951172, -60.83348846435547, -58.67717742919922, -56.5208625793457, -54.36454772949219, -52.20823669433594, -50.05192565917969, -47.89561080932617, -45.739295959472656, -43.582984924316406, -41.426673889160156, -39.27035903930664, -37.114044189453125, -34.957733154296875, -32.801422119140625, -30.64510726928711, -28.488794326782227, -26.332481384277344, -24.17616844177246, -22.019855499267578, -19.863542556762695, -17.707229614257812, -15.55091667175293, -13.394603729248047, -11.238290786743164, -9.081977844238281, -6.925664901733398, -4.769351959228516, -2.613039016723633, -0.45672607421875, 1.6995868682861328, 3.8558998107910156, 6.012212753295898, 8.168525695800781, 10.324838638305664, 12.481151580810547, 14.63746452331543, 16.793777465820312, 18.950090408325195, 21.106403350830078, 23.26271629333496, 25.419029235839844, 27.575342178344727, 29.73165512084961, 31.887968063354492, 34.044281005859375, 36.200592041015625, 38.35690689086914, 40.513221740722656, 42.669532775878906, 44.825843811035156, 46.98215866088867, 49.13847351074219, 51.29478454589844, 53.45109558105469, 55.6074104309082, 57.76372528076172, 59.92003631591797, 62.07634735107422, 64.232666015625, 66.38897705078125, 68.5452880859375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 6.0, 2.0, 4.0, 2.0, 8.0, 11.0, 10.0, 5.0, 11.0, 6.0, 6.0, 14.0, 21.0, 26.0, 24.0, 20.0, 27.0, 31.0, 27.0, 36.0, 37.0, 39.0, 39.0, 28.0, 32.0, 49.0, 38.0, 45.0, 38.0, 43.0, 36.0, 32.0, 29.0, 34.0, 18.0, 25.0, 20.0, 28.0, 16.0, 15.0, 12.0, 12.0, 11.0, 7.0, 5.0, 6.0, 4.0, 3.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.9140625, -9.6072998046875, -9.300537109375, -8.9937744140625, -8.68701171875, -8.3802490234375, -8.073486328125, -7.7667236328125, -7.4599609375, -7.1531982421875, -6.846435546875, -6.5396728515625, -6.23291015625, -5.9261474609375, -5.619384765625, -5.3126220703125, -5.005859375, -4.6990966796875, -4.392333984375, -4.0855712890625, -3.77880859375, -3.4720458984375, -3.165283203125, -2.8585205078125, -2.5517578125, -2.2449951171875, -1.938232421875, -1.6314697265625, -1.32470703125, -1.0179443359375, -0.711181640625, -0.4044189453125, -0.09765625, 0.2091064453125, 0.515869140625, 0.8226318359375, 1.12939453125, 1.4361572265625, 1.742919921875, 2.0496826171875, 2.3564453125, 2.6632080078125, 2.969970703125, 3.2767333984375, 3.58349609375, 3.8902587890625, 4.197021484375, 4.5037841796875, 4.810546875, 5.1173095703125, 5.424072265625, 5.7308349609375, 6.03759765625, 6.3443603515625, 6.651123046875, 6.9578857421875, 7.2646484375, 7.5714111328125, 7.878173828125, 8.1849365234375, 8.49169921875, 8.7984619140625, 9.105224609375, 9.4119873046875, 9.71875]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 8.0, 5.0, 14.0, 18.0, 26.0, 30.0, 45.0, 48.0, 65.0, 84.0, 106.0, 136.0, 197.0, 366.0, 820.0, 3155.0, 23128.0, 663560.0, 3232201.0, 254320.0, 12195.0, 2106.0, 622.0, 281.0, 175.0, 126.0, 101.0, 86.0, 59.0, 51.0, 37.0, 31.0, 27.0, 13.0, 12.0, 12.0, 3.0, 5.0, 6.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-40.34375, -39.292236328125, -38.24072265625, -37.189208984375, -36.1376953125, -35.086181640625, -34.03466796875, -32.983154296875, -31.931640625, -30.880126953125, -29.82861328125, -28.777099609375, -27.7255859375, -26.674072265625, -25.62255859375, -24.571044921875, -23.51953125, -22.468017578125, -21.41650390625, -20.364990234375, -19.3134765625, -18.261962890625, -17.21044921875, -16.158935546875, -15.107421875, -14.055908203125, -13.00439453125, -11.952880859375, -10.9013671875, -9.849853515625, -8.79833984375, -7.746826171875, -6.6953125, -5.643798828125, -4.59228515625, -3.540771484375, -2.4892578125, -1.437744140625, -0.38623046875, 0.665283203125, 1.716796875, 2.768310546875, 3.81982421875, 4.871337890625, 5.9228515625, 6.974365234375, 8.02587890625, 9.077392578125, 10.12890625, 11.180419921875, 12.23193359375, 13.283447265625, 14.3349609375, 15.386474609375, 16.43798828125, 17.489501953125, 18.541015625, 19.592529296875, 20.64404296875, 21.695556640625, 22.7470703125, 23.798583984375, 24.85009765625, 25.901611328125, 26.953125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 6.0, 3.0, 4.0, 6.0, 7.0, 6.0, 19.0, 14.0, 27.0, 42.0, 53.0, 83.0, 112.0, 113.0, 179.0, 196.0, 363.0, 488.0, 583.0, 537.0, 380.0, 229.0, 172.0, 105.0, 96.0, 74.0, 52.0, 40.0, 25.0, 21.0, 14.0, 7.0, 9.0, 6.0, 10.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.390625, -17.700439453125, -17.01025390625, -16.320068359375, -15.6298828125, -14.939697265625, -14.24951171875, -13.559326171875, -12.869140625, -12.178955078125, -11.48876953125, -10.798583984375, -10.1083984375, -9.418212890625, -8.72802734375, -8.037841796875, -7.34765625, -6.657470703125, -5.96728515625, -5.277099609375, -4.5869140625, -3.896728515625, -3.20654296875, -2.516357421875, -1.826171875, -1.135986328125, -0.44580078125, 0.244384765625, 0.9345703125, 1.624755859375, 2.31494140625, 3.005126953125, 3.6953125, 4.385498046875, 5.07568359375, 5.765869140625, 6.4560546875, 7.146240234375, 7.83642578125, 8.526611328125, 9.216796875, 9.906982421875, 10.59716796875, 11.287353515625, 11.9775390625, 12.667724609375, 13.35791015625, 14.048095703125, 14.73828125, 15.428466796875, 16.11865234375, 16.808837890625, 17.4990234375, 18.189208984375, 18.87939453125, 19.569580078125, 20.259765625, 20.949951171875, 21.64013671875, 22.330322265625, 23.0205078125, 23.710693359375, 24.40087890625, 25.091064453125, 25.78125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 5.0, 6.0, 9.0, 13.0, 39.0, 86.0, 203.0, 783.0, 7107.0, 4105707.0, 78019.0, 1637.0, 394.0, 144.0, 71.0, 27.0, 13.0, 9.0, 2.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-137.625, -133.875, -130.125, -126.375, -122.625, -118.875, -115.125, -111.375, -107.625, -103.875, -100.125, -96.375, -92.625, -88.875, -85.125, -81.375, -77.625, -73.875, -70.125, -66.375, -62.625, -58.875, -55.125, -51.375, -47.625, -43.875, -40.125, -36.375, -32.625, -28.875, -25.125, -21.375, -17.625, -13.875, -10.125, -6.375, -2.625, 1.125, 4.875, 8.625, 12.375, 16.125, 19.875, 23.625, 27.375, 31.125, 34.875, 38.625, 42.375, 46.125, 49.875, 53.625, 57.375, 61.125, 64.875, 68.625, 72.375, 76.125, 79.875, 83.625, 87.375, 91.125, 94.875, 98.625, 102.375]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 261.0, 749.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-387.3551330566406, -344.74444580078125, -302.13372802734375, -259.5230407714844, -216.91233825683594, -174.3016357421875, -131.69094848632812, -89.08023071289062, -46.46954345703125, -3.858844757080078, 38.751853942871094, 81.362548828125, 123.97325134277344, 166.58395385742188, 209.19464111328125, 251.80535888671875, 294.4160461425781, 337.0267333984375, 379.637451171875, 422.2481384277344, 464.85882568359375, 507.46954345703125, 550.0802001953125, 592.69091796875, 635.3016357421875, 677.912353515625, 720.5230102539062, 763.1337280273438, 805.7444458007812, 848.3551025390625, 890.9658203125, 933.5765380859375, 976.1871337890625, 1018.7978515625, 1061.4085693359375, 1104.019287109375, 1146.6298828125, 1189.2406005859375, 1231.851318359375, 1274.4620361328125, 1317.07275390625, 1359.6834716796875, 1402.294189453125, 1444.90478515625, 1487.5155029296875, 1530.126220703125, 1572.7369384765625, 1615.34765625, 1657.958251953125, 1700.5689697265625, 1743.1796875, 1785.790283203125, 1828.4010009765625, 1871.01171875, 1913.6224365234375, 1956.233154296875, 1998.8438720703125, 2041.45458984375, 2084.065185546875, 2126.676025390625, 2169.28662109375, 2211.8974609375, 2254.508056640625, 2297.11865234375, 2339.7294921875]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 7.0, 17.0, 18.0, 21.0, 23.0, 37.0, 40.0, 39.0, 55.0, 46.0, 76.0, 67.0, 62.0, 70.0, 79.0, 54.0, 57.0, 60.0, 38.0, 33.0, 21.0, 28.0, 19.0, 15.0, 8.0, 8.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-155.40496826171875, -151.6463165283203, -147.8876495361328, -144.12899780273438, -140.37033081054688, -136.61167907714844, -132.85301208496094, -129.0943603515625, -125.33570098876953, -121.57704162597656, -117.8183822631836, -114.05972290039062, -110.30107116699219, -106.54240417480469, -102.78375244140625, -99.02509307861328, -95.26643371582031, -91.50777435302734, -87.74911499023438, -83.9904556274414, -80.23179626464844, -76.47314453125, -72.71448516845703, -68.95582580566406, -65.1971664428711, -61.438507080078125, -57.679847717285156, -53.92119216918945, -50.162532806396484, -46.403873443603516, -42.64521789550781, -38.886558532714844, -35.127899169921875, -31.369239807128906, -27.61058235168457, -23.851924896240234, -20.093265533447266, -16.334606170654297, -12.575948715209961, -8.817291259765625, -5.058631896972656, -1.299973487854004, 2.4586849212646484, 6.217343330383301, 9.976001739501953, 13.734661102294922, 17.493318557739258, 21.251976013183594, 25.010635375976562, 28.76929473876953, 32.5279541015625, 36.2866096496582, 40.04526901245117, 43.80392837524414, 47.562583923339844, 51.32124328613281, 55.07990264892578, 58.83856201171875, 62.59722137451172, 66.35588073730469, 70.11453247070312, 73.87319946289062, 77.63185119628906, 81.39051055908203, 85.149169921875]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 0.0, 6.0, 2.0, 8.0, 9.0, 11.0, 9.0, 10.0, 15.0, 12.0, 17.0, 16.0, 12.0, 24.0, 21.0, 37.0, 31.0, 32.0, 36.0, 37.0, 39.0, 36.0, 43.0, 41.0, 41.0, 42.0, 44.0, 44.0, 37.0, 32.0, 27.0, 26.0, 33.0, 21.0, 28.0, 21.0, 19.0, 17.0, 12.0, 7.0, 9.0, 9.0, 9.0, 3.0, 5.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 1.0, 0.0, 4.0], "bins": [-8.3046875, -8.056396484375, -7.80810546875, -7.559814453125, -7.3115234375, -7.063232421875, -6.81494140625, -6.566650390625, -6.318359375, -6.070068359375, -5.82177734375, -5.573486328125, -5.3251953125, -5.076904296875, -4.82861328125, -4.580322265625, -4.33203125, -4.083740234375, -3.83544921875, -3.587158203125, -3.3388671875, -3.090576171875, -2.84228515625, -2.593994140625, -2.345703125, -2.097412109375, -1.84912109375, -1.600830078125, -1.3525390625, -1.104248046875, -0.85595703125, -0.607666015625, -0.359375, -0.111083984375, 0.13720703125, 0.385498046875, 0.6337890625, 0.882080078125, 1.13037109375, 1.378662109375, 1.626953125, 1.875244140625, 2.12353515625, 2.371826171875, 2.6201171875, 2.868408203125, 3.11669921875, 3.364990234375, 3.61328125, 3.861572265625, 4.10986328125, 4.358154296875, 4.6064453125, 4.854736328125, 5.10302734375, 5.351318359375, 5.599609375, 5.847900390625, 6.09619140625, 6.344482421875, 6.5927734375, 6.841064453125, 7.08935546875, 7.337646484375, 7.5859375]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 7.0, 7.0, 13.0, 20.0, 21.0, 40.0, 73.0, 86.0, 135.0, 191.0, 268.0, 429.0, 571.0, 818.0, 1172.0, 1723.0, 2569.0, 3736.0, 5641.0, 8513.0, 12709.0, 19494.0, 29645.0, 45598.0, 71336.0, 113047.0, 176860.0, 191906.0, 129753.0, 80551.0, 52027.0, 33595.0, 22081.0, 14411.0, 9554.0, 6488.0, 4265.0, 2934.0, 1987.0, 1321.0, 946.0, 639.0, 433.0, 288.0, 217.0, 141.0, 90.0, 78.0, 50.0, 37.0, 16.0, 18.0, 10.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.84716796875, -0.8199691772460938, -0.7927703857421875, -0.7655715942382812, -0.738372802734375, -0.7111740112304688, -0.6839752197265625, -0.6567764282226562, -0.62957763671875, -0.6023788452148438, -0.5751800537109375, -0.5479812622070312, -0.520782470703125, -0.49358367919921875, -0.4663848876953125, -0.43918609619140625, -0.4119873046875, -0.38478851318359375, -0.3575897216796875, -0.33039093017578125, -0.303192138671875, -0.27599334716796875, -0.2487945556640625, -0.22159576416015625, -0.19439697265625, -0.16719818115234375, -0.1399993896484375, -0.11280059814453125, -0.085601806640625, -0.05840301513671875, -0.0312042236328125, -0.00400543212890625, 0.023193359375, 0.05039215087890625, 0.0775909423828125, 0.10478973388671875, 0.131988525390625, 0.15918731689453125, 0.1863861083984375, 0.21358489990234375, 0.24078369140625, 0.26798248291015625, 0.2951812744140625, 0.32238006591796875, 0.349578857421875, 0.37677764892578125, 0.4039764404296875, 0.43117523193359375, 0.4583740234375, 0.48557281494140625, 0.5127716064453125, 0.5399703979492188, 0.567169189453125, 0.5943679809570312, 0.6215667724609375, 0.6487655639648438, 0.67596435546875, 0.7031631469726562, 0.7303619384765625, 0.7575607299804688, 0.784759521484375, 0.8119583129882812, 0.8391571044921875, 0.8663558959960938, 0.8935546875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 0.0, 6.0, 3.0, 17.0, 9.0, 9.0, 16.0, 20.0, 23.0, 26.0, 21.0, 25.0, 30.0, 34.0, 28.0, 35.0, 48.0, 42.0, 35.0, 48.0, 1055.0, 47.0, 40.0, 43.0, 32.0, 35.0, 45.0, 26.0, 38.0, 35.0, 31.0, 18.0, 13.0, 18.0, 11.0, 13.0, 16.0, 14.0, 3.0, 8.0, 5.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8203125, -4.646240234375, -4.47216796875, -4.298095703125, -4.1240234375, -3.949951171875, -3.77587890625, -3.601806640625, -3.427734375, -3.253662109375, -3.07958984375, -2.905517578125, -2.7314453125, -2.557373046875, -2.38330078125, -2.209228515625, -2.03515625, -1.861083984375, -1.68701171875, -1.512939453125, -1.3388671875, -1.164794921875, -0.99072265625, -0.816650390625, -0.642578125, -0.468505859375, -0.29443359375, -0.120361328125, 0.0537109375, 0.227783203125, 0.40185546875, 0.575927734375, 0.75, 0.924072265625, 1.09814453125, 1.272216796875, 1.4462890625, 1.620361328125, 1.79443359375, 1.968505859375, 2.142578125, 2.316650390625, 2.49072265625, 2.664794921875, 2.8388671875, 3.012939453125, 3.18701171875, 3.361083984375, 3.53515625, 3.709228515625, 3.88330078125, 4.057373046875, 4.2314453125, 4.405517578125, 4.57958984375, 4.753662109375, 4.927734375, 5.101806640625, 5.27587890625, 5.449951171875, 5.6240234375, 5.798095703125, 5.97216796875, 6.146240234375, 6.3203125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 5.0, 5.0, 2.0, 8.0, 6.0, 24.0, 27.0, 37.0, 67.0, 106.0, 147.0, 233.0, 362.0, 565.0, 886.0, 1356.0, 2217.0, 3423.0, 5408.0, 8415.0, 13625.0, 21570.0, 35265.0, 56950.0, 92432.0, 150157.0, 1263975.0, 167268.0, 103569.0, 64163.0, 39459.0, 24324.0, 15278.0, 9316.0, 5956.0, 3682.0, 2537.0, 1534.0, 1006.0, 656.0, 379.0, 281.0, 154.0, 115.0, 68.0, 49.0, 22.0, 23.0, 14.0, 5.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.84716796875, -0.8185653686523438, -0.7899627685546875, -0.7613601684570312, -0.732757568359375, -0.7041549682617188, -0.6755523681640625, -0.6469497680664062, -0.61834716796875, -0.5897445678710938, -0.5611419677734375, -0.5325393676757812, -0.503936767578125, -0.47533416748046875, -0.4467315673828125, -0.41812896728515625, -0.3895263671875, -0.36092376708984375, -0.3323211669921875, -0.30371856689453125, -0.275115966796875, -0.24651336669921875, -0.2179107666015625, -0.18930816650390625, -0.16070556640625, -0.13210296630859375, -0.1035003662109375, -0.07489776611328125, -0.046295166015625, -0.01769256591796875, 0.0109100341796875, 0.03951263427734375, 0.068115234375, 0.09671783447265625, 0.1253204345703125, 0.15392303466796875, 0.182525634765625, 0.21112823486328125, 0.2397308349609375, 0.26833343505859375, 0.29693603515625, 0.32553863525390625, 0.3541412353515625, 0.38274383544921875, 0.411346435546875, 0.43994903564453125, 0.4685516357421875, 0.49715423583984375, 0.5257568359375, 0.5543594360351562, 0.5829620361328125, 0.6115646362304688, 0.640167236328125, 0.6687698364257812, 0.6973724365234375, 0.7259750366210938, 0.75457763671875, 0.7831802368164062, 0.8117828369140625, 0.8403854370117188, 0.868988037109375, 0.8975906372070312, 0.9261932373046875, 0.9547958374023438, 0.9833984375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 10.0, 9.0, 10.0, 28.0, 20.0, 40.0, 51.0, 60.0, 73.0, 80.0, 72.0, 86.0, 66.0, 79.0, 66.0, 50.0, 48.0, 35.0, 18.0, 24.0, 26.0, 12.0, 15.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0043792724609375, -0.004252135753631592, -0.004124999046325684, -0.003997862339019775, -0.003870725631713867, -0.003743588924407959, -0.0036164522171020508, -0.0034893155097961426, -0.0033621788024902344, -0.003235042095184326, -0.003107905387878418, -0.0029807686805725098, -0.0028536319732666016, -0.0027264952659606934, -0.002599358558654785, -0.002472221851348877, -0.0023450851440429688, -0.0022179484367370605, -0.0020908117294311523, -0.001963675022125244, -0.001836538314819336, -0.0017094016075134277, -0.0015822649002075195, -0.0014551281929016113, -0.0013279914855957031, -0.001200854778289795, -0.0010737180709838867, -0.0009465813636779785, -0.0008194446563720703, -0.0006923079490661621, -0.0005651712417602539, -0.0004380345344543457, -0.0003108978271484375, -0.0001837611198425293, -5.6624412536621094e-05, 7.051229476928711e-05, 0.0001976490020751953, 0.0003247857093811035, 0.0004519224166870117, 0.0005790591239929199, 0.0007061958312988281, 0.0008333325386047363, 0.0009604692459106445, 0.0010876059532165527, 0.001214742660522461, 0.0013418793678283691, 0.0014690160751342773, 0.0015961527824401855, 0.0017232894897460938, 0.001850426197052002, 0.00197756290435791, 0.0021046996116638184, 0.0022318363189697266, 0.0023589730262756348, 0.002486109733581543, 0.002613246440887451, 0.0027403831481933594, 0.0028675198554992676, 0.0029946565628051758, 0.003121793270111084, 0.003248929977416992, 0.0033760666847229004, 0.0035032033920288086, 0.003630340099334717, 0.003757476806640625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 4.0, 2.0, 0.0, 6.0, 6.0, 15.0, 24.0, 29.0, 42.0, 52.0, 61.0, 93.0, 135.0, 222.0, 375.0, 744.0, 3912.0, 1035046.0, 5882.0, 783.0, 414.0, 223.0, 149.0, 98.0, 74.0, 45.0, 34.0, 25.0, 17.0, 6.0, 7.0, 7.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06988525390625, -0.0675191879272461, -0.06515312194824219, -0.06278705596923828, -0.060420989990234375, -0.05805492401123047, -0.05568885803222656, -0.053322792053222656, -0.05095672607421875, -0.048590660095214844, -0.04622459411621094, -0.04385852813720703, -0.041492462158203125, -0.03912639617919922, -0.03676033020019531, -0.034394264221191406, -0.0320281982421875, -0.029662132263183594, -0.027296066284179688, -0.02493000030517578, -0.022563934326171875, -0.02019786834716797, -0.017831802368164062, -0.015465736389160156, -0.01309967041015625, -0.010733604431152344, -0.008367538452148438, -0.006001472473144531, -0.003635406494140625, -0.0012693405151367188, 0.0010967254638671875, 0.0034627914428710938, 0.005828857421875, 0.008194923400878906, 0.010560989379882812, 0.012927055358886719, 0.015293121337890625, 0.01765918731689453, 0.020025253295898438, 0.022391319274902344, 0.02475738525390625, 0.027123451232910156, 0.029489517211914062, 0.03185558319091797, 0.034221649169921875, 0.03658771514892578, 0.03895378112792969, 0.041319847106933594, 0.0436859130859375, 0.046051979064941406, 0.04841804504394531, 0.05078411102294922, 0.053150177001953125, 0.05551624298095703, 0.05788230895996094, 0.060248374938964844, 0.06261444091796875, 0.06498050689697266, 0.06734657287597656, 0.06971263885498047, 0.07207870483398438, 0.07444477081298828, 0.07681083679199219, 0.0791769027709961, 0.08154296875]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 76.0, 490.0, 387.0, 54.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0017000561347231269, -0.0014108906034380198, -0.0011217249557375908, -0.0008325594244524837, -0.0005433938931673765, -0.0002542283618822694, 3.493728581815958e-05, 0.0003241027006879449, 0.0006132683483883739, 0.000902433879673481, 0.00119159952737391, 0.001480765058659017, 0.0017699305899441242, 0.0020590960048139095, 0.002348261885344982, 0.0026374273002147675, 0.0029265927150845528, 0.0032157583627849817, 0.003504923777654767, 0.003794089425355196, 0.004083254840224981, 0.004372420720756054, 0.004661586135625839, 0.0049507515504956245, 0.005239917431026697, 0.0055290828458964825, 0.005818248726427555, 0.00610741414129734, 0.006396579556167126, 0.006685744971036911, 0.006974910851567984, 0.007264076266437769, 0.007553241215646267, 0.007842406630516052, 0.008131572045385838, 0.008420737460255623, 0.008709903806447983, 0.008999069221317768, 0.009288234636187553, 0.009577400051057339, 0.009866565465927124, 0.01015573088079691, 0.010444896295666695, 0.010734062641859055, 0.01102322805672884, 0.011312393471598625, 0.01160155888646841, 0.011890724301338196, 0.012179890647530556, 0.012469056062400341, 0.012758221477270126, 0.013047387823462486, 0.013336553238332272, 0.013625718653202057, 0.013914884068071842, 0.014204049482941628, 0.014493214897811413, 0.014782380312681198, 0.015071545727550983, 0.015360711142420769, 0.01564987748861313, 0.01593904197216034, 0.0162282083183527, 0.01651737466454506, 0.01680653914809227]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 7.0, 7.0, 12.0, 20.0, 12.0, 17.0, 22.0, 21.0, 27.0, 26.0, 33.0, 35.0, 29.0, 27.0, 41.0, 50.0, 52.0, 43.0, 46.0, 58.0, 47.0, 38.0, 38.0, 22.0, 41.0, 26.0, 40.0, 33.0, 35.0, 22.0, 20.0, 12.0, 10.0, 9.0, 9.0, 7.0, 3.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001968204975128174, -0.0019109025597572327, -0.0018536001443862915, -0.0017962977290153503, -0.0017389953136444092, -0.001681692898273468, -0.0016243904829025269, -0.0015670880675315857, -0.0015097856521606445, -0.0014524832367897034, -0.0013951808214187622, -0.001337878406047821, -0.0012805759906768799, -0.0012232735753059387, -0.0011659711599349976, -0.0011086687445640564, -0.0010513663291931152, -0.000994063913822174, -0.0009367614984512329, -0.0008794590830802917, -0.0008221566677093506, -0.0007648542523384094, -0.0007075518369674683, -0.0006502494215965271, -0.0005929470062255859, -0.0005356445908546448, -0.0004783421754837036, -0.00042103976011276245, -0.0003637373447418213, -0.0003064349293708801, -0.00024913251399993896, -0.0001918300986289978, -0.00013452768325805664, -7.722526788711548e-05, -1.9922852516174316e-05, 3.7379562854766846e-05, 9.468197822570801e-05, 0.00015198439359664917, 0.00020928680896759033, 0.0002665892243385315, 0.00032389163970947266, 0.0003811940550804138, 0.000438496470451355, 0.0004957988858222961, 0.0005531013011932373, 0.0006104037165641785, 0.0006677061319351196, 0.0007250085473060608, 0.000782310962677002, 0.0008396133780479431, 0.0008969157934188843, 0.0009542182087898254, 0.0010115206241607666, 0.0010688230395317078, 0.001126125454902649, 0.00118342787027359, 0.0012407302856445312, 0.0012980327010154724, 0.0013553351163864136, 0.0014126375317573547, 0.001469939947128296, 0.001527242362499237, 0.0015845447778701782, 0.0016418471932411194, 0.0016991496086120605]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 0.0, 6.0, 2.0, 8.0, 9.0, 11.0, 9.0, 10.0, 15.0, 12.0, 16.0, 17.0, 12.0, 24.0, 21.0, 37.0, 31.0, 32.0, 36.0, 37.0, 39.0, 36.0, 43.0, 41.0, 41.0, 42.0, 43.0, 45.0, 37.0, 32.0, 27.0, 26.0, 33.0, 21.0, 28.0, 21.0, 19.0, 17.0, 12.0, 7.0, 9.0, 9.0, 9.0, 3.0, 5.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 1.0, 0.0, 4.0], "bins": [-8.3046875, -8.056396484375, -7.80810546875, -7.559814453125, -7.3115234375, -7.063232421875, -6.81494140625, -6.566650390625, -6.318359375, -6.070068359375, -5.82177734375, -5.573486328125, -5.3251953125, -5.076904296875, -4.82861328125, -4.580322265625, -4.33203125, -4.083740234375, -3.83544921875, -3.587158203125, -3.3388671875, -3.090576171875, -2.84228515625, -2.593994140625, -2.345703125, -2.097412109375, -1.84912109375, -1.600830078125, -1.3525390625, -1.104248046875, -0.85595703125, -0.607666015625, -0.359375, -0.111083984375, 0.13720703125, 0.385498046875, 0.6337890625, 0.882080078125, 1.13037109375, 1.378662109375, 1.626953125, 1.875244140625, 2.12353515625, 2.371826171875, 2.6201171875, 2.868408203125, 3.11669921875, 3.364990234375, 3.61328125, 3.861572265625, 4.10986328125, 4.358154296875, 4.6064453125, 4.854736328125, 5.10302734375, 5.351318359375, 5.599609375, 5.847900390625, 6.09619140625, 6.344482421875, 6.5927734375, 6.841064453125, 7.08935546875, 7.337646484375, 7.5859375]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 2.0, 5.0, 4.0, 3.0, 7.0, 15.0, 19.0, 32.0, 32.0, 50.0, 68.0, 59.0, 113.0, 129.0, 183.0, 269.0, 389.0, 514.0, 754.0, 1060.0, 1584.0, 2395.0, 4896.0, 17327.0, 152439.0, 715610.0, 123842.0, 14914.0, 4422.0, 2392.0, 1488.0, 989.0, 683.0, 485.0, 358.0, 269.0, 196.0, 140.0, 105.0, 72.0, 66.0, 44.0, 34.0, 30.0, 17.0, 14.0, 11.0, 9.0, 2.0, 4.0, 6.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-20.8125, -20.15087890625, -19.4892578125, -18.82763671875, -18.166015625, -17.50439453125, -16.8427734375, -16.18115234375, -15.51953125, -14.85791015625, -14.1962890625, -13.53466796875, -12.873046875, -12.21142578125, -11.5498046875, -10.88818359375, -10.2265625, -9.56494140625, -8.9033203125, -8.24169921875, -7.580078125, -6.91845703125, -6.2568359375, -5.59521484375, -4.93359375, -4.27197265625, -3.6103515625, -2.94873046875, -2.287109375, -1.62548828125, -0.9638671875, -0.30224609375, 0.359375, 1.02099609375, 1.6826171875, 2.34423828125, 3.005859375, 3.66748046875, 4.3291015625, 4.99072265625, 5.65234375, 6.31396484375, 6.9755859375, 7.63720703125, 8.298828125, 8.96044921875, 9.6220703125, 10.28369140625, 10.9453125, 11.60693359375, 12.2685546875, 12.93017578125, 13.591796875, 14.25341796875, 14.9150390625, 15.57666015625, 16.23828125, 16.89990234375, 17.5615234375, 18.22314453125, 18.884765625, 19.54638671875, 20.2080078125, 20.86962890625, 21.53125]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 3.0, 9.0, 6.0, 10.0, 5.0, 13.0, 12.0, 14.0, 21.0, 18.0, 32.0, 31.0, 26.0, 39.0, 44.0, 59.0, 97.0, 166.0, 1473.0, 392.0, 153.0, 80.0, 53.0, 42.0, 48.0, 26.0, 27.0, 34.0, 24.0, 18.0, 22.0, 10.0, 7.0, 6.0, 5.0, 7.0, 5.0, 4.0, 6.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.109375, -21.258056640625, -20.40673828125, -19.555419921875, -18.7041015625, -17.852783203125, -17.00146484375, -16.150146484375, -15.298828125, -14.447509765625, -13.59619140625, -12.744873046875, -11.8935546875, -11.042236328125, -10.19091796875, -9.339599609375, -8.48828125, -7.636962890625, -6.78564453125, -5.934326171875, -5.0830078125, -4.231689453125, -3.38037109375, -2.529052734375, -1.677734375, -0.826416015625, 0.02490234375, 0.876220703125, 1.7275390625, 2.578857421875, 3.43017578125, 4.281494140625, 5.1328125, 5.984130859375, 6.83544921875, 7.686767578125, 8.5380859375, 9.389404296875, 10.24072265625, 11.092041015625, 11.943359375, 12.794677734375, 13.64599609375, 14.497314453125, 15.3486328125, 16.199951171875, 17.05126953125, 17.902587890625, 18.75390625, 19.605224609375, 20.45654296875, 21.307861328125, 22.1591796875, 23.010498046875, 23.86181640625, 24.713134765625, 25.564453125, 26.415771484375, 27.26708984375, 28.118408203125, 28.9697265625, 29.821044921875, 30.67236328125, 31.523681640625, 32.375]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 8.0, 5.0, 4.0, 5.0, 10.0, 10.0, 14.0, 28.0, 45.0, 39.0, 58.0, 64.0, 82.0, 114.0, 205.0, 325.0, 651.0, 1714.0, 185548.0, 2952298.0, 2556.0, 793.0, 362.0, 222.0, 145.0, 87.0, 76.0, 52.0, 44.0, 37.0, 24.0, 19.0, 12.0, 16.0, 12.0, 3.0, 8.0, 6.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-88.25, -85.806640625, -83.36328125, -80.919921875, -78.4765625, -76.033203125, -73.58984375, -71.146484375, -68.703125, -66.259765625, -63.81640625, -61.373046875, -58.9296875, -56.486328125, -54.04296875, -51.599609375, -49.15625, -46.712890625, -44.26953125, -41.826171875, -39.3828125, -36.939453125, -34.49609375, -32.052734375, -29.609375, -27.166015625, -24.72265625, -22.279296875, -19.8359375, -17.392578125, -14.94921875, -12.505859375, -10.0625, -7.619140625, -5.17578125, -2.732421875, -0.2890625, 2.154296875, 4.59765625, 7.041015625, 9.484375, 11.927734375, 14.37109375, 16.814453125, 19.2578125, 21.701171875, 24.14453125, 26.587890625, 29.03125, 31.474609375, 33.91796875, 36.361328125, 38.8046875, 41.248046875, 43.69140625, 46.134765625, 48.578125, 51.021484375, 53.46484375, 55.908203125, 58.3515625, 60.794921875, 63.23828125, 65.681640625, 68.125]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [10.0, 224.0, 622.0, 150.0, 13.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.084012985229492, -11.205876350402832, -3.327739715576172, 4.550397872924805, 12.428533554077148, 20.306669235229492, 28.1848087310791, 36.06294250488281, 43.941078186035156, 51.8192138671875, 59.697349548339844, 67.57548522949219, 75.45362854003906, 83.33175659179688, 91.20989990234375, 99.0880355834961, 106.96617126464844, 114.84430694580078, 122.72244262695312, 130.6005859375, 138.4787139892578, 146.3568572998047, 154.2349853515625, 162.11312866210938, 169.99127197265625, 177.86941528320312, 185.74754333496094, 193.6256866455078, 201.50381469726562, 209.3819580078125, 217.26010131835938, 225.1382293701172, 233.016357421875, 240.89450073242188, 248.7726287841797, 256.6507568359375, 264.5289001464844, 272.40704345703125, 280.2851867675781, 288.163330078125, 296.04144287109375, 303.9195861816406, 311.7977294921875, 319.67584228515625, 327.5539855957031, 335.43212890625, 343.3102722167969, 351.18841552734375, 359.0665283203125, 366.9446716308594, 374.82281494140625, 382.700927734375, 390.5790710449219, 398.45721435546875, 406.3353576660156, 414.2135009765625, 422.0916442871094, 429.96978759765625, 437.8479309082031, 445.7260437011719, 453.60418701171875, 461.4823303222656, 469.3604736328125, 477.23858642578125, 485.1167297363281]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 6.0, 4.0, 13.0, 3.0, 11.0, 17.0, 12.0, 27.0, 18.0, 17.0, 30.0, 31.0, 24.0, 35.0, 38.0, 37.0, 40.0, 50.0, 39.0, 47.0, 45.0, 45.0, 46.0, 46.0, 39.0, 40.0, 37.0, 34.0, 34.0, 24.0, 18.0, 15.0, 20.0, 12.0, 9.0, 10.0, 9.0, 5.0, 3.0, 5.0, 1.0, 4.0, 0.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-69.57427978515625, -67.2948226928711, -65.0153579711914, -62.73590087890625, -60.456443786621094, -58.17698287963867, -55.89752197265625, -53.618064880371094, -51.33860397338867, -49.05914306640625, -46.779685974121094, -44.50022506713867, -42.22076416015625, -39.941307067871094, -37.66184616088867, -35.38238525390625, -33.102928161621094, -30.823469161987305, -28.544010162353516, -26.264549255371094, -23.985090255737305, -21.705631256103516, -19.426170349121094, -17.146711349487305, -14.867252349853516, -12.587793350219727, -10.308333396911621, -8.028873443603516, -5.749414443969727, -3.4699554443359375, -1.190495491027832, 1.0889644622802734, 3.3684234619140625, 5.64788293838501, 7.927342414855957, 10.206802368164062, 12.486261367797852, 14.76572036743164, 17.045181274414062, 19.32464027404785, 21.60409927368164, 23.88355827331543, 26.16301727294922, 28.44247817993164, 30.72193717956543, 33.00139617919922, 35.28085708618164, 37.56031799316406, 39.83977508544922, 42.11923599243164, 44.3986930847168, 46.67815399169922, 48.957611083984375, 51.2370719909668, 53.51653289794922, 55.795989990234375, 58.0754508972168, 60.35491180419922, 62.634368896484375, 64.91382598876953, 67.19329071044922, 69.47274780273438, 71.75220489501953, 74.03166961669922, 76.31112670898438]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 7.0, 4.0, 7.0, 5.0, 9.0, 6.0, 13.0, 10.0, 20.0, 13.0, 14.0, 25.0, 22.0, 36.0, 29.0, 36.0, 30.0, 32.0, 40.0, 33.0, 39.0, 41.0, 29.0, 36.0, 48.0, 42.0, 24.0, 24.0, 41.0, 33.0, 36.0, 30.0, 20.0, 17.0, 27.0, 30.0, 20.0, 11.0, 5.0, 11.0, 9.0, 7.0, 8.0, 3.0, 8.0, 2.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.34375, -8.08837890625, -7.8330078125, -7.57763671875, -7.322265625, -7.06689453125, -6.8115234375, -6.55615234375, -6.30078125, -6.04541015625, -5.7900390625, -5.53466796875, -5.279296875, -5.02392578125, -4.7685546875, -4.51318359375, -4.2578125, -4.00244140625, -3.7470703125, -3.49169921875, -3.236328125, -2.98095703125, -2.7255859375, -2.47021484375, -2.21484375, -1.95947265625, -1.7041015625, -1.44873046875, -1.193359375, -0.93798828125, -0.6826171875, -0.42724609375, -0.171875, 0.08349609375, 0.3388671875, 0.59423828125, 0.849609375, 1.10498046875, 1.3603515625, 1.61572265625, 1.87109375, 2.12646484375, 2.3818359375, 2.63720703125, 2.892578125, 3.14794921875, 3.4033203125, 3.65869140625, 3.9140625, 4.16943359375, 4.4248046875, 4.68017578125, 4.935546875, 5.19091796875, 5.4462890625, 5.70166015625, 5.95703125, 6.21240234375, 6.4677734375, 6.72314453125, 6.978515625, 7.23388671875, 7.4892578125, 7.74462890625, 8.0]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 7.0, 7.0, 11.0, 17.0, 18.0, 15.0, 34.0, 40.0, 47.0, 88.0, 132.0, 177.0, 288.0, 481.0, 838.0, 1458.0, 2807.0, 5881.0, 15160.0, 62208.0, 475195.0, 2088267.0, 1294931.0, 194144.0, 32516.0, 10055.0, 4250.0, 2207.0, 1157.0, 666.0, 399.0, 233.0, 150.0, 120.0, 80.0, 57.0, 44.0, 26.0, 19.0, 10.0, 11.0, 14.0, 9.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.265625, -14.769775390625, -14.27392578125, -13.778076171875, -13.2822265625, -12.786376953125, -12.29052734375, -11.794677734375, -11.298828125, -10.802978515625, -10.30712890625, -9.811279296875, -9.3154296875, -8.819580078125, -8.32373046875, -7.827880859375, -7.33203125, -6.836181640625, -6.34033203125, -5.844482421875, -5.3486328125, -4.852783203125, -4.35693359375, -3.861083984375, -3.365234375, -2.869384765625, -2.37353515625, -1.877685546875, -1.3818359375, -0.885986328125, -0.39013671875, 0.105712890625, 0.6015625, 1.097412109375, 1.59326171875, 2.089111328125, 2.5849609375, 3.080810546875, 3.57666015625, 4.072509765625, 4.568359375, 5.064208984375, 5.56005859375, 6.055908203125, 6.5517578125, 7.047607421875, 7.54345703125, 8.039306640625, 8.53515625, 9.031005859375, 9.52685546875, 10.022705078125, 10.5185546875, 11.014404296875, 11.51025390625, 12.006103515625, 12.501953125, 12.997802734375, 13.49365234375, 13.989501953125, 14.4853515625, 14.981201171875, 15.47705078125, 15.972900390625, 16.46875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 3.0, 6.0, 5.0, 15.0, 20.0, 12.0, 30.0, 50.0, 68.0, 136.0, 133.0, 239.0, 342.0, 532.0, 648.0, 595.0, 404.0, 284.0, 189.0, 118.0, 102.0, 57.0, 25.0, 20.0, 14.0, 13.0, 5.0, 3.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.40625, -18.72900390625, -18.0517578125, -17.37451171875, -16.697265625, -16.02001953125, -15.3427734375, -14.66552734375, -13.98828125, -13.31103515625, -12.6337890625, -11.95654296875, -11.279296875, -10.60205078125, -9.9248046875, -9.24755859375, -8.5703125, -7.89306640625, -7.2158203125, -6.53857421875, -5.861328125, -5.18408203125, -4.5068359375, -3.82958984375, -3.15234375, -2.47509765625, -1.7978515625, -1.12060546875, -0.443359375, 0.23388671875, 0.9111328125, 1.58837890625, 2.265625, 2.94287109375, 3.6201171875, 4.29736328125, 4.974609375, 5.65185546875, 6.3291015625, 7.00634765625, 7.68359375, 8.36083984375, 9.0380859375, 9.71533203125, 10.392578125, 11.06982421875, 11.7470703125, 12.42431640625, 13.1015625, 13.77880859375, 14.4560546875, 15.13330078125, 15.810546875, 16.48779296875, 17.1650390625, 17.84228515625, 18.51953125, 19.19677734375, 19.8740234375, 20.55126953125, 21.228515625, 21.90576171875, 22.5830078125, 23.26025390625, 23.9375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 3.0, 3.0, 10.0, 10.0, 17.0, 34.0, 72.0, 115.0, 246.0, 516.0, 1304.0, 5375.0, 3287049.0, 893452.0, 4028.0, 1083.0, 457.0, 226.0, 102.0, 63.0, 41.0, 19.0, 19.0, 17.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.125, -55.8828125, -53.640625, -51.3984375, -49.15625, -46.9140625, -44.671875, -42.4296875, -40.1875, -37.9453125, -35.703125, -33.4609375, -31.21875, -28.9765625, -26.734375, -24.4921875, -22.25, -20.0078125, -17.765625, -15.5234375, -13.28125, -11.0390625, -8.796875, -6.5546875, -4.3125, -2.0703125, 0.171875, 2.4140625, 4.65625, 6.8984375, 9.140625, 11.3828125, 13.625, 15.8671875, 18.109375, 20.3515625, 22.59375, 24.8359375, 27.078125, 29.3203125, 31.5625, 33.8046875, 36.046875, 38.2890625, 40.53125, 42.7734375, 45.015625, 47.2578125, 49.5, 51.7421875, 53.984375, 56.2265625, 58.46875, 60.7109375, 62.953125, 65.1953125, 67.4375, 69.6796875, 71.921875, 74.1640625, 76.40625, 78.6484375, 80.890625, 83.1328125, 85.375]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 49.0, 901.0, 63.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-280.87066650390625, -260.0891418457031, -239.30758666992188, -218.52606201171875, -197.74452209472656, -176.96298217773438, -156.18145751953125, -135.39991760253906, -114.61837768554688, -93.83683776855469, -73.05530548095703, -52.27376937866211, -31.492233276367188, -10.710693359375, 10.070838928222656, 30.852371215820312, 51.6339111328125, 72.41545104980469, 93.19698333740234, 113.978515625, 134.7600555419922, 155.54159545898438, 176.3231201171875, 197.1046600341797, 217.88619995117188, 238.66773986816406, 259.44927978515625, 280.2308044433594, 301.0123291015625, 321.79388427734375, 342.5754089355469, 363.35693359375, 384.138427734375, 404.9199523925781, 425.7015075683594, 446.4830322265625, 467.26458740234375, 488.0461120605469, 508.82763671875, 529.6091918945312, 550.3907470703125, 571.1723022460938, 591.9537963867188, 612.7353515625, 633.5169067382812, 654.2984619140625, 675.0799560546875, 695.8615112304688, 716.6430053710938, 737.424560546875, 758.2060546875, 778.9876098632812, 799.7691650390625, 820.5506591796875, 841.3322143554688, 862.11376953125, 882.895263671875, 903.6768188476562, 924.4583129882812, 945.2398681640625, 966.0214233398438, 986.802978515625, 1007.58447265625, 1028.365966796875, 1049.1475830078125]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 8.0, 14.0, 8.0, 5.0, 6.0, 14.0, 7.0, 17.0, 15.0, 19.0, 21.0, 21.0, 26.0, 22.0, 30.0, 35.0, 21.0, 41.0, 29.0, 36.0, 32.0, 45.0, 47.0, 40.0, 41.0, 45.0, 38.0, 44.0, 23.0, 21.0, 33.0, 22.0, 33.0, 21.0, 19.0, 13.0, 19.0, 20.0, 10.0, 12.0, 4.0, 1.0, 6.0, 8.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.473785400390625, -53.69788360595703, -51.9219856262207, -50.14608383178711, -48.37018585205078, -46.59428405761719, -44.818382263183594, -43.042484283447266, -41.26658630371094, -39.490684509277344, -37.714786529541016, -35.93888473510742, -34.162986755371094, -32.3870849609375, -30.61118507385254, -28.835285186767578, -27.059383392333984, -25.283483505249023, -23.507583618164062, -21.73168182373047, -19.95578384399414, -18.179882049560547, -16.403982162475586, -14.628082275390625, -12.852182388305664, -11.076282501220703, -9.300382614135742, -7.524481773376465, -5.748581886291504, -3.972681999206543, -2.1967811584472656, -0.4208812713623047, 1.3550186157226562, 3.1309187412261963, 4.906818866729736, 6.6827192306518555, 8.458619117736816, 10.234519004821777, 12.010419845581055, 13.786319732666016, 15.562219619750977, 17.338119506835938, 19.1140193939209, 20.88991928100586, 22.665821075439453, 24.44171905517578, 26.217620849609375, 27.993520736694336, 29.769420623779297, 31.545320510864258, 33.32122039794922, 35.09712219238281, 36.87302017211914, 38.648921966552734, 40.42481994628906, 42.200721740722656, 43.97662353515625, 45.752525329589844, 47.52842330932617, 49.304325103759766, 51.080223083496094, 52.85612487792969, 54.63202667236328, 56.40792465209961, 58.18382263183594]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 5.0, 5.0, 5.0, 6.0, 13.0, 10.0, 8.0, 17.0, 14.0, 16.0, 26.0, 17.0, 30.0, 26.0, 30.0, 40.0, 35.0, 32.0, 37.0, 40.0, 34.0, 36.0, 47.0, 32.0, 40.0, 33.0, 37.0, 34.0, 26.0, 32.0, 22.0, 24.0, 36.0, 22.0, 30.0, 19.0, 16.0, 12.0, 9.0, 13.0, 7.0, 8.0, 5.0, 7.0, 4.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.6640625, -7.4349365234375, -7.205810546875, -6.9766845703125, -6.74755859375, -6.5184326171875, -6.289306640625, -6.0601806640625, -5.8310546875, -5.6019287109375, -5.372802734375, -5.1436767578125, -4.91455078125, -4.6854248046875, -4.456298828125, -4.2271728515625, -3.998046875, -3.7689208984375, -3.539794921875, -3.3106689453125, -3.08154296875, -2.8524169921875, -2.623291015625, -2.3941650390625, -2.1650390625, -1.9359130859375, -1.706787109375, -1.4776611328125, -1.24853515625, -1.0194091796875, -0.790283203125, -0.5611572265625, -0.33203125, -0.1029052734375, 0.126220703125, 0.3553466796875, 0.58447265625, 0.8135986328125, 1.042724609375, 1.2718505859375, 1.5009765625, 1.7301025390625, 1.959228515625, 2.1883544921875, 2.41748046875, 2.6466064453125, 2.875732421875, 3.1048583984375, 3.333984375, 3.5631103515625, 3.792236328125, 4.0213623046875, 4.25048828125, 4.4796142578125, 4.708740234375, 4.9378662109375, 5.1669921875, 5.3961181640625, 5.625244140625, 5.8543701171875, 6.08349609375, 6.3126220703125, 6.541748046875, 6.7708740234375, 7.0]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 7.0, 6.0, 7.0, 9.0, 22.0, 43.0, 63.0, 98.0, 150.0, 264.0, 408.0, 635.0, 1012.0, 1423.0, 2251.0, 3577.0, 5436.0, 8606.0, 13430.0, 20965.0, 33886.0, 55000.0, 89818.0, 149432.0, 211458.0, 172632.0, 106140.0, 64431.0, 39263.0, 24564.0, 15708.0, 9861.0, 6359.0, 4129.0, 2738.0, 1651.0, 1066.0, 772.0, 452.0, 286.0, 207.0, 116.0, 59.0, 40.0, 32.0, 21.0, 13.0, 5.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8232421875, -0.7963943481445312, -0.7695465087890625, -0.7426986694335938, -0.715850830078125, -0.6890029907226562, -0.6621551513671875, -0.6353073120117188, -0.60845947265625, -0.5816116333007812, -0.5547637939453125, -0.5279159545898438, -0.501068115234375, -0.47422027587890625, -0.4473724365234375, -0.42052459716796875, -0.3936767578125, -0.36682891845703125, -0.3399810791015625, -0.31313323974609375, -0.286285400390625, -0.25943756103515625, -0.2325897216796875, -0.20574188232421875, -0.17889404296875, -0.15204620361328125, -0.1251983642578125, -0.09835052490234375, -0.071502685546875, -0.04465484619140625, -0.0178070068359375, 0.00904083251953125, 0.035888671875, 0.06273651123046875, 0.0895843505859375, 0.11643218994140625, 0.143280029296875, 0.17012786865234375, 0.1969757080078125, 0.22382354736328125, 0.25067138671875, 0.27751922607421875, 0.3043670654296875, 0.33121490478515625, 0.358062744140625, 0.38491058349609375, 0.4117584228515625, 0.43860626220703125, 0.4654541015625, 0.49230194091796875, 0.5191497802734375, 0.5459976196289062, 0.572845458984375, 0.5996932983398438, 0.6265411376953125, 0.6533889770507812, 0.68023681640625, 0.7070846557617188, 0.7339324951171875, 0.7607803344726562, 0.787628173828125, 0.8144760131835938, 0.8413238525390625, 0.8681716918945312, 0.89501953125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 2.0, 4.0, 3.0, 4.0, 9.0, 7.0, 15.0, 11.0, 7.0, 14.0, 24.0, 22.0, 22.0, 23.0, 16.0, 24.0, 35.0, 28.0, 26.0, 38.0, 42.0, 37.0, 47.0, 1055.0, 37.0, 45.0, 33.0, 43.0, 27.0, 24.0, 38.0, 38.0, 23.0, 21.0, 27.0, 19.0, 16.0, 18.0, 21.0, 13.0, 12.0, 15.0, 9.0, 7.0, 11.0, 3.0, 6.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-4.390625, -4.251953125, -4.11328125, -3.974609375, -3.8359375, -3.697265625, -3.55859375, -3.419921875, -3.28125, -3.142578125, -3.00390625, -2.865234375, -2.7265625, -2.587890625, -2.44921875, -2.310546875, -2.171875, -2.033203125, -1.89453125, -1.755859375, -1.6171875, -1.478515625, -1.33984375, -1.201171875, -1.0625, -0.923828125, -0.78515625, -0.646484375, -0.5078125, -0.369140625, -0.23046875, -0.091796875, 0.046875, 0.185546875, 0.32421875, 0.462890625, 0.6015625, 0.740234375, 0.87890625, 1.017578125, 1.15625, 1.294921875, 1.43359375, 1.572265625, 1.7109375, 1.849609375, 1.98828125, 2.126953125, 2.265625, 2.404296875, 2.54296875, 2.681640625, 2.8203125, 2.958984375, 3.09765625, 3.236328125, 3.375, 3.513671875, 3.65234375, 3.791015625, 3.9296875, 4.068359375, 4.20703125, 4.345703125, 4.484375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 3.0, 6.0, 7.0, 15.0, 10.0, 25.0, 37.0, 55.0, 78.0, 120.0, 153.0, 246.0, 363.0, 545.0, 739.0, 1075.0, 1545.0, 2262.0, 3295.0, 4765.0, 7261.0, 10831.0, 16099.0, 24557.0, 37573.0, 56691.0, 86705.0, 133779.0, 1236529.0, 161665.0, 106052.0, 69068.0, 45426.0, 29627.0, 19754.0, 12973.0, 8810.0, 5907.0, 3935.0, 2679.0, 1892.0, 1189.0, 893.0, 601.0, 389.0, 277.0, 191.0, 142.0, 85.0, 79.0, 43.0, 29.0, 23.0, 19.0, 10.0, 4.0, 5.0, 2.0, 1.0, 4.0, 3.0, 0.0, 2.0], "bins": [-0.66552734375, -0.6431427001953125, -0.620758056640625, -0.5983734130859375, -0.57598876953125, -0.5536041259765625, -0.531219482421875, -0.5088348388671875, -0.4864501953125, -0.4640655517578125, -0.441680908203125, -0.4192962646484375, -0.39691162109375, -0.3745269775390625, -0.352142333984375, -0.3297576904296875, -0.307373046875, -0.2849884033203125, -0.262603759765625, -0.2402191162109375, -0.21783447265625, -0.1954498291015625, -0.173065185546875, -0.1506805419921875, -0.1282958984375, -0.1059112548828125, -0.083526611328125, -0.0611419677734375, -0.03875732421875, -0.0163726806640625, 0.006011962890625, 0.0283966064453125, 0.05078125, 0.0731658935546875, 0.095550537109375, 0.1179351806640625, 0.14031982421875, 0.1627044677734375, 0.185089111328125, 0.2074737548828125, 0.2298583984375, 0.2522430419921875, 0.274627685546875, 0.2970123291015625, 0.31939697265625, 0.3417816162109375, 0.364166259765625, 0.3865509033203125, 0.408935546875, 0.4313201904296875, 0.453704833984375, 0.4760894775390625, 0.49847412109375, 0.5208587646484375, 0.543243408203125, 0.5656280517578125, 0.5880126953125, 0.6103973388671875, 0.632781982421875, 0.6551666259765625, 0.67755126953125, 0.6999359130859375, 0.722320556640625, 0.7447052001953125, 0.76708984375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 9.0, 6.0, 18.0, 12.0, 9.0, 16.0, 19.0, 28.0, 39.0, 38.0, 33.0, 47.0, 56.0, 74.0, 65.0, 61.0, 72.0, 65.0, 51.0, 46.0, 42.0, 40.0, 30.0, 21.0, 17.0, 21.0, 17.0, 11.0, 7.0, 8.0, 4.0, 6.0, 3.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0034580230712890625, -0.0033577382564544678, -0.003257453441619873, -0.0031571686267852783, -0.0030568838119506836, -0.002956598997116089, -0.002856314182281494, -0.0027560293674468994, -0.0026557445526123047, -0.00255545973777771, -0.0024551749229431152, -0.0023548901081085205, -0.0022546052932739258, -0.002154320478439331, -0.0020540356636047363, -0.0019537508487701416, -0.0018534660339355469, -0.0017531812191009521, -0.0016528964042663574, -0.0015526115894317627, -0.001452326774597168, -0.0013520419597625732, -0.0012517571449279785, -0.0011514723300933838, -0.001051187515258789, -0.0009509027004241943, -0.0008506178855895996, -0.0007503330707550049, -0.0006500482559204102, -0.0005497634410858154, -0.0004494786262512207, -0.000349193811416626, -0.00024890899658203125, -0.00014862418174743652, -4.83393669128418e-05, 5.194544792175293e-05, 0.00015223026275634766, 0.0002525150775909424, 0.0003527998924255371, 0.00045308470726013184, 0.0005533695220947266, 0.0006536543369293213, 0.000753939151763916, 0.0008542239665985107, 0.0009545087814331055, 0.0010547935962677002, 0.001155078411102295, 0.0012553632259368896, 0.0013556480407714844, 0.001455932855606079, 0.0015562176704406738, 0.0016565024852752686, 0.0017567873001098633, 0.001857072114944458, 0.0019573569297790527, 0.0020576417446136475, 0.002157926559448242, 0.002258211374282837, 0.0023584961891174316, 0.0024587810039520264, 0.002559065818786621, 0.002659350633621216, 0.0027596354484558105, 0.0028599202632904053, 0.002960205078125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 5.0, 2.0, 3.0, 3.0, 5.0, 6.0, 8.0, 12.0, 14.0, 21.0, 21.0, 40.0, 49.0, 48.0, 67.0, 77.0, 97.0, 152.0, 220.0, 285.0, 467.0, 770.0, 4283.0, 1032965.0, 6409.0, 891.0, 460.0, 332.0, 197.0, 134.0, 118.0, 96.0, 79.0, 51.0, 37.0, 29.0, 39.0, 21.0, 11.0, 10.0, 5.0, 10.0, 2.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.045074462890625, -0.0435481071472168, -0.042021751403808594, -0.04049539566040039, -0.03896903991699219, -0.037442684173583984, -0.03591632843017578, -0.03438997268676758, -0.032863616943359375, -0.03133726119995117, -0.02981090545654297, -0.028284549713134766, -0.026758193969726562, -0.02523183822631836, -0.023705482482910156, -0.022179126739501953, -0.02065277099609375, -0.019126415252685547, -0.017600059509277344, -0.01607370376586914, -0.014547348022460938, -0.013020992279052734, -0.011494636535644531, -0.009968280792236328, -0.008441925048828125, -0.006915569305419922, -0.005389213562011719, -0.0038628578186035156, -0.0023365020751953125, -0.0008101463317871094, 0.0007162094116210938, 0.002242565155029297, 0.0037689208984375, 0.005295276641845703, 0.006821632385253906, 0.00834798812866211, 0.009874343872070312, 0.011400699615478516, 0.012927055358886719, 0.014453411102294922, 0.015979766845703125, 0.017506122589111328, 0.01903247833251953, 0.020558834075927734, 0.022085189819335938, 0.02361154556274414, 0.025137901306152344, 0.026664257049560547, 0.02819061279296875, 0.029716968536376953, 0.031243324279785156, 0.03276968002319336, 0.03429603576660156, 0.035822391510009766, 0.03734874725341797, 0.03887510299682617, 0.040401458740234375, 0.04192781448364258, 0.04345417022705078, 0.044980525970458984, 0.04650688171386719, 0.04803323745727539, 0.049559593200683594, 0.0510859489440918, 0.0526123046875]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 62.0, 543.0, 376.0, 27.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01034457515925169, -0.010113962925970554, -0.009883350692689419, -0.009652738459408283, -0.009422127157449722, -0.009191514924168587, -0.008960902690887451, -0.008730290457606316, -0.00849967822432518, -0.008269065991044044, -0.008038453757762909, -0.007807841990143061, -0.007577229756861925, -0.007346617989242077, -0.007116005755960941, -0.006885393522679806, -0.00665478128939867, -0.006424169056117535, -0.006193557288497686, -0.005962945055216551, -0.005732332821935415, -0.005501721054315567, -0.0052711088210344315, -0.005040496587753296, -0.004809884820133448, -0.004579272586852312, -0.004348660819232464, -0.004118048585951328, -0.0038874363526701927, -0.003656824352219701, -0.003426212351769209, -0.0031956001184880733, -0.002964987885206938, -0.002734375884756446, -0.0025037636514753103, -0.0022731516510248184, -0.002042539417743683, -0.001811927417293191, -0.0015813153004273772, -0.0013507031835615635, -0.0011200910666957498, -0.000889478949829936, -0.0006588668329641223, -0.0004282547743059695, -0.00019764265744015574, 3.2969401217997074e-05, 0.0002635815180838108, 0.0004941936349496245, 0.0007248057518154383, 0.000955417868681252, 0.0011860299855470657, 0.0014166419859975576, 0.0016472542192786932, 0.001877866219729185, 0.0021084784530103207, 0.0023390904534608126, 0.0025697024539113045, 0.0028003144543617964, 0.003030926687642932, 0.003261538688093424, 0.0034921509213745594, 0.0037227629218250513, 0.003953374922275543, 0.004183987155556679, 0.004414599388837814]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 6.0, 5.0, 6.0, 6.0, 9.0, 6.0, 10.0, 15.0, 15.0, 23.0, 23.0, 26.0, 29.0, 25.0, 29.0, 33.0, 33.0, 25.0, 43.0, 32.0, 44.0, 33.0, 47.0, 34.0, 43.0, 38.0, 42.0, 32.0, 35.0, 24.0, 30.0, 29.0, 25.0, 19.0, 22.0, 16.0, 19.0, 9.0, 11.0, 10.0, 15.0, 9.0, 5.0, 6.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 3.0], "bins": [-0.0015636086463928223, -0.001516789197921753, -0.0014699697494506836, -0.0014231503009796143, -0.001376330852508545, -0.0013295114040374756, -0.0012826919555664062, -0.001235872507095337, -0.0011890530586242676, -0.0011422336101531982, -0.001095414161682129, -0.0010485947132110596, -0.0010017752647399902, -0.0009549558162689209, -0.0009081363677978516, -0.0008613169193267822, -0.0008144974708557129, -0.0007676780223846436, -0.0007208585739135742, -0.0006740391254425049, -0.0006272196769714355, -0.0005804002285003662, -0.0005335807800292969, -0.00048676133155822754, -0.0004399418830871582, -0.00039312243461608887, -0.00034630298614501953, -0.0002994835376739502, -0.00025266408920288086, -0.00020584464073181152, -0.0001590251922607422, -0.00011220574378967285, -6.538629531860352e-05, -1.856684684753418e-05, 2.8252601623535156e-05, 7.507205009460449e-05, 0.00012189149856567383, 0.00016871094703674316, 0.0002155303955078125, 0.00026234984397888184, 0.00030916929244995117, 0.0003559887409210205, 0.00040280818939208984, 0.0004496276378631592, 0.0004964470863342285, 0.0005432665348052979, 0.0005900859832763672, 0.0006369054317474365, 0.0006837248802185059, 0.0007305443286895752, 0.0007773637771606445, 0.0008241832256317139, 0.0008710026741027832, 0.0009178221225738525, 0.0009646415710449219, 0.0010114610195159912, 0.0010582804679870605, 0.0011050999164581299, 0.0011519193649291992, 0.0011987388134002686, 0.0012455582618713379, 0.0012923777103424072, 0.0013391971588134766, 0.001386016607284546, 0.0014328360557556152]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 5.0, 5.0, 5.0, 6.0, 13.0, 10.0, 8.0, 17.0, 14.0, 16.0, 26.0, 17.0, 30.0, 26.0, 30.0, 40.0, 35.0, 32.0, 37.0, 40.0, 34.0, 36.0, 47.0, 32.0, 40.0, 33.0, 37.0, 34.0, 26.0, 32.0, 22.0, 24.0, 36.0, 22.0, 30.0, 19.0, 16.0, 12.0, 9.0, 13.0, 7.0, 8.0, 5.0, 7.0, 4.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.6640625, -7.4349365234375, -7.205810546875, -6.9766845703125, -6.74755859375, -6.5184326171875, -6.289306640625, -6.0601806640625, -5.8310546875, -5.6019287109375, -5.372802734375, -5.1436767578125, -4.91455078125, -4.6854248046875, -4.456298828125, -4.2271728515625, -3.998046875, -3.7689208984375, -3.539794921875, -3.3106689453125, -3.08154296875, -2.8524169921875, -2.623291015625, -2.3941650390625, -2.1650390625, -1.9359130859375, -1.706787109375, -1.4776611328125, -1.24853515625, -1.0194091796875, -0.790283203125, -0.5611572265625, -0.33203125, -0.1029052734375, 0.126220703125, 0.3553466796875, 0.58447265625, 0.8135986328125, 1.042724609375, 1.2718505859375, 1.5009765625, 1.7301025390625, 1.959228515625, 2.1883544921875, 2.41748046875, 2.6466064453125, 2.875732421875, 3.1048583984375, 3.333984375, 3.5631103515625, 3.792236328125, 4.0213623046875, 4.25048828125, 4.4796142578125, 4.708740234375, 4.9378662109375, 5.1669921875, 5.3961181640625, 5.625244140625, 5.8543701171875, 6.08349609375, 6.3126220703125, 6.541748046875, 6.7708740234375, 7.0]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 8.0, 4.0, 2.0, 6.0, 15.0, 12.0, 22.0, 23.0, 30.0, 41.0, 56.0, 79.0, 103.0, 150.0, 194.0, 307.0, 430.0, 696.0, 1196.0, 2166.0, 4467.0, 11746.0, 38877.0, 197976.0, 611152.0, 131544.0, 29299.0, 9280.0, 3806.0, 1778.0, 1022.0, 675.0, 370.0, 298.0, 184.0, 166.0, 112.0, 66.0, 51.0, 36.0, 34.0, 23.0, 13.0, 12.0, 9.0, 10.0, 7.0, 3.0, 1.0, 1.0, 6.0, 0.0, 1.0, 1.0], "bins": [-14.953125, -14.518310546875, -14.08349609375, -13.648681640625, -13.2138671875, -12.779052734375, -12.34423828125, -11.909423828125, -11.474609375, -11.039794921875, -10.60498046875, -10.170166015625, -9.7353515625, -9.300537109375, -8.86572265625, -8.430908203125, -7.99609375, -7.561279296875, -7.12646484375, -6.691650390625, -6.2568359375, -5.822021484375, -5.38720703125, -4.952392578125, -4.517578125, -4.082763671875, -3.64794921875, -3.213134765625, -2.7783203125, -2.343505859375, -1.90869140625, -1.473876953125, -1.0390625, -0.604248046875, -0.16943359375, 0.265380859375, 0.7001953125, 1.135009765625, 1.56982421875, 2.004638671875, 2.439453125, 2.874267578125, 3.30908203125, 3.743896484375, 4.1787109375, 4.613525390625, 5.04833984375, 5.483154296875, 5.91796875, 6.352783203125, 6.78759765625, 7.222412109375, 7.6572265625, 8.092041015625, 8.52685546875, 8.961669921875, 9.396484375, 9.831298828125, 10.26611328125, 10.700927734375, 11.1357421875, 11.570556640625, 12.00537109375, 12.440185546875, 12.875]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 7.0, 4.0, 4.0, 5.0, 4.0, 9.0, 13.0, 17.0, 18.0, 18.0, 24.0, 29.0, 35.0, 49.0, 33.0, 46.0, 67.0, 96.0, 312.0, 1589.0, 201.0, 87.0, 79.0, 59.0, 36.0, 31.0, 26.0, 29.0, 25.0, 23.0, 18.0, 10.0, 8.0, 5.0, 7.0, 6.0, 5.0, 3.0, 1.0, 5.0, 2.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.0625, -22.3017578125, -21.541015625, -20.7802734375, -20.01953125, -19.2587890625, -18.498046875, -17.7373046875, -16.9765625, -16.2158203125, -15.455078125, -14.6943359375, -13.93359375, -13.1728515625, -12.412109375, -11.6513671875, -10.890625, -10.1298828125, -9.369140625, -8.6083984375, -7.84765625, -7.0869140625, -6.326171875, -5.5654296875, -4.8046875, -4.0439453125, -3.283203125, -2.5224609375, -1.76171875, -1.0009765625, -0.240234375, 0.5205078125, 1.28125, 2.0419921875, 2.802734375, 3.5634765625, 4.32421875, 5.0849609375, 5.845703125, 6.6064453125, 7.3671875, 8.1279296875, 8.888671875, 9.6494140625, 10.41015625, 11.1708984375, 11.931640625, 12.6923828125, 13.453125, 14.2138671875, 14.974609375, 15.7353515625, 16.49609375, 17.2568359375, 18.017578125, 18.7783203125, 19.5390625, 20.2998046875, 21.060546875, 21.8212890625, 22.58203125, 23.3427734375, 24.103515625, 24.8642578125, 25.625]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 5.0, 6.0, 6.0, 5.0, 12.0, 20.0, 25.0, 19.0, 26.0, 72.0, 72.0, 105.0, 203.0, 398.0, 833.0, 4874.0, 3128794.0, 8194.0, 972.0, 413.0, 232.0, 121.0, 78.0, 60.0, 49.0, 23.0, 22.0, 15.0, 9.0, 5.0, 5.0, 9.0, 4.0, 3.0, 4.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-74.75, -72.5224609375, -70.294921875, -68.0673828125, -65.83984375, -63.6123046875, -61.384765625, -59.1572265625, -56.9296875, -54.7021484375, -52.474609375, -50.2470703125, -48.01953125, -45.7919921875, -43.564453125, -41.3369140625, -39.109375, -36.8818359375, -34.654296875, -32.4267578125, -30.19921875, -27.9716796875, -25.744140625, -23.5166015625, -21.2890625, -19.0615234375, -16.833984375, -14.6064453125, -12.37890625, -10.1513671875, -7.923828125, -5.6962890625, -3.46875, -1.2412109375, 0.986328125, 3.2138671875, 5.44140625, 7.6689453125, 9.896484375, 12.1240234375, 14.3515625, 16.5791015625, 18.806640625, 21.0341796875, 23.26171875, 25.4892578125, 27.716796875, 29.9443359375, 32.171875, 34.3994140625, 36.626953125, 38.8544921875, 41.08203125, 43.3095703125, 45.537109375, 47.7646484375, 49.9921875, 52.2197265625, 54.447265625, 56.6748046875, 58.90234375, 61.1298828125, 63.357421875, 65.5849609375, 67.8125]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 16.0, 912.0, 81.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.02238464355469, -52.62108612060547, -43.21978759765625, -33.818485260009766, -24.417186737060547, -15.015888214111328, -5.614585876464844, 3.786712646484375, 13.188011169433594, 22.589309692382812, 31.990610122680664, 41.391910552978516, 50.793209075927734, 60.19450759887695, 69.59580993652344, 78.99710845947266, 88.39840698242188, 97.7997055053711, 107.20100402832031, 116.60231018066406, 126.00360107421875, 135.4049072265625, 144.80621337890625, 154.20750427246094, 163.60879516601562, 173.01010131835938, 182.41139221191406, 191.8126983642578, 201.2139892578125, 210.61529541015625, 220.0166015625, 229.4178924560547, 238.81918334960938, 248.22048950195312, 257.6217956542969, 267.0230712890625, 276.42437744140625, 285.82568359375, 295.22698974609375, 304.6282958984375, 314.0295715332031, 323.4308776855469, 332.8321838378906, 342.23345947265625, 351.634765625, 361.03607177734375, 370.4373779296875, 379.83868408203125, 389.239990234375, 398.64129638671875, 408.0426025390625, 417.4438781738281, 426.8451843261719, 436.2464904785156, 445.6477966308594, 455.049072265625, 464.45037841796875, 473.8516845703125, 483.25299072265625, 492.6542663574219, 502.0555725097656, 511.4568786621094, 520.858154296875, 530.2594604492188, 539.6607666015625]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 2.0, 6.0, 4.0, 7.0, 7.0, 5.0, 14.0, 8.0, 10.0, 15.0, 14.0, 16.0, 21.0, 24.0, 24.0, 30.0, 24.0, 31.0, 28.0, 29.0, 35.0, 39.0, 36.0, 27.0, 48.0, 42.0, 37.0, 39.0, 37.0, 46.0, 33.0, 29.0, 35.0, 28.0, 25.0, 29.0, 14.0, 14.0, 10.0, 16.0, 7.0, 15.0, 13.0, 7.0, 4.0, 6.0, 6.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0], "bins": [-44.23744201660156, -42.61337661743164, -40.98930740356445, -39.36524200439453, -37.741172790527344, -36.11710739135742, -34.4930419921875, -32.86897277832031, -31.24490737915039, -29.620840072631836, -27.99677276611328, -26.37270736694336, -24.748640060424805, -23.12457275390625, -21.500505447387695, -19.87643814086914, -18.252370834350586, -16.62830352783203, -15.004237174987793, -13.380169868469238, -11.756103515625, -10.132036209106445, -8.50796890258789, -6.883902549743652, -5.259835243225098, -3.635768413543701, -2.0117013454437256, -0.38763427734375, 1.2364325523376465, 2.860499382019043, 4.484566688537598, 6.108633041381836, 7.732700347900391, 9.356767654418945, 10.980834007263184, 12.604901313781738, 14.228967666625977, 15.853034973144531, 17.477102279663086, 19.10116958618164, 20.725234985351562, 22.349302291870117, 23.973369598388672, 25.597434997558594, 27.22150230407715, 28.845569610595703, 30.469636917114258, 32.09370422363281, 33.7177734375, 35.34183883666992, 36.96590805053711, 38.58997344970703, 40.21404266357422, 41.83810806274414, 43.46217346191406, 45.08624267578125, 46.71030807495117, 48.334373474121094, 49.95844268798828, 51.5825080871582, 53.20657730102539, 54.83064270019531, 56.4547119140625, 58.07877731323242, 59.702842712402344]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 4.0, 6.0, 2.0, 8.0, 9.0, 9.0, 8.0, 19.0, 22.0, 17.0, 22.0, 27.0, 30.0, 21.0, 31.0, 34.0, 32.0, 43.0, 38.0, 39.0, 41.0, 27.0, 40.0, 38.0, 44.0, 46.0, 37.0, 44.0, 28.0, 14.0, 24.0, 26.0, 24.0, 17.0, 23.0, 17.0, 24.0, 17.0, 12.0, 9.0, 8.0, 5.0, 4.0, 2.0, 7.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.8046875, -8.5223388671875, -8.239990234375, -7.9576416015625, -7.67529296875, -7.3929443359375, -7.110595703125, -6.8282470703125, -6.5458984375, -6.2635498046875, -5.981201171875, -5.6988525390625, -5.41650390625, -5.1341552734375, -4.851806640625, -4.5694580078125, -4.287109375, -4.0047607421875, -3.722412109375, -3.4400634765625, -3.15771484375, -2.8753662109375, -2.593017578125, -2.3106689453125, -2.0283203125, -1.7459716796875, -1.463623046875, -1.1812744140625, -0.89892578125, -0.6165771484375, -0.334228515625, -0.0518798828125, 0.23046875, 0.5128173828125, 0.795166015625, 1.0775146484375, 1.35986328125, 1.6422119140625, 1.924560546875, 2.2069091796875, 2.4892578125, 2.7716064453125, 3.053955078125, 3.3363037109375, 3.61865234375, 3.9010009765625, 4.183349609375, 4.4656982421875, 4.748046875, 5.0303955078125, 5.312744140625, 5.5950927734375, 5.87744140625, 6.1597900390625, 6.442138671875, 6.7244873046875, 7.0068359375, 7.2891845703125, 7.571533203125, 7.8538818359375, 8.13623046875, 8.4185791015625, 8.700927734375, 8.9832763671875, 9.265625]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 6.0, 11.0, 8.0, 10.0, 14.0, 26.0, 23.0, 40.0, 49.0, 57.0, 62.0, 72.0, 95.0, 112.0, 163.0, 208.0, 288.0, 449.0, 727.0, 1290.0, 4204.0, 134783.0, 3921998.0, 121914.0, 4048.0, 1197.0, 668.0, 428.0, 285.0, 238.0, 167.0, 127.0, 97.0, 80.0, 60.0, 63.0, 44.0, 36.0, 28.0, 28.0, 16.0, 21.0, 10.0, 11.0, 6.0, 6.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0], "bins": [-59.5, -57.77490234375, -56.0498046875, -54.32470703125, -52.599609375, -50.87451171875, -49.1494140625, -47.42431640625, -45.69921875, -43.97412109375, -42.2490234375, -40.52392578125, -38.798828125, -37.07373046875, -35.3486328125, -33.62353515625, -31.8984375, -30.17333984375, -28.4482421875, -26.72314453125, -24.998046875, -23.27294921875, -21.5478515625, -19.82275390625, -18.09765625, -16.37255859375, -14.6474609375, -12.92236328125, -11.197265625, -9.47216796875, -7.7470703125, -6.02197265625, -4.296875, -2.57177734375, -0.8466796875, 0.87841796875, 2.603515625, 4.32861328125, 6.0537109375, 7.77880859375, 9.50390625, 11.22900390625, 12.9541015625, 14.67919921875, 16.404296875, 18.12939453125, 19.8544921875, 21.57958984375, 23.3046875, 25.02978515625, 26.7548828125, 28.47998046875, 30.205078125, 31.93017578125, 33.6552734375, 35.38037109375, 37.10546875, 38.83056640625, 40.5556640625, 42.28076171875, 44.005859375, 45.73095703125, 47.4560546875, 49.18115234375, 50.90625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 5.0, 6.0, 9.0, 19.0, 15.0, 38.0, 42.0, 92.0, 165.0, 316.0, 639.0, 865.0, 839.0, 483.0, 256.0, 116.0, 57.0, 46.0, 22.0, 14.0, 7.0, 4.0, 3.0, 3.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.921875, -18.127197265625, -17.33251953125, -16.537841796875, -15.7431640625, -14.948486328125, -14.15380859375, -13.359130859375, -12.564453125, -11.769775390625, -10.97509765625, -10.180419921875, -9.3857421875, -8.591064453125, -7.79638671875, -7.001708984375, -6.20703125, -5.412353515625, -4.61767578125, -3.822998046875, -3.0283203125, -2.233642578125, -1.43896484375, -0.644287109375, 0.150390625, 0.945068359375, 1.73974609375, 2.534423828125, 3.3291015625, 4.123779296875, 4.91845703125, 5.713134765625, 6.5078125, 7.302490234375, 8.09716796875, 8.891845703125, 9.6865234375, 10.481201171875, 11.27587890625, 12.070556640625, 12.865234375, 13.659912109375, 14.45458984375, 15.249267578125, 16.0439453125, 16.838623046875, 17.63330078125, 18.427978515625, 19.22265625, 20.017333984375, 20.81201171875, 21.606689453125, 22.4013671875, 23.196044921875, 23.99072265625, 24.785400390625, 25.580078125, 26.374755859375, 27.16943359375, 27.964111328125, 28.7587890625, 29.553466796875, 30.34814453125, 31.142822265625, 31.9375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 5.0, 9.0, 4.0, 23.0, 23.0, 48.0, 107.0, 338.0, 879.0, 3550.0, 32605.0, 3710906.0, 433249.0, 9654.0, 1938.0, 562.0, 203.0, 76.0, 51.0, 22.0, 10.0, 8.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.65625, -32.2978515625, -30.939453125, -29.5810546875, -28.22265625, -26.8642578125, -25.505859375, -24.1474609375, -22.7890625, -21.4306640625, -20.072265625, -18.7138671875, -17.35546875, -15.9970703125, -14.638671875, -13.2802734375, -11.921875, -10.5634765625, -9.205078125, -7.8466796875, -6.48828125, -5.1298828125, -3.771484375, -2.4130859375, -1.0546875, 0.3037109375, 1.662109375, 3.0205078125, 4.37890625, 5.7373046875, 7.095703125, 8.4541015625, 9.8125, 11.1708984375, 12.529296875, 13.8876953125, 15.24609375, 16.6044921875, 17.962890625, 19.3212890625, 20.6796875, 22.0380859375, 23.396484375, 24.7548828125, 26.11328125, 27.4716796875, 28.830078125, 30.1884765625, 31.546875, 32.9052734375, 34.263671875, 35.6220703125, 36.98046875, 38.3388671875, 39.697265625, 41.0556640625, 42.4140625, 43.7724609375, 45.130859375, 46.4892578125, 47.84765625, 49.2060546875, 50.564453125, 51.9228515625, 53.28125]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 8.0, 12.0, 24.0, 53.0, 117.0, 199.0, 250.0, 173.0, 92.0, 53.0, 15.0, 9.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-153.6534881591797, -147.05442810058594, -140.4553680419922, -133.85630798339844, -127.25724792480469, -120.65818786621094, -114.05912780761719, -107.46006774902344, -100.86100769042969, -94.26194763183594, -87.66288757324219, -81.06382751464844, -74.46476745605469, -67.86570739746094, -61.26664733886719, -54.66758728027344, -48.06852722167969, -41.46946716308594, -34.87040710449219, -28.271347045898438, -21.672286987304688, -15.073226928710938, -8.474166870117188, -1.8751068115234375, 4.7239532470703125, 11.323013305664062, 17.922073364257812, 24.521133422851562, 31.120193481445312, 37.71925354003906, 44.31831359863281, 50.91737365722656, 57.51641845703125, 64.115478515625, 70.71453857421875, 77.3135986328125, 83.91265869140625, 90.51171875, 97.11077880859375, 103.7098388671875, 110.30889892578125, 116.907958984375, 123.50701904296875, 130.1060791015625, 136.70513916015625, 143.30419921875, 149.90325927734375, 156.5023193359375, 163.10137939453125, 169.700439453125, 176.29949951171875, 182.8985595703125, 189.49761962890625, 196.0966796875, 202.69573974609375, 209.2947998046875, 215.89385986328125, 222.492919921875, 229.09197998046875, 235.6910400390625, 242.29010009765625, 248.88916015625, 255.48822021484375, 262.0872802734375, 268.68634033203125]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 8.0, 5.0, 10.0, 12.0, 14.0, 21.0, 22.0, 26.0, 34.0, 31.0, 43.0, 53.0, 57.0, 66.0, 53.0, 43.0, 58.0, 56.0, 52.0, 49.0, 46.0, 36.0, 38.0, 33.0, 29.0, 17.0, 20.0, 25.0, 12.0, 17.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-64.976318359375, -62.81026840209961, -60.64421844482422, -58.47816848754883, -56.31211853027344, -54.14606857299805, -51.980018615722656, -49.813968658447266, -47.647918701171875, -45.481868743896484, -43.315818786621094, -41.1497688293457, -38.98371887207031, -36.81766891479492, -34.65161895751953, -32.48556900024414, -30.31951904296875, -28.15346908569336, -25.98741912841797, -23.821369171142578, -21.655319213867188, -19.489269256591797, -17.323219299316406, -15.157169342041016, -12.991119384765625, -10.825069427490234, -8.659019470214844, -6.492969512939453, -4.3269195556640625, -2.160869598388672, 0.00518035888671875, 2.1712303161621094, 4.3372802734375, 6.503330230712891, 8.669380187988281, 10.835430145263672, 13.001480102539062, 15.167530059814453, 17.333580017089844, 19.499629974365234, 21.665679931640625, 23.831729888916016, 25.997779846191406, 28.163829803466797, 30.329879760742188, 32.49592971801758, 34.66197967529297, 36.82802963256836, 38.99407958984375, 41.16012954711914, 43.32617950439453, 45.49222946166992, 47.65827941894531, 49.8243293762207, 51.990379333496094, 54.156429290771484, 56.322479248046875, 58.488529205322266, 60.654579162597656, 62.82062911987305, 64.98667907714844, 67.15272521972656, 69.31877899169922, 71.48483276367188, 73.65087890625]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 7.0, 7.0, 10.0, 4.0, 16.0, 15.0, 12.0, 32.0, 28.0, 42.0, 45.0, 52.0, 56.0, 67.0, 51.0, 64.0, 58.0, 63.0, 52.0, 48.0, 47.0, 46.0, 31.0, 33.0, 24.0, 29.0, 22.0, 13.0, 16.0, 5.0, 7.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-106.375, -102.58984375, -98.8046875, -95.01953125, -91.234375, -87.44921875, -83.6640625, -79.87890625, -76.09375, -72.30859375, -68.5234375, -64.73828125, -60.953125, -57.16796875, -53.3828125, -49.59765625, -45.8125, -42.02734375, -38.2421875, -34.45703125, -30.671875, -26.88671875, -23.1015625, -19.31640625, -15.53125, -11.74609375, -7.9609375, -4.17578125, -0.390625, 3.39453125, 7.1796875, 10.96484375, 14.75, 18.53515625, 22.3203125, 26.10546875, 29.890625, 33.67578125, 37.4609375, 41.24609375, 45.03125, 48.81640625, 52.6015625, 56.38671875, 60.171875, 63.95703125, 67.7421875, 71.52734375, 75.3125, 79.09765625, 82.8828125, 86.66796875, 90.453125, 94.23828125, 98.0234375, 101.80859375, 105.59375, 109.37890625, 113.1640625, 116.94921875, 120.734375, 124.51953125, 128.3046875, 132.08984375, 135.875]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 6.0, 8.0, 10.0, 14.0, 24.0, 33.0, 52.0, 65.0, 117.0, 195.0, 265.0, 518.0, 908.0, 1713.0, 3573.0, 7418.0, 14976.0, 30961.0, 66263.0, 149363.0, 314194.0, 251075.0, 109906.0, 49878.0, 23966.0, 11429.0, 5660.0, 2682.0, 1423.0, 713.0, 416.0, 260.0, 166.0, 96.0, 59.0, 48.0, 30.0, 15.0, 24.0, 10.0, 4.0, 6.0, 4.0, 5.0, 4.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.6796875, -15.1868896484375, -14.694091796875, -14.2012939453125, -13.70849609375, -13.2156982421875, -12.722900390625, -12.2301025390625, -11.7373046875, -11.2445068359375, -10.751708984375, -10.2589111328125, -9.76611328125, -9.2733154296875, -8.780517578125, -8.2877197265625, -7.794921875, -7.3021240234375, -6.809326171875, -6.3165283203125, -5.82373046875, -5.3309326171875, -4.838134765625, -4.3453369140625, -3.8525390625, -3.3597412109375, -2.866943359375, -2.3741455078125, -1.88134765625, -1.3885498046875, -0.895751953125, -0.4029541015625, 0.08984375, 0.5826416015625, 1.075439453125, 1.5682373046875, 2.06103515625, 2.5538330078125, 3.046630859375, 3.5394287109375, 4.0322265625, 4.5250244140625, 5.017822265625, 5.5106201171875, 6.00341796875, 6.4962158203125, 6.989013671875, 7.4818115234375, 7.974609375, 8.4674072265625, 8.960205078125, 9.4530029296875, 9.94580078125, 10.4385986328125, 10.931396484375, 11.4241943359375, 11.9169921875, 12.4097900390625, 12.902587890625, 13.3953857421875, 13.88818359375, 14.3809814453125, 14.873779296875, 15.3665771484375, 15.859375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 1.0, 9.0, 11.0, 10.0, 11.0, 10.0, 18.0, 21.0, 17.0, 25.0, 39.0, 43.0, 24.0, 41.0, 42.0, 51.0, 48.0, 52.0, 1083.0, 38.0, 56.0, 44.0, 51.0, 37.0, 34.0, 35.0, 29.0, 32.0, 27.0, 17.0, 15.0, 20.0, 7.0, 9.0, 6.0, 5.0, 2.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.875, -57.837890625, -55.80078125, -53.763671875, -51.7265625, -49.689453125, -47.65234375, -45.615234375, -43.578125, -41.541015625, -39.50390625, -37.466796875, -35.4296875, -33.392578125, -31.35546875, -29.318359375, -27.28125, -25.244140625, -23.20703125, -21.169921875, -19.1328125, -17.095703125, -15.05859375, -13.021484375, -10.984375, -8.947265625, -6.91015625, -4.873046875, -2.8359375, -0.798828125, 1.23828125, 3.275390625, 5.3125, 7.349609375, 9.38671875, 11.423828125, 13.4609375, 15.498046875, 17.53515625, 19.572265625, 21.609375, 23.646484375, 25.68359375, 27.720703125, 29.7578125, 31.794921875, 33.83203125, 35.869140625, 37.90625, 39.943359375, 41.98046875, 44.017578125, 46.0546875, 48.091796875, 50.12890625, 52.166015625, 54.203125, 56.240234375, 58.27734375, 60.314453125, 62.3515625, 64.388671875, 66.42578125, 68.462890625, 70.5]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 9.0, 9.0, 9.0, 21.0, 29.0, 26.0, 58.0, 120.0, 174.0, 224.0, 393.0, 620.0, 1023.0, 1577.0, 2439.0, 3934.0, 6522.0, 10461.0, 16849.0, 28714.0, 47946.0, 81338.0, 137267.0, 1264198.0, 197353.0, 119016.0, 70445.0, 41992.0, 25049.0, 14959.0, 9186.0, 5608.0, 3609.0, 2252.0, 1364.0, 841.0, 555.0, 333.0, 238.0, 128.0, 81.0, 60.0, 38.0, 24.0, 12.0, 14.0, 7.0, 4.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-10.3515625, -10.0267333984375, -9.701904296875, -9.3770751953125, -9.05224609375, -8.7274169921875, -8.402587890625, -8.0777587890625, -7.7529296875, -7.4281005859375, -7.103271484375, -6.7784423828125, -6.45361328125, -6.1287841796875, -5.803955078125, -5.4791259765625, -5.154296875, -4.8294677734375, -4.504638671875, -4.1798095703125, -3.85498046875, -3.5301513671875, -3.205322265625, -2.8804931640625, -2.5556640625, -2.2308349609375, -1.906005859375, -1.5811767578125, -1.25634765625, -0.9315185546875, -0.606689453125, -0.2818603515625, 0.04296875, 0.3677978515625, 0.692626953125, 1.0174560546875, 1.34228515625, 1.6671142578125, 1.991943359375, 2.3167724609375, 2.6416015625, 2.9664306640625, 3.291259765625, 3.6160888671875, 3.94091796875, 4.2657470703125, 4.590576171875, 4.9154052734375, 5.240234375, 5.5650634765625, 5.889892578125, 6.2147216796875, 6.53955078125, 6.8643798828125, 7.189208984375, 7.5140380859375, 7.8388671875, 8.1636962890625, 8.488525390625, 8.8133544921875, 9.13818359375, 9.4630126953125, 9.787841796875, 10.1126708984375, 10.4375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 10.0, 5.0, 11.0, 10.0, 13.0, 10.0, 13.0, 15.0, 19.0, 18.0, 24.0, 44.0, 41.0, 40.0, 56.0, 40.0, 52.0, 51.0, 45.0, 57.0, 55.0, 57.0, 44.0, 42.0, 34.0, 27.0, 32.0, 31.0, 17.0, 20.0, 16.0, 12.0, 14.0, 8.0, 3.0, 2.0, 6.0, 3.0, 5.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.030609130859375, -0.02963876724243164, -0.02866840362548828, -0.027698040008544922, -0.026727676391601562, -0.025757312774658203, -0.024786949157714844, -0.023816585540771484, -0.022846221923828125, -0.021875858306884766, -0.020905494689941406, -0.019935131072998047, -0.018964767456054688, -0.017994403839111328, -0.01702404022216797, -0.01605367660522461, -0.01508331298828125, -0.01411294937133789, -0.013142585754394531, -0.012172222137451172, -0.011201858520507812, -0.010231494903564453, -0.009261131286621094, -0.008290767669677734, -0.007320404052734375, -0.006350040435791016, -0.005379676818847656, -0.004409313201904297, -0.0034389495849609375, -0.002468585968017578, -0.0014982223510742188, -0.0005278587341308594, 0.0004425048828125, 0.0014128684997558594, 0.0023832321166992188, 0.003353595733642578, 0.0043239593505859375, 0.005294322967529297, 0.006264686584472656, 0.007235050201416016, 0.008205413818359375, 0.009175777435302734, 0.010146141052246094, 0.011116504669189453, 0.012086868286132812, 0.013057231903076172, 0.014027595520019531, 0.01499795913696289, 0.01596832275390625, 0.01693868637084961, 0.01790904998779297, 0.018879413604736328, 0.019849777221679688, 0.020820140838623047, 0.021790504455566406, 0.022760868072509766, 0.023731231689453125, 0.024701595306396484, 0.025671958923339844, 0.026642322540283203, 0.027612686157226562, 0.028583049774169922, 0.02955341339111328, 0.03052377700805664, 0.031494140625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 6.0, 14.0, 10.0, 15.0, 15.0, 22.0, 31.0, 43.0, 52.0, 84.0, 77.0, 132.0, 188.0, 231.0, 349.0, 509.0, 792.0, 1542.0, 3631.0, 11118.0, 42502.0, 190422.0, 501171.0, 224431.0, 50017.0, 12730.0, 4054.0, 1724.0, 823.0, 522.0, 305.0, 240.0, 166.0, 138.0, 125.0, 85.0, 57.0, 52.0, 29.0, 23.0, 24.0, 14.0, 17.0, 7.0, 7.0, 5.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.2418212890625, -0.23482322692871094, -0.22782516479492188, -0.2208271026611328, -0.21382904052734375, -0.2068309783935547, -0.19983291625976562, -0.19283485412597656, -0.1858367919921875, -0.17883872985839844, -0.17184066772460938, -0.1648426055908203, -0.15784454345703125, -0.1508464813232422, -0.14384841918945312, -0.13685035705566406, -0.129852294921875, -0.12285423278808594, -0.11585617065429688, -0.10885810852050781, -0.10186004638671875, -0.09486198425292969, -0.08786392211914062, -0.08086585998535156, -0.0738677978515625, -0.06686973571777344, -0.059871673583984375, -0.05287361145019531, -0.04587554931640625, -0.03887748718261719, -0.031879425048828125, -0.024881362915039062, -0.01788330078125, -0.010885238647460938, -0.003887176513671875, 0.0031108856201171875, 0.01010894775390625, 0.017107009887695312, 0.024105072021484375, 0.031103134155273438, 0.0381011962890625, 0.04509925842285156, 0.052097320556640625, 0.05909538269042969, 0.06609344482421875, 0.07309150695800781, 0.08008956909179688, 0.08708763122558594, 0.094085693359375, 0.10108375549316406, 0.10808181762695312, 0.11507987976074219, 0.12207794189453125, 0.1290760040283203, 0.13607406616210938, 0.14307212829589844, 0.1500701904296875, 0.15706825256347656, 0.16406631469726562, 0.1710643768310547, 0.17806243896484375, 0.1850605010986328, 0.19205856323242188, 0.19905662536621094, 0.2060546875]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 0.0, 3.0, 2.0, 5.0, 5.0, 10.0, 15.0, 36.0, 52.0, 53.0, 90.0, 90.0, 103.0, 125.0, 96.0, 87.0, 76.0, 45.0, 48.0, 19.0, 21.0, 12.0, 3.0, 8.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01844477280974388, -0.017304755747318268, -0.016164736822247505, -0.015024719759821892, -0.01388470083475113, -0.012744683772325516, -0.011604665778577328, -0.01046464778482914, -0.009324629791080952, -0.008184611797332764, -0.007044593803584576, -0.005904576275497675, -0.004764558281749487, -0.003624540288001299, -0.002484522759914398, -0.0013445047661662102, -0.00020448677241802216, 0.000935531104914844, 0.0020755489822477102, 0.0032155667431652546, 0.004355584736913443, 0.005495602730661631, 0.006635620258748531, 0.007775638252496719, 0.008915656246244907, 0.010055674239993095, 0.011195692233741283, 0.012335710227489471, 0.013475727289915085, 0.014615746214985847, 0.01575576327741146, 0.016895782202482224, 0.018035799264907837, 0.01917581632733345, 0.020315835252404213, 0.021455852314829826, 0.02259587123990059, 0.023735888302326202, 0.024875905364751816, 0.02601592428982258, 0.02715594321489334, 0.028295960277318954, 0.029435979202389717, 0.03057599626481533, 0.03171601518988609, 0.03285603225231171, 0.03399604931473732, 0.03513606637716293, 0.036276087164878845, 0.03741610422730446, 0.03855612128973007, 0.039696142077445984, 0.0408361591398716, 0.04197617620229721, 0.043116193264722824, 0.04425621032714844, 0.04539622738957405, 0.046536244451999664, 0.04767626151442528, 0.04881628230214119, 0.0499562993645668, 0.051096316426992416, 0.05223633348941803, 0.05337635427713394, 0.054516371339559555]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 5.0, 2.0, 3.0, 2.0, 2.0, 5.0, 3.0, 9.0, 9.0, 12.0, 9.0, 16.0, 17.0, 14.0, 27.0, 28.0, 19.0, 28.0, 23.0, 30.0, 30.0, 34.0, 32.0, 32.0, 48.0, 39.0, 45.0, 37.0, 41.0, 23.0, 22.0, 32.0, 34.0, 34.0, 27.0, 27.0, 19.0, 21.0, 28.0, 15.0, 19.0, 21.0, 12.0, 11.0, 9.0, 11.0, 6.0, 8.0, 8.0, 6.0, 4.0, 2.0, 7.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.014528036117553711, -0.014067028649151325, -0.01360602118074894, -0.013145013712346554, -0.012684006243944168, -0.012222998775541782, -0.011761991307139397, -0.011300983838737011, -0.010839976370334625, -0.01037896890193224, -0.009917961433529854, -0.009456953965127468, -0.008995946496725082, -0.008534939028322697, -0.008073931559920311, -0.007612924091517925, -0.0071519166231155396, -0.006690909154713154, -0.006229901686310768, -0.005768894217908382, -0.005307886749505997, -0.004846879281103611, -0.004385871812701225, -0.00392486434429884, -0.003463856875896454, -0.003002849407494068, -0.0025418419390916824, -0.0020808344706892967, -0.001619827002286911, -0.0011588195338845253, -0.0006978120654821396, -0.00023680459707975388, 0.00022420287132263184, 0.0006852103397250175, 0.0011462178081274033, 0.001607225276529789, 0.0020682327449321747, 0.0025292402133345604, 0.002990247681736946, 0.003451255150139332, 0.0039122626185417175, 0.004373270086944103, 0.004834277555346489, 0.005295285023748875, 0.00575629249215126, 0.006217299960553646, 0.006678307428956032, 0.0071393148973584175, 0.007600322365760803, 0.008061329834163189, 0.008522337302565575, 0.00898334477096796, 0.009444352239370346, 0.009905359707772732, 0.010366367176175117, 0.010827374644577503, 0.011288382112979889, 0.011749389581382275, 0.01221039704978466, 0.012671404518187046, 0.013132411986589432, 0.013593419454991817, 0.014054426923394203, 0.014515434391796589, 0.014976441860198975]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 7.0, 10.0, 4.0, 16.0, 15.0, 12.0, 32.0, 28.0, 42.0, 44.0, 53.0, 56.0, 67.0, 51.0, 64.0, 58.0, 63.0, 52.0, 48.0, 47.0, 45.0, 30.0, 35.0, 25.0, 28.0, 22.0, 13.0, 16.0, 5.0, 7.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-106.375, -102.58984375, -98.8046875, -95.01953125, -91.234375, -87.44921875, -83.6640625, -79.87890625, -76.09375, -72.30859375, -68.5234375, -64.73828125, -60.953125, -57.16796875, -53.3828125, -49.59765625, -45.8125, -42.02734375, -38.2421875, -34.45703125, -30.671875, -26.88671875, -23.1015625, -19.31640625, -15.53125, -11.74609375, -7.9609375, -4.17578125, -0.390625, 3.39453125, 7.1796875, 10.96484375, 14.75, 18.53515625, 22.3203125, 26.10546875, 29.890625, 33.67578125, 37.4609375, 41.24609375, 45.03125, 48.81640625, 52.6015625, 56.38671875, 60.171875, 63.95703125, 67.7421875, 71.52734375, 75.3125, 79.09765625, 82.8828125, 86.66796875, 90.453125, 94.23828125, 98.0234375, 101.80859375, 105.59375, 109.37890625, 113.1640625, 116.94921875, 120.734375, 124.51953125, 128.3046875, 132.08984375, 135.875]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 12.0, 12.0, 9.0, 18.0, 25.0, 39.0, 51.0, 91.0, 157.0, 275.0, 579.0, 1297.0, 3189.0, 9144.0, 45492.0, 524672.0, 413198.0, 36994.0, 8074.0, 2846.0, 1182.0, 531.0, 268.0, 146.0, 92.0, 58.0, 35.0, 28.0, 20.0, 9.0, 9.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-28.84375, -27.7734375, -26.703125, -25.6328125, -24.5625, -23.4921875, -22.421875, -21.3515625, -20.28125, -19.2109375, -18.140625, -17.0703125, -16.0, -14.9296875, -13.859375, -12.7890625, -11.71875, -10.6484375, -9.578125, -8.5078125, -7.4375, -6.3671875, -5.296875, -4.2265625, -3.15625, -2.0859375, -1.015625, 0.0546875, 1.125, 2.1953125, 3.265625, 4.3359375, 5.40625, 6.4765625, 7.546875, 8.6171875, 9.6875, 10.7578125, 11.828125, 12.8984375, 13.96875, 15.0390625, 16.109375, 17.1796875, 18.25, 19.3203125, 20.390625, 21.4609375, 22.53125, 23.6015625, 24.671875, 25.7421875, 26.8125, 27.8828125, 28.953125, 30.0234375, 31.09375, 32.1640625, 33.234375, 34.3046875, 35.375, 36.4453125, 37.515625, 38.5859375, 39.65625]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 3.0, 5.0, 10.0, 15.0, 16.0, 11.0, 32.0, 34.0, 48.0, 49.0, 59.0, 72.0, 67.0, 2044.0, 175.0, 68.0, 72.0, 48.0, 58.0, 39.0, 36.0, 23.0, 16.0, 9.0, 16.0, 7.0, 5.0, 3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-225.5, -219.037109375, -212.57421875, -206.111328125, -199.6484375, -193.185546875, -186.72265625, -180.259765625, -173.796875, -167.333984375, -160.87109375, -154.408203125, -147.9453125, -141.482421875, -135.01953125, -128.556640625, -122.09375, -115.630859375, -109.16796875, -102.705078125, -96.2421875, -89.779296875, -83.31640625, -76.853515625, -70.390625, -63.927734375, -57.46484375, -51.001953125, -44.5390625, -38.076171875, -31.61328125, -25.150390625, -18.6875, -12.224609375, -5.76171875, 0.701171875, 7.1640625, 13.626953125, 20.08984375, 26.552734375, 33.015625, 39.478515625, 45.94140625, 52.404296875, 58.8671875, 65.330078125, 71.79296875, 78.255859375, 84.71875, 91.181640625, 97.64453125, 104.107421875, 110.5703125, 117.033203125, 123.49609375, 129.958984375, 136.421875, 142.884765625, 149.34765625, 155.810546875, 162.2734375, 168.736328125, 175.19921875, 181.662109375, 188.125]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 8.0, 8.0, 10.0, 14.0, 28.0, 35.0, 57.0, 88.0, 141.0, 237.0, 427.0, 998.0, 2815.0, 18116.0, 2737427.0, 369077.0, 12156.0, 2202.0, 840.0, 389.0, 243.0, 133.0, 71.0, 53.0, 39.0, 24.0, 19.0, 11.0, 9.0, 6.0, 3.0, 3.0, 0.0, 1.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.34375, -48.6611328125, -46.978515625, -45.2958984375, -43.61328125, -41.9306640625, -40.248046875, -38.5654296875, -36.8828125, -35.2001953125, -33.517578125, -31.8349609375, -30.15234375, -28.4697265625, -26.787109375, -25.1044921875, -23.421875, -21.7392578125, -20.056640625, -18.3740234375, -16.69140625, -15.0087890625, -13.326171875, -11.6435546875, -9.9609375, -8.2783203125, -6.595703125, -4.9130859375, -3.23046875, -1.5478515625, 0.134765625, 1.8173828125, 3.5, 5.1826171875, 6.865234375, 8.5478515625, 10.23046875, 11.9130859375, 13.595703125, 15.2783203125, 16.9609375, 18.6435546875, 20.326171875, 22.0087890625, 23.69140625, 25.3740234375, 27.056640625, 28.7392578125, 30.421875, 32.1044921875, 33.787109375, 35.4697265625, 37.15234375, 38.8349609375, 40.517578125, 42.2001953125, 43.8828125, 45.5654296875, 47.248046875, 48.9306640625, 50.61328125, 52.2958984375, 53.978515625, 55.6611328125, 57.34375]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 7.0, 8.0, 12.0, 16.0, 33.0, 62.0, 114.0, 150.0, 180.0, 147.0, 99.0, 57.0, 39.0, 25.0, 21.0, 6.0, 4.0, 7.0, 0.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-126.16494750976562, -118.51383972167969, -110.86273193359375, -103.21162414550781, -95.56050872802734, -87.9094009399414, -80.25829315185547, -72.607177734375, -64.95606994628906, -57.304962158203125, -49.65385055541992, -42.002742767333984, -34.35163116455078, -26.700523376464844, -19.049415588378906, -11.398303985595703, -3.7472000122070312, 3.903909206390381, 11.555018424987793, 19.206127166748047, 26.857236862182617, 34.50834655761719, 42.159454345703125, 49.81056594848633, 57.461673736572266, 65.11278533935547, 72.7638931274414, 80.41500091552734, 88.06610870361328, 95.71722412109375, 103.36833190917969, 111.01943969726562, 118.67054748535156, 126.3216552734375, 133.97276306152344, 141.62387084960938, 149.2749786376953, 156.92608642578125, 164.57720947265625, 172.2283172607422, 179.87942504882812, 187.53053283691406, 195.181640625, 202.83274841308594, 210.48385620117188, 218.13497924804688, 225.78607177734375, 233.43719482421875, 241.08828735351562, 248.73939514160156, 256.3905029296875, 264.0416259765625, 271.6927185058594, 279.3438415527344, 286.99493408203125, 294.64605712890625, 302.29718017578125, 309.94830322265625, 317.5993957519531, 325.2505187988281, 332.901611328125, 340.552734375, 348.2038269042969, 355.8549499511719, 363.50604248046875]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 4.0, 3.0, 7.0, 12.0, 13.0, 11.0, 13.0, 19.0, 13.0, 27.0, 32.0, 26.0, 31.0, 39.0, 31.0, 38.0, 37.0, 58.0, 53.0, 50.0, 51.0, 46.0, 48.0, 31.0, 45.0, 50.0, 36.0, 26.0, 24.0, 23.0, 23.0, 14.0, 8.0, 12.0, 11.0, 15.0, 4.0, 4.0, 2.0, 5.0, 0.0, 1.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-191.43292236328125, -185.52383422851562, -179.61473083496094, -173.7056427001953, -167.7965545654297, -161.887451171875, -155.97836303710938, -150.06927490234375, -144.16017150878906, -138.25108337402344, -132.34197998046875, -126.43289184570312, -120.52379608154297, -114.61470031738281, -108.70561218261719, -102.79651641845703, -96.8874282836914, -90.97833251953125, -85.06924438476562, -79.16014862060547, -73.25105285644531, -67.34196472167969, -61.43286895751953, -55.523773193359375, -49.614681243896484, -43.705589294433594, -37.79649353027344, -31.887401580810547, -25.978307723999023, -20.0692138671875, -14.16012191772461, -8.251026153564453, -2.3419342041015625, 3.5671591758728027, 9.476252555847168, 15.385345458984375, 21.2944393157959, 27.203533172607422, 33.11262512207031, 39.02172088623047, 44.93081283569336, 50.83990478515625, 56.749000549316406, 62.6580924987793, 68.56718444824219, 74.47628021240234, 80.3853759765625, 86.29446411132812, 92.20355987548828, 98.11265563964844, 104.02174377441406, 109.93083953857422, 115.83993530273438, 121.7490234375, 127.65811920166016, 133.5672149658203, 139.47630310058594, 145.38539123535156, 151.29449462890625, 157.20358276367188, 163.1126708984375, 169.0217742919922, 174.9308624267578, 180.8399658203125, 186.74905395507812]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 2.0, 7.0, 9.0, 14.0, 15.0, 21.0, 22.0, 29.0, 51.0, 53.0, 76.0, 114.0, 152.0, 202.0, 246.0, 341.0, 440.0, 702.0, 867.0, 1457.0, 1039955.0, 1045.0, 696.0, 537.0, 361.0, 287.0, 218.0, 161.0, 113.0, 81.0, 73.0, 46.0, 32.0, 36.0, 23.0, 21.0, 13.0, 9.0, 11.0, 8.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-57.93876647949219, -56.01939392089844, -54.10002517700195, -52.1806526184082, -50.26128387451172, -48.34191131591797, -46.42253875732422, -44.503170013427734, -42.58380126953125, -40.6644287109375, -38.745059967041016, -36.825687408447266, -34.90631866455078, -32.98694610595703, -31.067575454711914, -29.148204803466797, -27.228832244873047, -25.30946159362793, -23.390090942382812, -21.470718383789062, -19.551349639892578, -17.631977081298828, -15.712606430053711, -13.793235778808594, -11.873865127563477, -9.95449447631836, -8.035123825073242, -6.115752220153809, -4.196381568908691, -2.277010917663574, -0.3576393127441406, 1.5617313385009766, 3.4811019897460938, 5.400472640991211, 7.319843769073486, 9.239214897155762, 11.158585548400879, 13.077956199645996, 14.99732780456543, 16.916698455810547, 18.836069107055664, 20.75543975830078, 22.6748104095459, 24.594181060791016, 26.513553619384766, 28.43292236328125, 30.352294921875, 32.27166748046875, 34.191036224365234, 36.110408782958984, 38.02977752685547, 39.94915008544922, 41.8685188293457, 43.78789138793945, 45.70726013183594, 47.62663269042969, 49.54600524902344, 51.46537780761719, 53.38474655151367, 55.30411911010742, 57.223487854003906, 59.142860412597656, 61.062232971191406, 62.98160171508789, 64.90097045898438]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 9.0, 10.0, 17.0, 16.0, 76.0, 51462660.0, 265.0, 42.0, 10.0, 7.0, 3.0, 6.0, 10.0, 3.0, 5.0, 3.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8721.494140625, -8321.30078125, -7921.10693359375, -7520.9130859375, -7120.71923828125, -6720.525390625, -6320.33203125, -5920.13818359375, -5519.9443359375, -5119.75048828125, -4719.55712890625, -4319.36328125, -3919.16943359375, -3518.975830078125, -3118.7822265625, -2718.58837890625, -2318.39501953125, -1918.2012939453125, -1518.007568359375, -1117.81396484375, -717.6202392578125, -317.426513671875, 82.76708984375, 482.9609375, 883.154541015625, 1283.3482666015625, 1683.5419921875, 2083.735595703125, 2483.92919921875, 2884.123046875, 3284.316650390625, 3684.510498046875, 4084.7041015625, 4484.89794921875, 4885.09130859375, 5285.28515625, 5685.47900390625, 6085.6728515625, 6485.8662109375, 6886.06005859375, 7286.25390625, 7686.44775390625, 8086.64111328125, 8486.8349609375, 8887.0283203125, 9287.22265625, 9687.416015625, 10087.609375, 10487.802734375, 10887.99609375, 11288.1904296875, 11688.3837890625, 12088.5771484375, 12488.771484375, 12888.96484375, 13289.158203125, 13689.3525390625, 14089.5458984375, 14489.740234375, 14889.93359375, 15290.126953125, 15690.3212890625, 16090.5146484375, 16490.708984375, 16890.90234375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 9.0, 21.0, 30.0, 61.0, 109.0, 138.0, 196.0, 314.0, 470.0, 695.0, 1184.0, 1798.0, 2703.0, 4017.0, 6259.0, 9713.0, 14591.0, 22522.0, 34818.0, 54802.0, 86788.0, 139914.0, 232729.0, 406592.0, 3392931.0, 992043.0, 348886.0, 202189.0, 122727.0, 76460.0, 47335.0, 30847.0, 20001.0, 12837.0, 8549.0, 5589.0, 3727.0, 2430.0, 1562.0, 974.0, 702.0, 414.0, 258.0, 173.0, 109.0, 75.0, 54.0, 36.0, 26.0, 15.0, 8.0, 3.0, 1.0, 1.0, 2.0], "bins": [-4.92578125, -4.78033447265625, -4.6348876953125, -4.48944091796875, -4.343994140625, -4.19854736328125, -4.0531005859375, -3.90765380859375, -3.76220703125, -3.61676025390625, -3.4713134765625, -3.32586669921875, -3.180419921875, -3.03497314453125, -2.8895263671875, -2.74407958984375, -2.5986328125, -2.45318603515625, -2.3077392578125, -2.16229248046875, -2.016845703125, -1.87139892578125, -1.7259521484375, -1.58050537109375, -1.43505859375, -1.28961181640625, -1.1441650390625, -0.99871826171875, -0.853271484375, -0.70782470703125, -0.5623779296875, -0.41693115234375, -0.271484375, -0.12603759765625, 0.0194091796875, 0.16485595703125, 0.310302734375, 0.45574951171875, 0.6011962890625, 0.74664306640625, 0.89208984375, 1.03753662109375, 1.1829833984375, 1.32843017578125, 1.473876953125, 1.61932373046875, 1.7647705078125, 1.91021728515625, 2.0556640625, 2.20111083984375, 2.3465576171875, 2.49200439453125, 2.637451171875, 2.78289794921875, 2.9283447265625, 3.07379150390625, 3.21923828125, 3.36468505859375, 3.5101318359375, 3.65557861328125, 3.801025390625, 3.94647216796875, 4.0919189453125, 4.23736572265625, 4.3828125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 6.0, 3.0, 4.0, 2.0, 7.0, 11.0, 11.0, 11.0, 16.0, 10.0, 20.0, 20.0, 21.0, 32.0, 32.0, 30.0, 41.0, 30.0, 46.0, 40.0, 34.0, 70.0, 384.0, 646.0, 84.0, 41.0, 56.0, 40.0, 32.0, 27.0, 31.0, 30.0, 26.0, 19.0, 23.0, 16.0, 12.0, 16.0, 14.0, 6.0, 4.0, 7.0, 7.0, 5.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-20.21875, -19.6259765625, -19.033203125, -18.4404296875, -17.84765625, -17.2548828125, -16.662109375, -16.0693359375, -15.4765625, -14.8837890625, -14.291015625, -13.6982421875, -13.10546875, -12.5126953125, -11.919921875, -11.3271484375, -10.734375, -10.1416015625, -9.548828125, -8.9560546875, -8.36328125, -7.7705078125, -7.177734375, -6.5849609375, -5.9921875, -5.3994140625, -4.806640625, -4.2138671875, -3.62109375, -3.0283203125, -2.435546875, -1.8427734375, -1.25, -0.6572265625, -0.064453125, 0.5283203125, 1.12109375, 1.7138671875, 2.306640625, 2.8994140625, 3.4921875, 4.0849609375, 4.677734375, 5.2705078125, 5.86328125, 6.4560546875, 7.048828125, 7.6416015625, 8.234375, 8.8271484375, 9.419921875, 10.0126953125, 10.60546875, 11.1982421875, 11.791015625, 12.3837890625, 12.9765625, 13.5693359375, 14.162109375, 14.7548828125, 15.34765625, 15.9404296875, 16.533203125, 17.1259765625, 17.71875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 6.0, 7.0, 10.0, 22.0, 31.0, 43.0, 78.0, 146.0, 154.0, 312.0, 412.0, 638.0, 966.0, 1529.0, 2219.0, 3538.0, 5360.0, 8347.0, 12968.0, 20764.0, 33978.0, 57850.0, 100229.0, 185808.0, 375829.0, 2399949.0, 2272874.0, 373646.0, 185089.0, 100440.0, 56796.0, 33910.0, 20874.0, 12833.0, 8355.0, 5276.0, 3452.0, 2286.0, 1522.0, 985.0, 660.0, 453.0, 282.0, 184.0, 112.0, 71.0, 38.0, 35.0, 21.0, 14.0, 18.0, 9.0, 5.0, 3.0, 4.0], "bins": [-6.84375, -6.648193359375, -6.45263671875, -6.257080078125, -6.0615234375, -5.865966796875, -5.67041015625, -5.474853515625, -5.279296875, -5.083740234375, -4.88818359375, -4.692626953125, -4.4970703125, -4.301513671875, -4.10595703125, -3.910400390625, -3.71484375, -3.519287109375, -3.32373046875, -3.128173828125, -2.9326171875, -2.737060546875, -2.54150390625, -2.345947265625, -2.150390625, -1.954833984375, -1.75927734375, -1.563720703125, -1.3681640625, -1.172607421875, -0.97705078125, -0.781494140625, -0.5859375, -0.390380859375, -0.19482421875, 0.000732421875, 0.1962890625, 0.391845703125, 0.58740234375, 0.782958984375, 0.978515625, 1.174072265625, 1.36962890625, 1.565185546875, 1.7607421875, 1.956298828125, 2.15185546875, 2.347412109375, 2.54296875, 2.738525390625, 2.93408203125, 3.129638671875, 3.3251953125, 3.520751953125, 3.71630859375, 3.911865234375, 4.107421875, 4.302978515625, 4.49853515625, 4.694091796875, 4.8896484375, 5.085205078125, 5.28076171875, 5.476318359375, 5.671875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 12.0, 8.0, 4.0, 13.0, 13.0, 13.0, 7.0, 18.0, 19.0, 12.0, 25.0, 29.0, 30.0, 33.0, 34.0, 40.0, 40.0, 46.0, 78.0, 183.0, 668.0, 211.0, 68.0, 59.0, 38.0, 48.0, 33.0, 30.0, 38.0, 21.0, 24.0, 23.0, 20.0, 15.0, 22.0, 5.0, 13.0, 7.0, 5.0, 5.0, 5.0, 3.0, 5.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.2265625, -10.8330078125, -10.439453125, -10.0458984375, -9.65234375, -9.2587890625, -8.865234375, -8.4716796875, -8.078125, -7.6845703125, -7.291015625, -6.8974609375, -6.50390625, -6.1103515625, -5.716796875, -5.3232421875, -4.9296875, -4.5361328125, -4.142578125, -3.7490234375, -3.35546875, -2.9619140625, -2.568359375, -2.1748046875, -1.78125, -1.3876953125, -0.994140625, -0.6005859375, -0.20703125, 0.1865234375, 0.580078125, 0.9736328125, 1.3671875, 1.7607421875, 2.154296875, 2.5478515625, 2.94140625, 3.3349609375, 3.728515625, 4.1220703125, 4.515625, 4.9091796875, 5.302734375, 5.6962890625, 6.08984375, 6.4833984375, 6.876953125, 7.2705078125, 7.6640625, 8.0576171875, 8.451171875, 8.8447265625, 9.23828125, 9.6318359375, 10.025390625, 10.4189453125, 10.8125, 11.2060546875, 11.599609375, 11.9931640625, 12.38671875, 12.7802734375, 13.173828125, 13.5673828125, 13.9609375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 5.0, 4.0, 9.0, 9.0, 18.0, 16.0, 35.0, 49.0, 63.0, 70.0, 94.0, 107.0, 180.0, 213.0, 342.0, 497.0, 574.0, 738.0, 1108.0, 1653.0, 2593.0, 4234.0, 7705.0, 15977.0, 41997.0, 198570.0, 5873840.0, 87211.0, 26170.0, 11059.0, 5854.0, 3446.0, 2099.0, 1392.0, 906.0, 616.0, 494.0, 384.0, 292.0, 191.0, 132.0, 109.0, 89.0, 85.0, 69.0, 45.0, 34.0, 18.0, 11.0, 9.0, 8.0, 6.0, 4.0, 4.0, 5.0, 2.0, 2.0], "bins": [-19.5625, -18.974609375, -18.38671875, -17.798828125, -17.2109375, -16.623046875, -16.03515625, -15.447265625, -14.859375, -14.271484375, -13.68359375, -13.095703125, -12.5078125, -11.919921875, -11.33203125, -10.744140625, -10.15625, -9.568359375, -8.98046875, -8.392578125, -7.8046875, -7.216796875, -6.62890625, -6.041015625, -5.453125, -4.865234375, -4.27734375, -3.689453125, -3.1015625, -2.513671875, -1.92578125, -1.337890625, -0.75, -0.162109375, 0.42578125, 1.013671875, 1.6015625, 2.189453125, 2.77734375, 3.365234375, 3.953125, 4.541015625, 5.12890625, 5.716796875, 6.3046875, 6.892578125, 7.48046875, 8.068359375, 8.65625, 9.244140625, 9.83203125, 10.419921875, 11.0078125, 11.595703125, 12.18359375, 12.771484375, 13.359375, 13.947265625, 14.53515625, 15.123046875, 15.7109375, 16.298828125, 16.88671875, 17.474609375, 18.0625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 6.0, 9.0, 4.0, 7.0, 7.0, 12.0, 13.0, 11.0, 14.0, 17.0, 18.0, 26.0, 21.0, 35.0, 41.0, 38.0, 36.0, 37.0, 64.0, 101.0, 304.0, 528.0, 165.0, 87.0, 65.0, 50.0, 46.0, 45.0, 36.0, 28.0, 18.0, 21.0, 21.0, 15.0, 10.0, 21.0, 14.0, 9.0, 5.0, 7.0, 10.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.3828125, -9.1009521484375, -8.819091796875, -8.5372314453125, -8.25537109375, -7.9735107421875, -7.691650390625, -7.4097900390625, -7.1279296875, -6.8460693359375, -6.564208984375, -6.2823486328125, -6.00048828125, -5.7186279296875, -5.436767578125, -5.1549072265625, -4.873046875, -4.5911865234375, -4.309326171875, -4.0274658203125, -3.74560546875, -3.4637451171875, -3.181884765625, -2.9000244140625, -2.6181640625, -2.3363037109375, -2.054443359375, -1.7725830078125, -1.49072265625, -1.2088623046875, -0.927001953125, -0.6451416015625, -0.36328125, -0.0814208984375, 0.200439453125, 0.4822998046875, 0.76416015625, 1.0460205078125, 1.327880859375, 1.6097412109375, 1.8916015625, 2.1734619140625, 2.455322265625, 2.7371826171875, 3.01904296875, 3.3009033203125, 3.582763671875, 3.8646240234375, 4.146484375, 4.4283447265625, 4.710205078125, 4.9920654296875, 5.27392578125, 5.5557861328125, 5.837646484375, 6.1195068359375, 6.4013671875, 6.6832275390625, 6.965087890625, 7.2469482421875, 7.52880859375, 7.8106689453125, 8.092529296875, 8.3743896484375, 8.65625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 3.0, 16.0, 18.0, 39.0, 85.0, 178.0, 290.0, 174.0, 95.0, 45.0, 23.0, 10.0, 12.0, 6.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.56217384338379, -16.615549087524414, -15.668924331665039, -14.72230052947998, -13.775675773620605, -12.82905101776123, -11.882427215576172, -10.935802459716797, -9.989177703857422, -9.042552947998047, -8.095928192138672, -7.149304389953613, -6.202679634094238, -5.256054878234863, -4.3094305992126465, -3.3628063201904297, -2.4161815643310547, -1.4695570468902588, -0.5229325294494629, 0.423691987991333, 1.370316505432129, 2.316941261291504, 3.2635655403137207, 4.2101898193359375, 5.1568145751953125, 6.1034393310546875, 7.050063610076904, 7.996687889099121, 8.943312644958496, 9.889937400817871, 10.83656120300293, 11.783185958862305, 12.729808807373047, 13.676433563232422, 14.623058319091797, 15.569682121276855, 16.516307830810547, 17.462932586669922, 18.409555435180664, 19.35618019104004, 20.302804946899414, 21.24942970275879, 22.196054458618164, 23.14267921447754, 24.08930206298828, 25.035926818847656, 25.98255157470703, 26.929176330566406, 27.87580108642578, 28.822425842285156, 29.76905059814453, 30.715675354003906, 31.66230010986328, 32.608924865722656, 33.55554962158203, 34.502174377441406, 35.44879913330078, 36.395423889160156, 37.34204864501953, 38.288673400878906, 39.23529815673828, 40.181922912597656, 41.12854766845703, 42.075172424316406, 43.021793365478516]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 5.0, 5.0, 2.0, 5.0, 8.0, 5.0, 6.0, 6.0, 9.0, 13.0, 14.0, 19.0, 10.0, 10.0, 18.0, 24.0, 28.0, 31.0, 25.0, 21.0, 34.0, 29.0, 31.0, 38.0, 29.0, 39.0, 35.0, 30.0, 39.0, 38.0, 21.0, 32.0, 44.0, 28.0, 21.0, 28.0, 19.0, 24.0, 19.0, 17.0, 20.0, 15.0, 21.0, 19.0, 6.0, 16.0, 9.0, 13.0, 7.0, 5.0, 5.0, 7.0, 2.0, 3.0, 7.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-9.99074935913086, -9.672858238220215, -9.35496711730957, -9.037075996398926, -8.719184875488281, -8.40129280090332, -8.083401679992676, -7.765510559082031, -7.447619438171387, -7.129728317260742, -6.811837196350098, -6.493945598602295, -6.17605447769165, -5.858163356781006, -5.540271759033203, -5.222380638122559, -4.904489517211914, -4.5865983963012695, -4.268707275390625, -3.9508156776428223, -3.6329245567321777, -3.315033435821533, -2.9971420764923096, -2.679250717163086, -2.3613595962524414, -2.043468475341797, -1.7255771160125732, -1.4076858758926392, -1.089794635772705, -0.771903395652771, -0.4540121555328369, -0.13612079620361328, 0.18177032470703125, 0.49966156482696533, 0.8175528049468994, 1.1354440450668335, 1.4533352851867676, 1.7712265253067017, 2.0891177654266357, 2.4070091247558594, 2.724900245666504, 3.0427913665771484, 3.360682725906372, 3.6785740852355957, 3.9964652061462402, 4.314356327056885, 4.6322479248046875, 4.950139045715332, 5.268030166625977, 5.585921287536621, 5.903812408447266, 6.221704006195068, 6.539595127105713, 6.857486248016357, 7.17537784576416, 7.493268966674805, 7.811160087585449, 8.129051208496094, 8.446942329406738, 8.764833450317383, 9.082725524902344, 9.400616645812988, 9.718507766723633, 10.036398887634277, 10.354290008544922]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 7.0, 9.0, 10.0, 27.0, 27.0, 59.0, 106.0, 106.0, 218.0, 297.0, 474.0, 705.0, 1093.0, 1495.0, 2349.0, 3567.0, 5844.0, 10844.0, 23964.0, 70985.0, 3841268.0, 155699.0, 38770.0, 16246.0, 8012.0, 4407.0, 2577.0, 1609.0, 1018.0, 709.0, 480.0, 350.0, 253.0, 175.0, 125.0, 86.0, 71.0, 56.0, 47.0, 38.0, 32.0, 18.0, 12.0, 12.0, 10.0, 8.0, 3.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2288818359375, -0.2196216583251953, -0.21036148071289062, -0.20110130310058594, -0.19184112548828125, -0.18258094787597656, -0.17332077026367188, -0.1640605926513672, -0.1548004150390625, -0.1455402374267578, -0.13628005981445312, -0.12701988220214844, -0.11775970458984375, -0.10849952697753906, -0.09923934936523438, -0.08997917175292969, -0.080718994140625, -0.07145881652832031, -0.062198638916015625, -0.05293846130371094, -0.04367828369140625, -0.03441810607910156, -0.025157928466796875, -0.015897750854492188, -0.0066375732421875, 0.0026226043701171875, 0.011882781982421875, 0.021142959594726562, 0.03040313720703125, 0.03966331481933594, 0.048923492431640625, 0.05818367004394531, 0.06744384765625, 0.07670402526855469, 0.08596420288085938, 0.09522438049316406, 0.10448455810546875, 0.11374473571777344, 0.12300491333007812, 0.1322650909423828, 0.1415252685546875, 0.1507854461669922, 0.16004562377929688, 0.16930580139160156, 0.17856597900390625, 0.18782615661621094, 0.19708633422851562, 0.2063465118408203, 0.215606689453125, 0.2248668670654297, 0.23412704467773438, 0.24338722229003906, 0.25264739990234375, 0.26190757751464844, 0.2711677551269531, 0.2804279327392578, 0.2896881103515625, 0.2989482879638672, 0.3082084655761719, 0.31746864318847656, 0.32672882080078125, 0.33598899841308594, 0.3452491760253906, 0.3545093536376953, 0.36376953125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 4.0, 3.0, 4.0, 1.0, 5.0, 2.0, 1.0, 4.0, 1.0, 8.0, 13.0, 11.0, 20.0, 15.0, 11.0, 778.0, 20.0, 13.0, 14.0, 11.0, 17.0, 7.0, 11.0, 4.0, 8.0, 2.0, 1.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.031890869140625, -0.030734539031982422, -0.029578208923339844, -0.028421878814697266, -0.027265548706054688, -0.02610921859741211, -0.02495288848876953, -0.023796558380126953, -0.022640228271484375, -0.021483898162841797, -0.02032756805419922, -0.01917123794555664, -0.018014907836914062, -0.016858577728271484, -0.015702247619628906, -0.014545917510986328, -0.01338958740234375, -0.012233257293701172, -0.011076927185058594, -0.009920597076416016, -0.008764266967773438, -0.007607936859130859, -0.006451606750488281, -0.005295276641845703, -0.004138946533203125, -0.002982616424560547, -0.0018262863159179688, -0.0006699562072753906, 0.0004863739013671875, 0.0016427040100097656, 0.0027990341186523438, 0.003955364227294922, 0.0051116943359375, 0.006268024444580078, 0.007424354553222656, 0.008580684661865234, 0.009737014770507812, 0.01089334487915039, 0.012049674987792969, 0.013206005096435547, 0.014362335205078125, 0.015518665313720703, 0.01667499542236328, 0.01783132553100586, 0.018987655639648438, 0.020143985748291016, 0.021300315856933594, 0.022456645965576172, 0.02361297607421875, 0.024769306182861328, 0.025925636291503906, 0.027081966400146484, 0.028238296508789062, 0.02939462661743164, 0.03055095672607422, 0.0317072868347168, 0.032863616943359375, 0.03401994705200195, 0.03517627716064453, 0.03633260726928711, 0.03748893737792969, 0.038645267486572266, 0.039801597595214844, 0.04095792770385742, 0.0421142578125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 3.0, 5.0, 13.0, 13.0, 10.0, 17.0, 15.0, 12.0, 30.0, 29.0, 38.0, 74.0, 75.0, 106.0, 148.0, 242.0, 480.0, 1100.0, 3042.0, 10611.0, 47841.0, 332242.0, 3320737.0, 405047.0, 54112.0, 12189.0, 3514.0, 1246.0, 468.0, 237.0, 149.0, 110.0, 82.0, 52.0, 50.0, 32.0, 19.0, 28.0, 14.0, 17.0, 9.0, 9.0, 5.0, 3.0, 7.0, 4.0, 3.0, 0.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.329833984375, -0.3190345764160156, -0.30823516845703125, -0.2974357604980469, -0.2866363525390625, -0.2758369445800781, -0.26503753662109375, -0.2542381286621094, -0.243438720703125, -0.23263931274414062, -0.22183990478515625, -0.21104049682617188, -0.2002410888671875, -0.18944168090820312, -0.17864227294921875, -0.16784286499023438, -0.15704345703125, -0.14624404907226562, -0.13544464111328125, -0.12464523315429688, -0.1138458251953125, -0.10304641723632812, -0.09224700927734375, -0.08144760131835938, -0.070648193359375, -0.059848785400390625, -0.04904937744140625, -0.038249969482421875, -0.0274505615234375, -0.016651153564453125, -0.00585174560546875, 0.004947662353515625, 0.0157470703125, 0.026546478271484375, 0.03734588623046875, 0.048145294189453125, 0.0589447021484375, 0.06974411010742188, 0.08054351806640625, 0.09134292602539062, 0.102142333984375, 0.11294174194335938, 0.12374114990234375, 0.13454055786132812, 0.1453399658203125, 0.15613937377929688, 0.16693878173828125, 0.17773818969726562, 0.18853759765625, 0.19933700561523438, 0.21013641357421875, 0.22093582153320312, 0.2317352294921875, 0.24253463745117188, 0.25333404541015625, 0.2641334533691406, 0.274932861328125, 0.2857322692871094, 0.29653167724609375, 0.3073310852050781, 0.3181304931640625, 0.3289299011230469, 0.33972930908203125, 0.3505287170410156, 0.361328125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 3.0, 4.0, 8.0, 10.0, 12.0, 7.0, 13.0, 12.0, 13.0, 30.0, 23.0, 40.0, 45.0, 47.0, 61.0, 67.0, 73.0, 106.0, 124.0, 177.0, 207.0, 338.0, 815.0, 567.0, 297.0, 211.0, 140.0, 123.0, 79.0, 68.0, 68.0, 37.0, 41.0, 46.0, 30.0, 23.0, 23.0, 14.0, 16.0, 17.0, 6.0, 5.0, 6.0, 3.0, 4.0, 7.0, 4.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.051239013671875, -0.049576759338378906, -0.04791450500488281, -0.04625225067138672, -0.044589996337890625, -0.04292774200439453, -0.04126548767089844, -0.039603233337402344, -0.03794097900390625, -0.036278724670410156, -0.03461647033691406, -0.03295421600341797, -0.031291961669921875, -0.02962970733642578, -0.027967453002929688, -0.026305198669433594, -0.0246429443359375, -0.022980690002441406, -0.021318435668945312, -0.01965618133544922, -0.017993927001953125, -0.01633167266845703, -0.014669418334960938, -0.013007164001464844, -0.01134490966796875, -0.009682655334472656, -0.008020401000976562, -0.006358146667480469, -0.004695892333984375, -0.0030336380004882812, -0.0013713836669921875, 0.00029087066650390625, 0.001953125, 0.0036153793334960938, 0.0052776336669921875, 0.006939888000488281, 0.008602142333984375, 0.010264396667480469, 0.011926651000976562, 0.013588905334472656, 0.01525115966796875, 0.016913414001464844, 0.018575668334960938, 0.02023792266845703, 0.021900177001953125, 0.02356243133544922, 0.025224685668945312, 0.026886940002441406, 0.0285491943359375, 0.030211448669433594, 0.03187370300292969, 0.03353595733642578, 0.035198211669921875, 0.03686046600341797, 0.03852272033691406, 0.040184974670410156, 0.04184722900390625, 0.043509483337402344, 0.04517173767089844, 0.04683399200439453, 0.048496246337890625, 0.05015850067138672, 0.05182075500488281, 0.053483009338378906, 0.055145263671875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 8.0, 9.0, 7.0, 11.0, 18.0, 23.0, 34.0, 53.0, 60.0, 93.0, 108.0, 120.0, 124.0, 96.0, 69.0, 42.0, 34.0, 21.0, 22.0, 18.0, 11.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4901188910007477, -0.4759203791618347, -0.46172186732292175, -0.4475233554840088, -0.43332481384277344, -0.4191263020038605, -0.4049277901649475, -0.39072927832603455, -0.3765307664871216, -0.3623322546482086, -0.34813374280929565, -0.3339352011680603, -0.31973668932914734, -0.3055381774902344, -0.2913396656513214, -0.27714115381240845, -0.2629426121711731, -0.24874410033226013, -0.23454557359218597, -0.220347061753273, -0.20614853501319885, -0.1919500231742859, -0.17775151133537292, -0.16355299949645996, -0.1493544727563858, -0.13515596091747284, -0.12095743417739868, -0.10675892233848572, -0.09256040304899216, -0.0783618837594986, -0.06416337192058563, -0.04996485263109207, -0.03576630353927612, -0.02156778611242771, -0.0073692686855793, 0.006829246878623962, 0.021027766168117523, 0.035226285457611084, 0.04942479729652405, 0.06362331658601761, 0.07782183587551117, 0.09202035516500473, 0.10621887445449829, 0.12041738629341125, 0.13461589813232422, 0.14881442487239838, 0.16301293671131134, 0.1772114634513855, 0.19140997529029846, 0.20560848712921143, 0.21980701386928558, 0.23400552570819855, 0.2482040524482727, 0.26240256428718567, 0.27660107612609863, 0.2907995879650116, 0.30499809980392456, 0.3191966116428375, 0.3333951234817505, 0.34759366512298584, 0.3617921769618988, 0.37599068880081177, 0.39018920063972473, 0.4043877124786377, 0.41858625411987305]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 8.0, 5.0, 13.0, 14.0, 16.0, 17.0, 14.0, 24.0, 31.0, 28.0, 30.0, 32.0, 54.0, 40.0, 47.0, 51.0, 32.0, 38.0, 61.0, 53.0, 31.0, 48.0, 51.0, 31.0, 26.0, 44.0, 24.0, 26.0, 18.0, 16.0, 21.0, 9.0, 9.0, 7.0, 4.0, 5.0, 1.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.3213180899620056, -0.3113866150379181, -0.30145516991615295, -0.29152369499206543, -0.2815922498703003, -0.27166077494621277, -0.26172930002212524, -0.2517978549003601, -0.24186637997627258, -0.23193491995334625, -0.22200345993041992, -0.2120719850063324, -0.20214052498340607, -0.19220906496047974, -0.1822776049375534, -0.17234614491462708, -0.16241468489170074, -0.15248322486877441, -0.14255176484584808, -0.13262030482292175, -0.12268882989883423, -0.1127573698759079, -0.10282590985298157, -0.09289444237947464, -0.08296298235654831, -0.07303152233362198, -0.06310005486011505, -0.05316859483718872, -0.04323713108897209, -0.03330566734075546, -0.023374207317829132, -0.013442739844322205, -0.003511279821395874, 0.00642018299549818, 0.016351645812392235, 0.026283107697963715, 0.036214571446180344, 0.04614603519439697, 0.0560774952173233, 0.06600896269083023, 0.07594042271375656, 0.08587188273668289, 0.09580335021018982, 0.10573481023311615, 0.11566627025604248, 0.12559774518013, 0.13552919030189514, 0.14546066522598267, 0.155392125248909, 0.16532358527183533, 0.17525504529476166, 0.185186505317688, 0.1951179802417755, 0.20504944026470184, 0.21498090028762817, 0.2249123752117157, 0.23484382033348083, 0.24477528035640717, 0.2547067403793335, 0.264638215303421, 0.27456966042518616, 0.2845011353492737, 0.2944325804710388, 0.30436405539512634, 0.31429553031921387]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 10.0, 9.0, 12.0, 23.0, 29.0, 35.0, 72.0, 131.0, 183.0, 304.0, 547.0, 991.0, 1984.0, 4686.0, 12710.0, 55555.0, 873227.0, 73423.0, 14636.0, 5234.0, 2276.0, 1080.0, 560.0, 307.0, 166.0, 119.0, 79.0, 47.0, 36.0, 27.0, 10.0, 11.0, 9.0, 10.0, 4.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.314697265625, -0.3040504455566406, -0.29340362548828125, -0.2827568054199219, -0.2721099853515625, -0.2614631652832031, -0.25081634521484375, -0.24016952514648438, -0.229522705078125, -0.21887588500976562, -0.20822906494140625, -0.19758224487304688, -0.1869354248046875, -0.17628860473632812, -0.16564178466796875, -0.15499496459960938, -0.14434814453125, -0.13370132446289062, -0.12305450439453125, -0.11240768432617188, -0.1017608642578125, -0.09111404418945312, -0.08046722412109375, -0.06982040405273438, -0.059173583984375, -0.048526763916015625, -0.03787994384765625, -0.027233123779296875, -0.0165863037109375, -0.005939483642578125, 0.00470733642578125, 0.015354156494140625, 0.0260009765625, 0.036647796630859375, 0.04729461669921875, 0.057941436767578125, 0.0685882568359375, 0.07923507690429688, 0.08988189697265625, 0.10052871704101562, 0.111175537109375, 0.12182235717773438, 0.13246917724609375, 0.14311599731445312, 0.1537628173828125, 0.16440963745117188, 0.17505645751953125, 0.18570327758789062, 0.19635009765625, 0.20699691772460938, 0.21764373779296875, 0.22829055786132812, 0.2389373779296875, 0.24958419799804688, 0.26023101806640625, 0.2708778381347656, 0.281524658203125, 0.2921714782714844, 0.30281829833984375, 0.3134651184082031, 0.3241119384765625, 0.3347587585449219, 0.34540557861328125, 0.3560523986816406, 0.36669921875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 4.0, 1.0, 2.0, 4.0, 8.0, 5.0, 7.0, 9.0, 7.0, 10.0, 34.0, 72.0, 190.0, 262.0, 210.0, 82.0, 27.0, 9.0, 15.0, 10.0, 12.0, 6.0, 5.0, 6.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.035614013671875, -0.03432464599609375, -0.0330352783203125, -0.03174591064453125, -0.03045654296875, -0.02916717529296875, -0.0278778076171875, -0.02658843994140625, -0.025299072265625, -0.02400970458984375, -0.0227203369140625, -0.02143096923828125, -0.0201416015625, -0.01885223388671875, -0.0175628662109375, -0.01627349853515625, -0.014984130859375, -0.01369476318359375, -0.0124053955078125, -0.01111602783203125, -0.00982666015625, -0.00853729248046875, -0.0072479248046875, -0.00595855712890625, -0.004669189453125, -0.00337982177734375, -0.0020904541015625, -0.00080108642578125, 0.00048828125, 0.00177764892578125, 0.0030670166015625, 0.00435638427734375, 0.005645751953125, 0.00693511962890625, 0.0082244873046875, 0.00951385498046875, 0.01080322265625, 0.01209259033203125, 0.0133819580078125, 0.01467132568359375, 0.015960693359375, 0.01725006103515625, 0.0185394287109375, 0.01982879638671875, 0.0211181640625, 0.02240753173828125, 0.0236968994140625, 0.02498626708984375, 0.026275634765625, 0.02756500244140625, 0.0288543701171875, 0.03014373779296875, 0.03143310546875, 0.03272247314453125, 0.0340118408203125, 0.03530120849609375, 0.036590576171875, 0.03787994384765625, 0.0391693115234375, 0.04045867919921875, 0.041748046875, 0.04303741455078125, 0.0443267822265625, 0.04561614990234375, 0.046905517578125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 1.0, 6.0, 2.0, 1.0, 9.0, 14.0, 17.0, 28.0, 46.0, 76.0, 101.0, 236.0, 643.0, 1912.0, 10907.0, 264324.0, 744764.0, 21108.0, 2856.0, 827.0, 305.0, 141.0, 86.0, 47.0, 32.0, 8.0, 18.0, 10.0, 7.0, 10.0, 2.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51708984375, -0.49566650390625, -0.4742431640625, -0.45281982421875, -0.431396484375, -0.40997314453125, -0.3885498046875, -0.36712646484375, -0.345703125, -0.32427978515625, -0.3028564453125, -0.28143310546875, -0.260009765625, -0.23858642578125, -0.2171630859375, -0.19573974609375, -0.17431640625, -0.15289306640625, -0.1314697265625, -0.11004638671875, -0.088623046875, -0.06719970703125, -0.0457763671875, -0.02435302734375, -0.0029296875, 0.01849365234375, 0.0399169921875, 0.06134033203125, 0.082763671875, 0.10418701171875, 0.1256103515625, 0.14703369140625, 0.16845703125, 0.18988037109375, 0.2113037109375, 0.23272705078125, 0.254150390625, 0.27557373046875, 0.2969970703125, 0.31842041015625, 0.33984375, 0.36126708984375, 0.3826904296875, 0.40411376953125, 0.425537109375, 0.44696044921875, 0.4683837890625, 0.48980712890625, 0.51123046875, 0.53265380859375, 0.5540771484375, 0.57550048828125, 0.596923828125, 0.61834716796875, 0.6397705078125, 0.66119384765625, 0.6826171875, 0.70404052734375, 0.7254638671875, 0.74688720703125, 0.768310546875, 0.78973388671875, 0.8111572265625, 0.83258056640625, 0.85400390625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 1.0, 5.0, 11.0, 11.0, 11.0, 9.0, 8.0, 18.0, 22.0, 19.0, 20.0, 30.0, 26.0, 41.0, 38.0, 33.0, 45.0, 37.0, 37.0, 50.0, 52.0, 45.0, 40.0, 35.0, 40.0, 37.0, 34.0, 38.0, 32.0, 28.0, 23.0, 21.0, 12.0, 20.0, 16.0, 12.0, 11.0, 5.0, 8.0, 3.0, 4.0, 4.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.165771484375, -0.16121292114257812, -0.15665435791015625, -0.15209579467773438, -0.1475372314453125, -0.14297866821289062, -0.13842010498046875, -0.13386154174804688, -0.129302978515625, -0.12474441528320312, -0.12018585205078125, -0.11562728881835938, -0.1110687255859375, -0.10651016235351562, -0.10195159912109375, -0.09739303588867188, -0.09283447265625, -0.08827590942382812, -0.08371734619140625, -0.07915878295898438, -0.0746002197265625, -0.07004165649414062, -0.06548309326171875, -0.060924530029296875, -0.056365966796875, -0.051807403564453125, -0.04724884033203125, -0.042690277099609375, -0.0381317138671875, -0.033573150634765625, -0.02901458740234375, -0.024456024169921875, -0.0198974609375, -0.015338897705078125, -0.01078033447265625, -0.006221771240234375, -0.0016632080078125, 0.002895355224609375, 0.00745391845703125, 0.012012481689453125, 0.016571044921875, 0.021129608154296875, 0.02568817138671875, 0.030246734619140625, 0.0348052978515625, 0.039363861083984375, 0.04392242431640625, 0.048480987548828125, 0.05303955078125, 0.057598114013671875, 0.06215667724609375, 0.06671524047851562, 0.0712738037109375, 0.07583236694335938, 0.08039093017578125, 0.08494949340820312, 0.089508056640625, 0.09406661987304688, 0.09862518310546875, 0.10318374633789062, 0.1077423095703125, 0.11230087280273438, 0.11685943603515625, 0.12141799926757812, 0.1259765625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 10.0, 7.0, 18.0, 23.0, 33.0, 45.0, 67.0, 114.0, 216.0, 461.0, 1022.0, 3146.0, 18861.0, 854929.0, 157917.0, 8250.0, 1908.0, 750.0, 291.0, 190.0, 99.0, 71.0, 38.0, 23.0, 13.0, 11.0, 13.0, 6.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.51953125, -0.5050201416015625, -0.490509033203125, -0.4759979248046875, -0.46148681640625, -0.4469757080078125, -0.432464599609375, -0.4179534912109375, -0.4034423828125, -0.3889312744140625, -0.374420166015625, -0.3599090576171875, -0.34539794921875, -0.3308868408203125, -0.316375732421875, -0.3018646240234375, -0.287353515625, -0.2728424072265625, -0.258331298828125, -0.2438201904296875, -0.22930908203125, -0.2147979736328125, -0.200286865234375, -0.1857757568359375, -0.1712646484375, -0.1567535400390625, -0.142242431640625, -0.1277313232421875, -0.11322021484375, -0.0987091064453125, -0.084197998046875, -0.0696868896484375, -0.05517578125, -0.0406646728515625, -0.026153564453125, -0.0116424560546875, 0.00286865234375, 0.0173797607421875, 0.031890869140625, 0.0464019775390625, 0.0609130859375, 0.0754241943359375, 0.089935302734375, 0.1044464111328125, 0.11895751953125, 0.1334686279296875, 0.147979736328125, 0.1624908447265625, 0.177001953125, 0.1915130615234375, 0.206024169921875, 0.2205352783203125, 0.23504638671875, 0.2495574951171875, 0.264068603515625, 0.2785797119140625, 0.2930908203125, 0.3076019287109375, 0.322113037109375, 0.3366241455078125, 0.35113525390625, 0.3656463623046875, 0.380157470703125, 0.3946685791015625, 0.4091796875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 3.0, 9.0, 7.0, 18.0, 13.0, 21.0, 38.0, 45.0, 60.0, 88.0, 118.0, 104.0, 131.0, 102.0, 79.0, 52.0, 44.0, 20.0, 18.0, 10.0, 3.0, 6.0, 4.0, 4.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.621246337890625e-05, -1.5391036868095398e-05, -1.4569610357284546e-05, -1.3748183846473694e-05, -1.2926757335662842e-05, -1.210533082485199e-05, -1.1283904314041138e-05, -1.0462477803230286e-05, -9.641051292419434e-06, -8.819624781608582e-06, -7.99819827079773e-06, -7.1767717599868774e-06, -6.355345249176025e-06, -5.533918738365173e-06, -4.712492227554321e-06, -3.891065716743469e-06, -3.069639205932617e-06, -2.248212695121765e-06, -1.426786184310913e-06, -6.05359673500061e-07, 2.1606683731079102e-07, 1.037493348121643e-06, 1.8589198589324951e-06, 2.680346369743347e-06, 3.5017728805541992e-06, 4.323199391365051e-06, 5.144625902175903e-06, 5.966052412986755e-06, 6.787478923797607e-06, 7.6089054346084595e-06, 8.430331945419312e-06, 9.251758456230164e-06, 1.0073184967041016e-05, 1.0894611477851868e-05, 1.171603798866272e-05, 1.2537464499473572e-05, 1.3358891010284424e-05, 1.4180317521095276e-05, 1.5001744031906128e-05, 1.582317054271698e-05, 1.6644597053527832e-05, 1.7466023564338684e-05, 1.8287450075149536e-05, 1.9108876585960388e-05, 1.993030309677124e-05, 2.0751729607582092e-05, 2.1573156118392944e-05, 2.2394582629203796e-05, 2.321600914001465e-05, 2.40374356508255e-05, 2.4858862161636353e-05, 2.5680288672447205e-05, 2.6501715183258057e-05, 2.732314169406891e-05, 2.814456820487976e-05, 2.8965994715690613e-05, 2.9787421226501465e-05, 3.060884773731232e-05, 3.143027424812317e-05, 3.225170075893402e-05, 3.307312726974487e-05, 3.3894553780555725e-05, 3.471598029136658e-05, 3.553740680217743e-05, 3.635883331298828e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 1.0, 4.0, 9.0, 10.0, 15.0, 21.0, 42.0, 39.0, 73.0, 93.0, 143.0, 226.0, 334.0, 578.0, 1098.0, 1887.0, 3591.0, 7464.0, 17460.0, 46313.0, 158006.0, 502455.0, 211924.0, 57891.0, 20791.0, 8787.0, 4094.0, 2075.0, 1242.0, 694.0, 413.0, 257.0, 186.0, 105.0, 62.0, 52.0, 35.0, 26.0, 16.0, 16.0, 10.0, 4.0, 7.0, 2.0, 1.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1319580078125, -0.12791061401367188, -0.12386322021484375, -0.11981582641601562, -0.1157684326171875, -0.11172103881835938, -0.10767364501953125, -0.10362625122070312, -0.099578857421875, -0.09553146362304688, -0.09148406982421875, -0.08743667602539062, -0.0833892822265625, -0.07934188842773438, -0.07529449462890625, -0.07124710083007812, -0.06719970703125, -0.06315231323242188, -0.05910491943359375, -0.055057525634765625, -0.0510101318359375, -0.046962738037109375, -0.04291534423828125, -0.038867950439453125, -0.034820556640625, -0.030773162841796875, -0.02672576904296875, -0.022678375244140625, -0.0186309814453125, -0.014583587646484375, -0.01053619384765625, -0.006488800048828125, -0.00244140625, 0.001605987548828125, 0.00565338134765625, 0.009700775146484375, 0.0137481689453125, 0.017795562744140625, 0.02184295654296875, 0.025890350341796875, 0.029937744140625, 0.033985137939453125, 0.03803253173828125, 0.042079925537109375, 0.0461273193359375, 0.050174713134765625, 0.05422210693359375, 0.058269500732421875, 0.06231689453125, 0.06636428833007812, 0.07041168212890625, 0.07445907592773438, 0.0785064697265625, 0.08255386352539062, 0.08660125732421875, 0.09064865112304688, 0.094696044921875, 0.09874343872070312, 0.10279083251953125, 0.10683822631835938, 0.1108856201171875, 0.11493301391601562, 0.11898040771484375, 0.12302780151367188, 0.1270751953125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 4.0, 10.0, 4.0, 9.0, 14.0, 13.0, 13.0, 19.0, 26.0, 33.0, 38.0, 44.0, 37.0, 54.0, 65.0, 82.0, 69.0, 70.0, 57.0, 54.0, 61.0, 42.0, 36.0, 31.0, 22.0, 22.0, 17.0, 9.0, 11.0, 6.0, 9.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10931396484375, -0.10613155364990234, -0.10294914245605469, -0.09976673126220703, -0.09658432006835938, -0.09340190887451172, -0.09021949768066406, -0.0870370864868164, -0.08385467529296875, -0.0806722640991211, -0.07748985290527344, -0.07430744171142578, -0.07112503051757812, -0.06794261932373047, -0.06476020812988281, -0.061577796936035156, -0.0583953857421875, -0.055212974548339844, -0.05203056335449219, -0.04884815216064453, -0.045665740966796875, -0.04248332977294922, -0.03930091857910156, -0.036118507385253906, -0.03293609619140625, -0.029753684997558594, -0.026571273803710938, -0.02338886260986328, -0.020206451416015625, -0.01702404022216797, -0.013841629028320312, -0.010659217834472656, -0.007476806640625, -0.004294395446777344, -0.0011119842529296875, 0.0020704269409179688, 0.005252838134765625, 0.008435249328613281, 0.011617660522460938, 0.014800071716308594, 0.01798248291015625, 0.021164894104003906, 0.024347305297851562, 0.02752971649169922, 0.030712127685546875, 0.03389453887939453, 0.03707695007324219, 0.040259361267089844, 0.0434417724609375, 0.046624183654785156, 0.04980659484863281, 0.05298900604248047, 0.056171417236328125, 0.05935382843017578, 0.06253623962402344, 0.0657186508178711, 0.06890106201171875, 0.0720834732055664, 0.07526588439941406, 0.07844829559326172, 0.08163070678710938, 0.08481311798095703, 0.08799552917480469, 0.09117794036865234, 0.0943603515625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 5.0, 3.0, 4.0, 12.0, 9.0, 19.0, 21.0, 69.0, 151.0, 301.0, 217.0, 84.0, 52.0, 16.0, 6.0, 8.0, 6.0, 5.0, 3.0, 2.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.5330069065093994, -3.452249765396118, -3.371492624282837, -3.2907354831695557, -3.2099783420562744, -3.129221200942993, -3.048464059829712, -2.9677069187164307, -2.8869497776031494, -2.806192636489868, -2.725435495376587, -2.6446783542633057, -2.5639212131500244, -2.483164072036743, -2.402406930923462, -2.3216497898101807, -2.2408926486968994, -2.160135507583618, -2.079378366470337, -1.9986212253570557, -1.9178640842437744, -1.8371069431304932, -1.756349802017212, -1.6755926609039307, -1.5948355197906494, -1.5140783786773682, -1.433321237564087, -1.3525640964508057, -1.2718069553375244, -1.1910498142242432, -1.110292673110962, -1.0295355319976807, -0.9487782716751099, -0.8680211305618286, -0.7872639894485474, -0.7065068483352661, -0.6257497072219849, -0.5449925661087036, -0.46423542499542236, -0.3834782838821411, -0.30272114276885986, -0.2219640016555786, -0.14120686054229736, -0.06044971942901611, 0.020307421684265137, 0.10106456279754639, 0.18182170391082764, 0.2625788450241089, 0.34333598613739014, 0.4240931272506714, 0.5048502683639526, 0.5856074094772339, 0.6663645505905151, 0.7471216917037964, 0.8278788328170776, 0.9086359739303589, 0.9893931150436401, 1.0701502561569214, 1.1509073972702026, 1.2316645383834839, 1.3124216794967651, 1.3931788206100464, 1.4739359617233276, 1.5546931028366089, 1.6354502439498901]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 6.0, 1.0, 3.0, 10.0, 3.0, 6.0, 10.0, 18.0, 29.0, 68.0, 111.0, 176.0, 213.0, 126.0, 89.0, 49.0, 21.0, 10.0, 8.0, 7.0, 6.0, 4.0, 2.0, 6.0, 2.0, 2.0, 0.0, 4.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.052558898925781, -3.9489827156066895, -3.8454065322875977, -3.741830348968506, -3.638254404067993, -3.5346782207489014, -3.4311020374298096, -3.3275258541107178, -3.223949909210205, -3.1203737258911133, -3.0167975425720215, -2.9132213592529297, -2.809645414352417, -2.706069231033325, -2.6024930477142334, -2.4989168643951416, -2.39534068107605, -2.291764497756958, -2.188188314437866, -2.0846123695373535, -1.9810361862182617, -1.87746000289917, -1.7738838195800781, -1.6703076362609863, -1.566731572151184, -1.4631553888320923, -1.35957932472229, -1.2560031414031982, -1.1524269580841064, -1.0488508939743042, -0.9452747106552124, -0.8416985869407654, -0.7381222248077393, -0.6345461010932922, -0.5309699773788452, -0.4273937940597534, -0.3238176703453064, -0.22024154663085938, -0.11666536331176758, -0.013089239597320557, 0.09048688411712646, 0.19406302273273468, 0.2976391613483429, 0.4012153148651123, 0.5047914385795593, 0.6083675622940063, 0.7119437456130981, 0.8155198693275452, 0.9190959930419922, 1.022672176361084, 1.1262482404708862, 1.229824423789978, 1.3334004878997803, 1.436976671218872, 1.5405528545379639, 1.6441290378570557, 1.747705101966858, 1.8512812852859497, 1.954857349395752, 2.0584335327148438, 2.1620097160339355, 2.2655858993530273, 2.369162082672119, 2.472738027572632, 2.5763142108917236]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 8.0, 7.0, 7.0, 6.0, 11.0, 15.0, 18.0, 16.0, 30.0, 46.0, 67.0, 294.0, 2680.0, 167970.0, 4016570.0, 5719.0, 492.0, 135.0, 48.0, 31.0, 21.0, 13.0, 11.0, 11.0, 13.0, 5.0, 7.0, 5.0, 3.0, 5.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-2.9609375, -2.87896728515625, -2.7969970703125, -2.71502685546875, -2.633056640625, -2.55108642578125, -2.4691162109375, -2.38714599609375, -2.30517578125, -2.22320556640625, -2.1412353515625, -2.05926513671875, -1.977294921875, -1.89532470703125, -1.8133544921875, -1.73138427734375, -1.6494140625, -1.56744384765625, -1.4854736328125, -1.40350341796875, -1.321533203125, -1.23956298828125, -1.1575927734375, -1.07562255859375, -0.99365234375, -0.91168212890625, -0.8297119140625, -0.74774169921875, -0.665771484375, -0.58380126953125, -0.5018310546875, -0.41986083984375, -0.337890625, -0.25592041015625, -0.1739501953125, -0.09197998046875, -0.010009765625, 0.07196044921875, 0.1539306640625, 0.23590087890625, 0.31787109375, 0.39984130859375, 0.4818115234375, 0.56378173828125, 0.645751953125, 0.72772216796875, 0.8096923828125, 0.89166259765625, 0.9736328125, 1.05560302734375, 1.1375732421875, 1.21954345703125, 1.301513671875, 1.38348388671875, 1.4654541015625, 1.54742431640625, 1.62939453125, 1.71136474609375, 1.7933349609375, 1.87530517578125, 1.957275390625, 2.03924560546875, 2.1212158203125, 2.20318603515625, 2.28515625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 3.0, 3.0, 6.0, 11.0, 15.0, 10.0, 16.0, 22.0, 32.0, 62.0, 75.0, 112.0, 133.0, 134.0, 108.0, 76.0, 49.0, 35.0, 20.0, 10.0, 12.0, 5.0, 7.0, 8.0, 3.0, 2.0, 5.0, 4.0, 4.0, 1.0, 0.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02301025390625, -0.022160053253173828, -0.021309852600097656, -0.020459651947021484, -0.019609451293945312, -0.01875925064086914, -0.01790904998779297, -0.017058849334716797, -0.016208648681640625, -0.015358448028564453, -0.014508247375488281, -0.01365804672241211, -0.012807846069335938, -0.011957645416259766, -0.011107444763183594, -0.010257244110107422, -0.00940704345703125, -0.008556842803955078, -0.007706642150878906, -0.006856441497802734, -0.0060062408447265625, -0.005156040191650391, -0.004305839538574219, -0.003455638885498047, -0.002605438232421875, -0.0017552375793457031, -0.0009050369262695312, -5.4836273193359375e-05, 0.0007953643798828125, 0.0016455650329589844, 0.0024957656860351562, 0.003345966339111328, 0.0041961669921875, 0.005046367645263672, 0.005896568298339844, 0.006746768951416016, 0.0075969696044921875, 0.00844717025756836, 0.009297370910644531, 0.010147571563720703, 0.010997772216796875, 0.011847972869873047, 0.012698173522949219, 0.01354837417602539, 0.014398574829101562, 0.015248775482177734, 0.016098976135253906, 0.016949176788330078, 0.01779937744140625, 0.018649578094482422, 0.019499778747558594, 0.020349979400634766, 0.021200180053710938, 0.02205038070678711, 0.02290058135986328, 0.023750782012939453, 0.024600982666015625, 0.025451183319091797, 0.02630138397216797, 0.02715158462524414, 0.028001785278320312, 0.028851985931396484, 0.029702186584472656, 0.030552387237548828, 0.031402587890625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 8.0, 4.0, 7.0, 11.0, 8.0, 18.0, 25.0, 52.0, 59.0, 148.0, 268.0, 607.0, 1736.0, 5735.0, 29553.0, 642052.0, 3440691.0, 59954.0, 9183.0, 2481.0, 858.0, 383.0, 165.0, 90.0, 56.0, 45.0, 30.0, 18.0, 14.0, 11.0, 8.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.6796875, -0.6591873168945312, -0.6386871337890625, -0.6181869506835938, -0.597686767578125, -0.5771865844726562, -0.5566864013671875, -0.5361862182617188, -0.51568603515625, -0.49518585205078125, -0.4746856689453125, -0.45418548583984375, -0.433685302734375, -0.41318511962890625, -0.3926849365234375, -0.37218475341796875, -0.3516845703125, -0.33118438720703125, -0.3106842041015625, -0.29018402099609375, -0.269683837890625, -0.24918365478515625, -0.2286834716796875, -0.20818328857421875, -0.18768310546875, -0.16718292236328125, -0.1466827392578125, -0.12618255615234375, -0.105682373046875, -0.08518218994140625, -0.0646820068359375, -0.04418182373046875, -0.023681640625, -0.00318145751953125, 0.0173187255859375, 0.03781890869140625, 0.058319091796875, 0.07881927490234375, 0.0993194580078125, 0.11981964111328125, 0.14031982421875, 0.16082000732421875, 0.1813201904296875, 0.20182037353515625, 0.222320556640625, 0.24282073974609375, 0.2633209228515625, 0.28382110595703125, 0.3043212890625, 0.32482147216796875, 0.3453216552734375, 0.36582183837890625, 0.386322021484375, 0.40682220458984375, 0.4273223876953125, 0.44782257080078125, 0.46832275390625, 0.48882293701171875, 0.5093231201171875, 0.5298233032226562, 0.550323486328125, 0.5708236694335938, 0.5913238525390625, 0.6118240356445312, 0.63232421875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 9.0, 8.0, 4.0, 8.0, 12.0, 16.0, 25.0, 29.0, 72.0, 110.0, 170.0, 344.0, 898.0, 1341.0, 463.0, 186.0, 129.0, 66.0, 51.0, 29.0, 10.0, 15.0, 16.0, 8.0, 10.0, 7.0, 7.0, 6.0, 3.0, 4.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.050445556640625, -0.04882526397705078, -0.04720497131347656, -0.045584678649902344, -0.043964385986328125, -0.042344093322753906, -0.04072380065917969, -0.03910350799560547, -0.03748321533203125, -0.03586292266845703, -0.03424263000488281, -0.032622337341308594, -0.031002044677734375, -0.029381752014160156, -0.027761459350585938, -0.02614116668701172, -0.0245208740234375, -0.02290058135986328, -0.021280288696289062, -0.019659996032714844, -0.018039703369140625, -0.016419410705566406, -0.014799118041992188, -0.013178825378417969, -0.01155853271484375, -0.009938240051269531, -0.008317947387695312, -0.006697654724121094, -0.005077362060546875, -0.0034570693969726562, -0.0018367767333984375, -0.00021648406982421875, 0.00140380859375, 0.0030241012573242188, 0.0046443939208984375, 0.006264686584472656, 0.007884979248046875, 0.009505271911621094, 0.011125564575195312, 0.012745857238769531, 0.01436614990234375, 0.01598644256591797, 0.017606735229492188, 0.019227027893066406, 0.020847320556640625, 0.022467613220214844, 0.024087905883789062, 0.02570819854736328, 0.0273284912109375, 0.02894878387451172, 0.030569076538085938, 0.032189369201660156, 0.033809661865234375, 0.035429954528808594, 0.03705024719238281, 0.03867053985595703, 0.04029083251953125, 0.04191112518310547, 0.04353141784667969, 0.045151710510253906, 0.046772003173828125, 0.048392295837402344, 0.05001258850097656, 0.05163288116455078, 0.053253173828125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [5.0, 9.0, 95.0, 604.0, 262.0, 31.0, 9.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17334377765655518, -0.12600946426391602, -0.07867513597011566, -0.03134080767631531, 0.015993505716323853, 0.06332781910896301, 0.11066216230392456, 0.15799647569656372, 0.20533078908920288, 0.25266510248184204, 0.2999994158744812, 0.34733375906944275, 0.3946680724620819, 0.44200238585472107, 0.4893367290496826, 0.5366710424423218, 0.5840053558349609, 0.6313396692276001, 0.6786739826202393, 0.7260082960128784, 0.7733426094055176, 0.8206769227981567, 0.8680112957954407, 0.9153456091880798, 0.962679922580719, 1.010014295578003, 1.057348608970642, 1.1046829223632812, 1.1520172357559204, 1.1993515491485596, 1.2466858625411987, 1.294020175933838, 1.3413543701171875, 1.3886886835098267, 1.4360229969024658, 1.483357310295105, 1.5306916236877441, 1.5780259370803833, 1.6253602504730225, 1.6726946830749512, 1.7200288772583008, 1.76736319065094, 1.814697504043579, 1.8620318174362183, 1.9093661308288574, 1.9567004442214966, 2.0040347576141357, 2.0513691902160645, 2.098703384399414, 2.1460378170013428, 2.1933720111846924, 2.240706443786621, 2.2880406379699707, 2.3353750705718994, 2.382709264755249, 2.4300436973571777, 2.4773781299591064, 2.524712562561035, 2.5720467567443848, 2.6193811893463135, 2.666715383529663, 2.714049816131592, 2.7613840103149414, 2.80871844291687, 2.8560526371002197]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 1.0, 1.0, 5.0, 1.0, 3.0, 1.0, 7.0, 6.0, 7.0, 14.0, 10.0, 17.0, 36.0, 42.0, 50.0, 58.0, 81.0, 79.0, 109.0, 90.0, 89.0, 69.0, 59.0, 50.0, 26.0, 26.0, 15.0, 10.0, 9.0, 9.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2200174331665039, -0.21175579726696014, -0.20349416136741638, -0.19523251056671143, -0.18697087466716766, -0.1787092387676239, -0.17044760286808014, -0.16218596696853638, -0.15392431616783142, -0.14566268026828766, -0.1374010443687439, -0.12913939356803894, -0.12087775766849518, -0.11261612176895142, -0.10435448586940765, -0.09609284996986389, -0.08783121407032013, -0.07956957817077637, -0.07130793482065201, -0.06304629892110825, -0.054784659296274185, -0.046523019671440125, -0.03826138377189636, -0.0299997441470623, -0.02173810452222824, -0.013476465828716755, -0.005214827135205269, 0.0030468106269836426, 0.011308450251817703, 0.019570089876651764, 0.027831725776195526, 0.03609336540102959, 0.04435500502586365, 0.05261664465069771, 0.06087828427553177, 0.06913992017507553, 0.07740156352519989, 0.08566319942474365, 0.09392483532428741, 0.10218647122383118, 0.11044811457395554, 0.1187097504734993, 0.12697139382362366, 0.13523302972316742, 0.14349466562271118, 0.15175631642341614, 0.1600179374217987, 0.16827958822250366, 0.17654122412204742, 0.1848028600215912, 0.19306449592113495, 0.2013261318206787, 0.20958778262138367, 0.21784941852092743, 0.2261110544204712, 0.23437269032001495, 0.24263432621955872, 0.25089597702026367, 0.25915759801864624, 0.2674192488193512, 0.27568086981773376, 0.2839425206184387, 0.2922041416168213, 0.30046579241752625, 0.3087274432182312]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 8.0, 8.0, 7.0, 14.0, 35.0, 24.0, 39.0, 77.0, 96.0, 168.0, 239.0, 409.0, 617.0, 1101.0, 2038.0, 3881.0, 7932.0, 18541.0, 57907.0, 307497.0, 506178.0, 94868.0, 26095.0, 10192.0, 4801.0, 2372.0, 1373.0, 727.0, 469.0, 289.0, 182.0, 112.0, 87.0, 52.0, 44.0, 23.0, 18.0, 15.0, 8.0, 5.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1885986328125, -0.18234634399414062, -0.17609405517578125, -0.16984176635742188, -0.1635894775390625, -0.15733718872070312, -0.15108489990234375, -0.14483261108398438, -0.138580322265625, -0.13232803344726562, -0.12607574462890625, -0.11982345581054688, -0.1135711669921875, -0.10731887817382812, -0.10106658935546875, -0.09481430053710938, -0.08856201171875, -0.08230972290039062, -0.07605743408203125, -0.06980514526367188, -0.0635528564453125, -0.057300567626953125, -0.05104827880859375, -0.044795989990234375, -0.038543701171875, -0.032291412353515625, -0.02603912353515625, -0.019786834716796875, -0.0135345458984375, -0.007282257080078125, -0.00102996826171875, 0.005222320556640625, 0.011474609375, 0.017726898193359375, 0.02397918701171875, 0.030231475830078125, 0.0364837646484375, 0.042736053466796875, 0.04898834228515625, 0.055240631103515625, 0.061492919921875, 0.06774520874023438, 0.07399749755859375, 0.08024978637695312, 0.0865020751953125, 0.09275436401367188, 0.09900665283203125, 0.10525894165039062, 0.11151123046875, 0.11776351928710938, 0.12401580810546875, 0.13026809692382812, 0.1365203857421875, 0.14277267456054688, 0.14902496337890625, 0.15527725219726562, 0.161529541015625, 0.16778182983398438, 0.17403411865234375, 0.18028640747070312, 0.1865386962890625, 0.19279098510742188, 0.19904327392578125, 0.20529556274414062, 0.2115478515625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 5.0, 1.0, 5.0, 1.0, 6.0, 8.0, 13.0, 16.0, 20.0, 33.0, 44.0, 75.0, 79.0, 108.0, 116.0, 108.0, 80.0, 61.0, 56.0, 31.0, 22.0, 21.0, 16.0, 15.0, 7.0, 9.0, 9.0, 8.0, 5.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0198974609375, -0.019253253936767578, -0.018609046936035156, -0.017964839935302734, -0.017320632934570312, -0.01667642593383789, -0.01603221893310547, -0.015388011932373047, -0.014743804931640625, -0.014099597930908203, -0.013455390930175781, -0.01281118392944336, -0.012166976928710938, -0.011522769927978516, -0.010878562927246094, -0.010234355926513672, -0.00959014892578125, -0.008945941925048828, -0.008301734924316406, -0.007657527923583984, -0.0070133209228515625, -0.006369113922119141, -0.005724906921386719, -0.005080699920654297, -0.004436492919921875, -0.003792285919189453, -0.0031480789184570312, -0.0025038719177246094, -0.0018596649169921875, -0.0012154579162597656, -0.0005712509155273438, 7.295608520507812e-05, 0.0007171630859375, 0.0013613700866699219, 0.0020055770874023438, 0.0026497840881347656, 0.0032939910888671875, 0.003938198089599609, 0.004582405090332031, 0.005226612091064453, 0.005870819091796875, 0.006515026092529297, 0.007159233093261719, 0.007803440093994141, 0.008447647094726562, 0.009091854095458984, 0.009736061096191406, 0.010380268096923828, 0.01102447509765625, 0.011668682098388672, 0.012312889099121094, 0.012957096099853516, 0.013601303100585938, 0.01424551010131836, 0.014889717102050781, 0.015533924102783203, 0.016178131103515625, 0.016822338104248047, 0.01746654510498047, 0.01811075210571289, 0.018754959106445312, 0.019399166107177734, 0.020043373107910156, 0.020687580108642578, 0.021331787109375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 4.0, 1.0, 1.0, 5.0, 2.0, 6.0, 13.0, 33.0, 74.0, 520.0, 29964.0, 989901.0, 27351.0, 537.0, 68.0, 28.0, 9.0, 8.0, 5.0, 2.0, 5.0, 5.0, 3.0, 5.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.85693359375, -0.828826904296875, -0.80072021484375, -0.772613525390625, -0.7445068359375, -0.716400146484375, -0.68829345703125, -0.660186767578125, -0.632080078125, -0.603973388671875, -0.57586669921875, -0.547760009765625, -0.5196533203125, -0.491546630859375, -0.46343994140625, -0.435333251953125, -0.4072265625, -0.379119873046875, -0.35101318359375, -0.322906494140625, -0.2947998046875, -0.266693115234375, -0.23858642578125, -0.210479736328125, -0.182373046875, -0.154266357421875, -0.12615966796875, -0.098052978515625, -0.0699462890625, -0.041839599609375, -0.01373291015625, 0.014373779296875, 0.04248046875, 0.070587158203125, 0.09869384765625, 0.126800537109375, 0.1549072265625, 0.183013916015625, 0.21112060546875, 0.239227294921875, 0.267333984375, 0.295440673828125, 0.32354736328125, 0.351654052734375, 0.3797607421875, 0.407867431640625, 0.43597412109375, 0.464080810546875, 0.4921875, 0.520294189453125, 0.54840087890625, 0.576507568359375, 0.6046142578125, 0.632720947265625, 0.66082763671875, 0.688934326171875, 0.717041015625, 0.745147705078125, 0.77325439453125, 0.801361083984375, 0.8294677734375, 0.857574462890625, 0.88568115234375, 0.913787841796875, 0.94189453125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 3.0, 1.0, 9.0, 7.0, 10.0, 15.0, 10.0, 14.0, 10.0, 11.0, 15.0, 23.0, 31.0, 22.0, 36.0, 28.0, 30.0, 35.0, 44.0, 42.0, 30.0, 50.0, 49.0, 47.0, 50.0, 36.0, 46.0, 30.0, 32.0, 35.0, 23.0, 26.0, 20.0, 15.0, 14.0, 16.0, 8.0, 15.0, 12.0, 8.0, 10.0, 7.0, 7.0, 8.0, 6.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.08660888671875, -0.0839986801147461, -0.08138847351074219, -0.07877826690673828, -0.07616806030273438, -0.07355785369873047, -0.07094764709472656, -0.06833744049072266, -0.06572723388671875, -0.06311702728271484, -0.06050682067871094, -0.05789661407470703, -0.055286407470703125, -0.05267620086669922, -0.05006599426269531, -0.047455787658691406, -0.0448455810546875, -0.042235374450683594, -0.03962516784667969, -0.03701496124267578, -0.034404754638671875, -0.03179454803466797, -0.029184341430664062, -0.026574134826660156, -0.02396392822265625, -0.021353721618652344, -0.018743515014648438, -0.01613330841064453, -0.013523101806640625, -0.010912895202636719, -0.008302688598632812, -0.005692481994628906, -0.003082275390625, -0.00047206878662109375, 0.0021381378173828125, 0.004748344421386719, 0.007358551025390625, 0.009968757629394531, 0.012578964233398438, 0.015189170837402344, 0.01779937744140625, 0.020409584045410156, 0.023019790649414062, 0.02562999725341797, 0.028240203857421875, 0.03085041046142578, 0.03346061706542969, 0.036070823669433594, 0.0386810302734375, 0.041291236877441406, 0.04390144348144531, 0.04651165008544922, 0.049121856689453125, 0.05173206329345703, 0.05434226989746094, 0.056952476501464844, 0.05956268310546875, 0.062172889709472656, 0.06478309631347656, 0.06739330291748047, 0.07000350952148438, 0.07261371612548828, 0.07522392272949219, 0.0778341293334961, 0.0804443359375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 8.0, 17.0, 39.0, 105.0, 508.0, 37103.0, 1008633.0, 1847.0, 200.0, 53.0, 14.0, 10.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.392578125, -1.347991943359375, -1.30340576171875, -1.258819580078125, -1.2142333984375, -1.169647216796875, -1.12506103515625, -1.080474853515625, -1.035888671875, -0.991302490234375, -0.94671630859375, -0.902130126953125, -0.8575439453125, -0.812957763671875, -0.76837158203125, -0.723785400390625, -0.67919921875, -0.634613037109375, -0.59002685546875, -0.545440673828125, -0.5008544921875, -0.456268310546875, -0.41168212890625, -0.367095947265625, -0.322509765625, -0.277923583984375, -0.23333740234375, -0.188751220703125, -0.1441650390625, -0.099578857421875, -0.05499267578125, -0.010406494140625, 0.0341796875, 0.078765869140625, 0.12335205078125, 0.167938232421875, 0.2125244140625, 0.257110595703125, 0.30169677734375, 0.346282958984375, 0.390869140625, 0.435455322265625, 0.48004150390625, 0.524627685546875, 0.5692138671875, 0.613800048828125, 0.65838623046875, 0.702972412109375, 0.74755859375, 0.792144775390625, 0.83673095703125, 0.881317138671875, 0.9259033203125, 0.970489501953125, 1.01507568359375, 1.059661865234375, 1.104248046875, 1.148834228515625, 1.19342041015625, 1.238006591796875, 1.2825927734375, 1.327178955078125, 1.37176513671875, 1.416351318359375, 1.4609375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 5.0, 2.0, 9.0, 8.0, 11.0, 8.0, 21.0, 32.0, 53.0, 52.0, 80.0, 99.0, 129.0, 128.0, 116.0, 70.0, 46.0, 32.0, 25.0, 17.0, 13.0, 13.0, 3.0, 7.0, 2.0, 4.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.042552947998047e-05, -4.8928894102573395e-05, -4.743225872516632e-05, -4.593562334775925e-05, -4.443898797035217e-05, -4.29423525929451e-05, -4.1445717215538025e-05, -3.994908183813095e-05, -3.845244646072388e-05, -3.69558110833168e-05, -3.545917570590973e-05, -3.3962540328502655e-05, -3.246590495109558e-05, -3.096926957368851e-05, -2.9472634196281433e-05, -2.797599881887436e-05, -2.6479363441467285e-05, -2.498272806406021e-05, -2.3486092686653137e-05, -2.1989457309246063e-05, -2.049282193183899e-05, -1.8996186554431915e-05, -1.749955117702484e-05, -1.6002915799617767e-05, -1.4506280422210693e-05, -1.300964504480362e-05, -1.1513009667396545e-05, -1.0016374289989471e-05, -8.519738912582397e-06, -7.0231035351753235e-06, -5.5264681577682495e-06, -4.0298327803611755e-06, -2.5331974029541016e-06, -1.0365620255470276e-06, 4.600733518600464e-07, 1.9567087292671204e-06, 3.4533441066741943e-06, 4.949979484081268e-06, 6.446614861488342e-06, 7.943250238895416e-06, 9.43988561630249e-06, 1.0936520993709564e-05, 1.2433156371116638e-05, 1.3929791748523712e-05, 1.5426427125930786e-05, 1.692306250333786e-05, 1.8419697880744934e-05, 1.9916333258152008e-05, 2.1412968635559082e-05, 2.2909604012966156e-05, 2.440623939037323e-05, 2.5902874767780304e-05, 2.7399510145187378e-05, 2.8896145522594452e-05, 3.0392780900001526e-05, 3.18894162774086e-05, 3.3386051654815674e-05, 3.488268703222275e-05, 3.637932240962982e-05, 3.7875957787036896e-05, 3.937259316444397e-05, 4.0869228541851044e-05, 4.236586391925812e-05, 4.386249929666519e-05, 4.5359134674072266e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 5.0, 6.0, 10.0, 19.0, 24.0, 24.0, 39.0, 52.0, 85.0, 112.0, 185.0, 272.0, 499.0, 962.0, 1944.0, 4454.0, 11945.0, 37413.0, 141348.0, 430796.0, 299926.0, 80661.0, 23287.0, 7873.0, 3306.0, 1461.0, 707.0, 391.0, 242.0, 168.0, 120.0, 69.0, 43.0, 34.0, 14.0, 14.0, 13.0, 9.0, 6.0, 4.0, 1.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.165771484375, -0.16071701049804688, -0.15566253662109375, -0.15060806274414062, -0.1455535888671875, -0.14049911499023438, -0.13544464111328125, -0.13039016723632812, -0.125335693359375, -0.12028121948242188, -0.11522674560546875, -0.11017227172851562, -0.1051177978515625, -0.10006332397460938, -0.09500885009765625, -0.08995437622070312, -0.08489990234375, -0.07984542846679688, -0.07479095458984375, -0.06973648071289062, -0.0646820068359375, -0.059627532958984375, -0.05457305908203125, -0.049518585205078125, -0.044464111328125, -0.039409637451171875, -0.03435516357421875, -0.029300689697265625, -0.0242462158203125, -0.019191741943359375, -0.01413726806640625, -0.009082794189453125, -0.0040283203125, 0.001026153564453125, 0.00608062744140625, 0.011135101318359375, 0.0161895751953125, 0.021244049072265625, 0.02629852294921875, 0.031352996826171875, 0.036407470703125, 0.041461944580078125, 0.04651641845703125, 0.051570892333984375, 0.0566253662109375, 0.061679840087890625, 0.06673431396484375, 0.07178878784179688, 0.07684326171875, 0.08189773559570312, 0.08695220947265625, 0.09200668334960938, 0.0970611572265625, 0.10211563110351562, 0.10717010498046875, 0.11222457885742188, 0.117279052734375, 0.12233352661132812, 0.12738800048828125, 0.13244247436523438, 0.1374969482421875, 0.14255142211914062, 0.14760589599609375, 0.15266036987304688, 0.15771484375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 6.0, 9.0, 16.0, 22.0, 23.0, 37.0, 51.0, 72.0, 82.0, 86.0, 98.0, 103.0, 89.0, 78.0, 65.0, 56.0, 41.0, 16.0, 9.0, 15.0, 10.0, 6.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11810302734375, -0.11415576934814453, -0.11020851135253906, -0.1062612533569336, -0.10231399536132812, -0.09836673736572266, -0.09441947937011719, -0.09047222137451172, -0.08652496337890625, -0.08257770538330078, -0.07863044738769531, -0.07468318939208984, -0.07073593139648438, -0.0667886734008789, -0.06284141540527344, -0.05889415740966797, -0.0549468994140625, -0.05099964141845703, -0.04705238342285156, -0.043105125427246094, -0.039157867431640625, -0.035210609436035156, -0.03126335144042969, -0.02731609344482422, -0.02336883544921875, -0.01942157745361328, -0.015474319458007812, -0.011527061462402344, -0.007579803466796875, -0.0036325454711914062, 0.0003147125244140625, 0.004261970520019531, 0.008209228515625, 0.012156486511230469, 0.016103744506835938, 0.020051002502441406, 0.023998260498046875, 0.027945518493652344, 0.03189277648925781, 0.03584003448486328, 0.03978729248046875, 0.04373455047607422, 0.04768180847167969, 0.051629066467285156, 0.055576324462890625, 0.059523582458496094, 0.06347084045410156, 0.06741809844970703, 0.0713653564453125, 0.07531261444091797, 0.07925987243652344, 0.0832071304321289, 0.08715438842773438, 0.09110164642333984, 0.09504890441894531, 0.09899616241455078, 0.10294342041015625, 0.10689067840576172, 0.11083793640136719, 0.11478519439697266, 0.11873245239257812, 0.1226797103881836, 0.12662696838378906, 0.13057422637939453, 0.134521484375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 7.0, 4.0, 15.0, 22.0, 75.0, 175.0, 293.0, 239.0, 88.0, 48.0, 19.0, 4.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2781274318695068, -1.2165273427963257, -1.1549272537231445, -1.0933270454406738, -1.0317269563674927, -0.9701268672943115, -0.9085267782211304, -0.8469266891479492, -0.7853265404701233, -0.7237264513969421, -0.6621263027191162, -0.6005262136459351, -0.5389261245727539, -0.477325975894928, -0.4157258868217468, -0.3541257679462433, -0.29252564907073975, -0.2309255301952362, -0.16932542622089386, -0.10772532224655151, -0.046125203371047974, 0.015474915504455566, 0.07707500457763672, 0.13867512345314026, 0.2002752423286438, 0.26187536120414734, 0.3234754800796509, 0.38507556915283203, 0.44667568802833557, 0.5082758069038391, 0.5698758959770203, 0.6314760446548462, 0.6930761337280273, 0.7546762228012085, 0.8162763714790344, 0.8778764605522156, 0.9394766092300415, 1.0010766983032227, 1.0626767873764038, 1.124276876449585, 1.1858770847320557, 1.2474771738052368, 1.309077262878418, 1.3706774711608887, 1.4322775602340698, 1.493877649307251, 1.5554777383804321, 1.6170778274536133, 1.6786779165267944, 1.7402780055999756, 1.8018780946731567, 1.863478183746338, 1.9250783920288086, 1.9866784811019897, 2.048278570175171, 2.1098787784576416, 2.171478748321533, 2.233078956604004, 2.2946789264678955, 2.356279134750366, 2.417879104614258, 2.4794793128967285, 2.541079521179199, 2.602679491043091, 2.6642796993255615]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 2.0, 2.0, 3.0, 8.0, 9.0, 10.0, 16.0, 13.0, 27.0, 28.0, 38.0, 68.0, 76.0, 109.0, 101.0, 99.0, 101.0, 72.0, 52.0, 56.0, 29.0, 19.0, 18.0, 16.0, 4.0, 6.0, 3.0, 4.0, 2.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3563207387924194, -1.318979024887085, -1.281637191772461, -1.2442954778671265, -1.206953763961792, -1.169611930847168, -1.1322702169418335, -1.094928503036499, -1.057586669921875, -1.0202449560165405, -0.9829031825065613, -0.945561408996582, -0.9082196950912476, -0.8708779215812683, -0.8335361480712891, -0.7961944341659546, -0.7588527202606201, -0.7215109467506409, -0.6841692328453064, -0.6468274593353271, -0.6094857454299927, -0.5721439719200134, -0.5348021984100342, -0.4974604547023773, -0.46011871099472046, -0.4227769672870636, -0.38543522357940674, -0.3480934500694275, -0.31075170636177063, -0.27340996265411377, -0.23606820404529572, -0.19872644543647766, -0.16138482093811035, -0.1240430697798729, -0.08670131862163544, -0.04935956746339798, -0.012017816305160522, 0.025323927402496338, 0.06266568601131439, 0.10000744462013245, 0.1373491883277893, 0.17469093203544617, 0.21203269064426422, 0.24937444925308228, 0.28671619296073914, 0.324057936668396, 0.36139971017837524, 0.3987414538860321, 0.43608319759368896, 0.4734249413013458, 0.5107666850090027, 0.5481084585189819, 0.5854501724243164, 0.6227919459342957, 0.6601337194442749, 0.6974754333496094, 0.7348172068595886, 0.7721589803695679, 0.8095006942749023, 0.8468424677848816, 0.8841842412948608, 0.9215259552001953, 0.9588677287101746, 0.9962095022201538, 1.0335512161254883]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 4.0, 0.0, 4.0, 4.0, 6.0, 4.0, 7.0, 6.0, 10.0, 14.0, 7.0, 9.0, 25.0, 17.0, 24.0, 54.0, 113.0, 229.0, 549.0, 1702.0, 7313.0, 77496.0, 4020237.0, 74505.0, 8530.0, 2162.0, 693.0, 260.0, 126.0, 54.0, 30.0, 22.0, 14.0, 13.0, 4.0, 4.0, 5.0, 12.0, 0.0, 2.0, 2.0, 4.0, 4.0, 0.0, 2.0, 4.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 4.0], "bins": [-0.98974609375, -0.9601974487304688, -0.9306488037109375, -0.9011001586914062, -0.871551513671875, -0.8420028686523438, -0.8124542236328125, -0.7829055786132812, -0.75335693359375, -0.7238082885742188, -0.6942596435546875, -0.6647109985351562, -0.635162353515625, -0.6056137084960938, -0.5760650634765625, -0.5465164184570312, -0.5169677734375, -0.48741912841796875, -0.4578704833984375, -0.42832183837890625, -0.398773193359375, -0.36922454833984375, -0.3396759033203125, -0.31012725830078125, -0.28057861328125, -0.25102996826171875, -0.2214813232421875, -0.19193267822265625, -0.162384033203125, -0.13283538818359375, -0.1032867431640625, -0.07373809814453125, -0.044189453125, -0.01464080810546875, 0.0149078369140625, 0.04445648193359375, 0.074005126953125, 0.10355377197265625, 0.1331024169921875, 0.16265106201171875, 0.19219970703125, 0.22174835205078125, 0.2512969970703125, 0.28084564208984375, 0.310394287109375, 0.33994293212890625, 0.3694915771484375, 0.39904022216796875, 0.4285888671875, 0.45813751220703125, 0.4876861572265625, 0.5172348022460938, 0.546783447265625, 0.5763320922851562, 0.6058807373046875, 0.6354293823242188, 0.66497802734375, 0.6945266723632812, 0.7240753173828125, 0.7536239624023438, 0.783172607421875, 0.8127212524414062, 0.8422698974609375, 0.8718185424804688, 0.9013671875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 7.0, 5.0, 7.0, 8.0, 10.0, 16.0, 16.0, 28.0, 32.0, 45.0, 59.0, 76.0, 70.0, 91.0, 86.0, 93.0, 71.0, 56.0, 36.0, 43.0, 34.0, 27.0, 15.0, 15.0, 10.0, 9.0, 7.0, 9.0, 3.0, 2.0, 6.0, 6.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.019683837890625, -0.019113779067993164, -0.018543720245361328, -0.017973661422729492, -0.017403602600097656, -0.01683354377746582, -0.016263484954833984, -0.01569342613220215, -0.015123367309570312, -0.014553308486938477, -0.01398324966430664, -0.013413190841674805, -0.012843132019042969, -0.012273073196411133, -0.011703014373779297, -0.011132955551147461, -0.010562896728515625, -0.009992837905883789, -0.009422779083251953, -0.008852720260620117, -0.008282661437988281, -0.007712602615356445, -0.007142543792724609, -0.0065724849700927734, -0.0060024261474609375, -0.0054323673248291016, -0.004862308502197266, -0.00429224967956543, -0.0037221908569335938, -0.003152132034301758, -0.002582073211669922, -0.002012014389038086, -0.00144195556640625, -0.0008718967437744141, -0.0003018379211425781, 0.0002682209014892578, 0.0008382797241210938, 0.0014083385467529297, 0.0019783973693847656, 0.0025484561920166016, 0.0031185150146484375, 0.0036885738372802734, 0.004258632659912109, 0.004828691482543945, 0.005398750305175781, 0.005968809127807617, 0.006538867950439453, 0.007108926773071289, 0.007678985595703125, 0.008249044418334961, 0.008819103240966797, 0.009389162063598633, 0.009959220886230469, 0.010529279708862305, 0.01109933853149414, 0.011669397354125977, 0.012239456176757812, 0.012809514999389648, 0.013379573822021484, 0.01394963264465332, 0.014519691467285156, 0.015089750289916992, 0.015659809112548828, 0.016229867935180664, 0.0167999267578125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 4.0, 17.0, 16.0, 64.0, 118.0, 197.0, 646.0, 26567.0, 4149493.0, 16272.0, 524.0, 186.0, 90.0, 49.0, 27.0, 19.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.759765625, -2.7028121948242188, -2.6458587646484375, -2.5889053344726562, -2.531951904296875, -2.4749984741210938, -2.4180450439453125, -2.3610916137695312, -2.30413818359375, -2.2471847534179688, -2.1902313232421875, -2.1332778930664062, -2.076324462890625, -2.0193710327148438, -1.9624176025390625, -1.9054641723632812, -1.8485107421875, -1.7915573120117188, -1.7346038818359375, -1.6776504516601562, -1.620697021484375, -1.5637435913085938, -1.5067901611328125, -1.4498367309570312, -1.39288330078125, -1.3359298706054688, -1.2789764404296875, -1.2220230102539062, -1.165069580078125, -1.1081161499023438, -1.0511627197265625, -0.9942092895507812, -0.937255859375, -0.8803024291992188, -0.8233489990234375, -0.7663955688476562, -0.709442138671875, -0.6524887084960938, -0.5955352783203125, -0.5385818481445312, -0.48162841796875, -0.42467498779296875, -0.3677215576171875, -0.31076812744140625, -0.253814697265625, -0.19686126708984375, -0.1399078369140625, -0.08295440673828125, -0.0260009765625, 0.03095245361328125, 0.0879058837890625, 0.14485931396484375, 0.201812744140625, 0.25876617431640625, 0.3157196044921875, 0.37267303466796875, 0.42962646484375, 0.48657989501953125, 0.5435333251953125, 0.6004867553710938, 0.657440185546875, 0.7143936157226562, 0.7713470458984375, 0.8283004760742188, 0.88525390625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 10.0, 20.0, 27.0, 33.0, 52.0, 87.0, 121.0, 253.0, 602.0, 1650.0, 585.0, 274.0, 152.0, 68.0, 33.0, 29.0, 31.0, 6.0, 9.0, 8.0, 7.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.08758544921875, -0.0856170654296875, -0.083648681640625, -0.0816802978515625, -0.0797119140625, -0.0777435302734375, -0.075775146484375, -0.0738067626953125, -0.07183837890625, -0.0698699951171875, -0.067901611328125, -0.0659332275390625, -0.06396484375, -0.0619964599609375, -0.060028076171875, -0.0580596923828125, -0.05609130859375, -0.0541229248046875, -0.052154541015625, -0.0501861572265625, -0.0482177734375, -0.0462493896484375, -0.044281005859375, -0.0423126220703125, -0.04034423828125, -0.0383758544921875, -0.036407470703125, -0.0344390869140625, -0.032470703125, -0.0305023193359375, -0.028533935546875, -0.0265655517578125, -0.02459716796875, -0.0226287841796875, -0.020660400390625, -0.0186920166015625, -0.0167236328125, -0.0147552490234375, -0.012786865234375, -0.0108184814453125, -0.00885009765625, -0.0068817138671875, -0.004913330078125, -0.0029449462890625, -0.0009765625, 0.0009918212890625, 0.002960205078125, 0.0049285888671875, 0.00689697265625, 0.0088653564453125, 0.010833740234375, 0.0128021240234375, 0.0147705078125, 0.0167388916015625, 0.018707275390625, 0.0206756591796875, 0.02264404296875, 0.0246124267578125, 0.026580810546875, 0.0285491943359375, 0.030517578125, 0.0324859619140625, 0.034454345703125, 0.0364227294921875, 0.03839111328125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 22.0, 231.0, 655.0, 87.0, 10.0, 6.0, 2.0, 2.0], "bins": [-6.573306560516357, -6.460382461547852, -6.347458362579346, -6.23453426361084, -6.121610164642334, -6.008686065673828, -5.895761966705322, -5.782837867736816, -5.6699137687683105, -5.556989669799805, -5.444065570831299, -5.331141471862793, -5.218217372894287, -5.105293273925781, -4.992369174957275, -4.8794450759887695, -4.766520977020264, -4.653596878051758, -4.540672779083252, -4.427748680114746, -4.31482458114624, -4.201900482177734, -4.0889763832092285, -3.9760522842407227, -3.8631279468536377, -3.750203847885132, -3.637279748916626, -3.52435564994812, -3.4114315509796143, -3.2985074520111084, -3.1855833530426025, -3.0726592540740967, -2.95973539352417, -2.846811294555664, -2.733887195587158, -2.6209630966186523, -2.5080389976501465, -2.3951148986816406, -2.2821907997131348, -2.169266700744629, -2.056342363357544, -1.943418264389038, -1.8304941654205322, -1.7175700664520264, -1.6046459674835205, -1.4917218685150146, -1.3787977695465088, -1.265873670578003, -1.152949571609497, -1.0400254726409912, -0.9271013736724854, -0.8141772747039795, -0.7012531757354736, -0.588329017162323, -0.47540491819381714, -0.3624808192253113, -0.24955672025680542, -0.13663262128829956, -0.023708507418632507, 0.08921560645103455, 0.2021397054195404, 0.31506383419036865, 0.4279879331588745, 0.5409120321273804, 0.6538361310958862]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 16.0, 31.0, 65.0, 141.0, 233.0, 199.0, 154.0, 98.0, 48.0, 15.0, 7.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.841445803642273, -1.8053256273269653, -1.7692055702209473, -1.7330853939056396, -1.696965217590332, -1.6608450412750244, -1.6247249841690063, -1.5886048078536987, -1.5524847507476807, -1.516364574432373, -1.480244517326355, -1.4441243410110474, -1.4080041646957397, -1.3718841075897217, -1.335763931274414, -1.2996437549591064, -1.2635235786437988, -1.2274034023284912, -1.1912833452224731, -1.1551631689071655, -1.119042992591858, -1.0829229354858398, -1.0468027591705322, -1.0106825828552246, -0.9745624661445618, -0.9384423494338989, -0.9023221731185913, -0.8662020564079285, -0.8300819396972656, -0.793961763381958, -0.7578416466712952, -0.7217215299606323, -0.6856013536453247, -0.6494812369346619, -0.6133610606193542, -0.5772409439086914, -0.5411207675933838, -0.505000650882721, -0.4688805341720581, -0.4327603876590729, -0.39664024114608765, -0.3605200946331024, -0.3243999481201172, -0.28827983140945435, -0.2521596848964691, -0.2160395383834839, -0.17991940677165985, -0.14379927515983582, -0.10767912864685059, -0.07155898958444595, -0.03543885052204132, 0.0006812885403633118, 0.036801427602767944, 0.07292157411575317, 0.10904170572757721, 0.14516183733940125, 0.18128198385238647, 0.2174021303653717, 0.25352227687835693, 0.2896423935890198, 0.325762540102005, 0.36188268661499023, 0.3980028033256531, 0.4341229498386383, 0.47024309635162354]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 5.0, 6.0, 11.0, 8.0, 10.0, 13.0, 12.0, 25.0, 19.0, 20.0, 41.0, 42.0, 46.0, 43.0, 48.0, 68.0, 137.0, 1046517.0, 1073.0, 44.0, 43.0, 52.0, 39.0, 36.0, 32.0, 38.0, 18.0, 26.0, 20.0, 13.0, 14.0, 6.0, 2.0, 2.0, 5.0, 3.0, 5.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-5.57421875, -5.408447265625, -5.24267578125, -5.076904296875, -4.9111328125, -4.745361328125, -4.57958984375, -4.413818359375, -4.248046875, -4.082275390625, -3.91650390625, -3.750732421875, -3.5849609375, -3.419189453125, -3.25341796875, -3.087646484375, -2.921875, -2.756103515625, -2.59033203125, -2.424560546875, -2.2587890625, -2.093017578125, -1.92724609375, -1.761474609375, -1.595703125, -1.429931640625, -1.26416015625, -1.098388671875, -0.9326171875, -0.766845703125, -0.60107421875, -0.435302734375, -0.26953125, -0.103759765625, 0.06201171875, 0.227783203125, 0.3935546875, 0.559326171875, 0.72509765625, 0.890869140625, 1.056640625, 1.222412109375, 1.38818359375, 1.553955078125, 1.7197265625, 1.885498046875, 2.05126953125, 2.217041015625, 2.3828125, 2.548583984375, 2.71435546875, 2.880126953125, 3.0458984375, 3.211669921875, 3.37744140625, 3.543212890625, 3.708984375, 3.874755859375, 4.04052734375, 4.206298828125, 4.3720703125, 4.537841796875, 4.70361328125, 4.869384765625, 5.03515625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 139.0, 629.0, 234.0, 15.0], "bins": [-0.46630859375, -0.45873546600341797, -0.45116233825683594, -0.4435892105102539, -0.4360160827636719, -0.42844295501708984, -0.4208698272705078, -0.4132966995239258, -0.40572357177734375, -0.3981504440307617, -0.3905773162841797, -0.38300418853759766, -0.3754310607910156, -0.3678579330444336, -0.36028480529785156, -0.35271167755126953, -0.3451385498046875, -0.33756542205810547, -0.32999229431152344, -0.3224191665649414, -0.3148460388183594, -0.30727291107177734, -0.2996997833251953, -0.2921266555786133, -0.28455352783203125, -0.2769804000854492, -0.2694072723388672, -0.26183414459228516, -0.2542610168457031, -0.2466878890991211, -0.23911476135253906, -0.23154163360595703, -0.223968505859375, -0.21639537811279297, -0.20882225036621094, -0.2012491226196289, -0.19367599487304688, -0.18610286712646484, -0.1785297393798828, -0.17095661163330078, -0.16338348388671875, -0.15581035614013672, -0.1482372283935547, -0.14066410064697266, -0.13309097290039062, -0.1255178451538086, -0.11794471740722656, -0.11037158966064453, -0.1027984619140625, -0.09522533416748047, -0.08765220642089844, -0.0800790786743164, -0.07250595092773438, -0.06493282318115234, -0.05735969543457031, -0.04978656768798828, -0.04221343994140625, -0.03464031219482422, -0.027067184448242188, -0.019494056701660156, -0.011920928955078125, -0.004347801208496094, 0.0032253265380859375, 0.010798454284667969, 0.01837158203125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 4.0, 4.0, 4.0, 6.0, 9.0, 12.0, 19.0, 21.0, 43.0, 44.0, 64.0, 103.0, 169.0, 240.0, 411.0, 662.0, 1237.0, 2295.0, 4811.0, 11260.0, 30536.0, 113119.0, 579489.0, 226728.0, 47933.0, 16105.0, 6547.0, 3012.0, 1440.0, 857.0, 518.0, 278.0, 164.0, 124.0, 84.0, 64.0, 32.0, 35.0, 25.0, 15.0, 14.0, 7.0, 3.0, 7.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.77880859375, -0.7534332275390625, -0.728057861328125, -0.7026824951171875, -0.67730712890625, -0.6519317626953125, -0.626556396484375, -0.6011810302734375, -0.5758056640625, -0.5504302978515625, -0.525054931640625, -0.4996795654296875, -0.47430419921875, -0.4489288330078125, -0.423553466796875, -0.3981781005859375, -0.372802734375, -0.3474273681640625, -0.322052001953125, -0.2966766357421875, -0.27130126953125, -0.2459259033203125, -0.220550537109375, -0.1951751708984375, -0.1697998046875, -0.1444244384765625, -0.119049072265625, -0.0936737060546875, -0.06829833984375, -0.0429229736328125, -0.017547607421875, 0.0078277587890625, 0.033203125, 0.0585784912109375, 0.083953857421875, 0.1093292236328125, 0.13470458984375, 0.1600799560546875, 0.185455322265625, 0.2108306884765625, 0.2362060546875, 0.2615814208984375, 0.286956787109375, 0.3123321533203125, 0.33770751953125, 0.3630828857421875, 0.388458251953125, 0.4138336181640625, 0.439208984375, 0.4645843505859375, 0.489959716796875, 0.5153350830078125, 0.54071044921875, 0.5660858154296875, 0.591461181640625, 0.6168365478515625, 0.6422119140625, 0.6675872802734375, 0.692962646484375, 0.7183380126953125, 0.74371337890625, 0.7690887451171875, 0.794464111328125, 0.8198394775390625, 0.84521484375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 3.0, 4.0, 16.0, 7.0, 14.0, 26.0, 16.0, 20.0, 38.0, 39.0, 49.0, 50.0, 68.0, 64.0, 65.0, 56.0, 68.0, 63.0, 52.0, 49.0, 40.0, 39.0, 34.0, 29.0, 22.0, 13.0, 11.0, 13.0, 4.0, 7.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.301513671875, -0.2904052734375, -0.279296875, -0.2681884765625, -0.257080078125, -0.2459716796875, -0.23486328125, -0.2237548828125, -0.212646484375, -0.2015380859375, -0.1904296875, -0.1793212890625, -0.168212890625, -0.1571044921875, -0.14599609375, -0.1348876953125, -0.123779296875, -0.1126708984375, -0.1015625, -0.0904541015625, -0.079345703125, -0.0682373046875, -0.05712890625, -0.0460205078125, -0.034912109375, -0.0238037109375, -0.0126953125, -0.0015869140625, 0.009521484375, 0.0206298828125, 0.03173828125, 0.0428466796875, 0.053955078125, 0.0650634765625, 0.076171875, 0.0872802734375, 0.098388671875, 0.1094970703125, 0.12060546875, 0.1317138671875, 0.142822265625, 0.1539306640625, 0.1650390625, 0.1761474609375, 0.187255859375, 0.1983642578125, 0.20947265625, 0.2205810546875, 0.231689453125, 0.2427978515625, 0.25390625, 0.2650146484375, 0.276123046875, 0.2872314453125, 0.29833984375, 0.3094482421875, 0.320556640625, 0.3316650390625, 0.3427734375, 0.3538818359375, 0.364990234375, 0.3760986328125, 0.38720703125, 0.3983154296875, 0.409423828125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 2.0, 3.0, 10.0, 11.0, 9.0, 16.0, 30.0, 29.0, 53.0, 78.0, 97.0, 120.0, 210.0, 305.0, 521.0, 797.0, 1326.0, 2534.0, 5299.0, 12747.0, 42925.0, 234995.0, 588075.0, 114553.0, 26005.0, 8895.0, 3947.0, 1946.0, 1110.0, 632.0, 432.0, 287.0, 178.0, 99.0, 75.0, 55.0, 42.0, 33.0, 23.0, 12.0, 7.0, 2.0, 12.0, 11.0, 5.0, 5.0, 0.0, 3.0, 3.0, 0.0, 2.0], "bins": [-0.72412109375, -0.70361328125, -0.68310546875, -0.66259765625, -0.64208984375, -0.62158203125, -0.60107421875, -0.58056640625, -0.56005859375, -0.53955078125, -0.51904296875, -0.49853515625, -0.47802734375, -0.45751953125, -0.43701171875, -0.41650390625, -0.39599609375, -0.37548828125, -0.35498046875, -0.33447265625, -0.31396484375, -0.29345703125, -0.27294921875, -0.25244140625, -0.23193359375, -0.21142578125, -0.19091796875, -0.17041015625, -0.14990234375, -0.12939453125, -0.10888671875, -0.08837890625, -0.06787109375, -0.04736328125, -0.02685546875, -0.00634765625, 0.01416015625, 0.03466796875, 0.05517578125, 0.07568359375, 0.09619140625, 0.11669921875, 0.13720703125, 0.15771484375, 0.17822265625, 0.19873046875, 0.21923828125, 0.23974609375, 0.26025390625, 0.28076171875, 0.30126953125, 0.32177734375, 0.34228515625, 0.36279296875, 0.38330078125, 0.40380859375, 0.42431640625, 0.44482421875, 0.46533203125, 0.48583984375, 0.50634765625, 0.52685546875, 0.54736328125, 0.56787109375, 0.58837890625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 7.0, 9.0, 11.0, 34.0, 86.0, 280.0, 361.0, 125.0, 47.0, 18.0, 7.0, 8.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002505779266357422, -0.00024061650037765503, -0.00023065507411956787, -0.0002206936478614807, -0.00021073222160339355, -0.0002007707953453064, -0.00019080936908721924, -0.00018084794282913208, -0.00017088651657104492, -0.00016092509031295776, -0.0001509636640548706, -0.00014100223779678345, -0.0001310408115386963, -0.00012107938528060913, -0.00011111795902252197, -0.00010115653276443481, -9.119510650634766e-05, -8.12336802482605e-05, -7.127225399017334e-05, -6.131082773208618e-05, -5.1349401473999023e-05, -4.1387975215911865e-05, -3.142654895782471e-05, -2.146512269973755e-05, -1.150369644165039e-05, -1.5422701835632324e-06, 8.419156074523926e-06, 1.8380582332611084e-05, 2.8342008590698242e-05, 3.83034348487854e-05, 4.826486110687256e-05, 5.822628736495972e-05, 6.818771362304688e-05, 7.814913988113403e-05, 8.811056613922119e-05, 9.807199239730835e-05, 0.00010803341865539551, 0.00011799484491348267, 0.00012795627117156982, 0.00013791769742965698, 0.00014787912368774414, 0.0001578405499458313, 0.00016780197620391846, 0.00017776340246200562, 0.00018772482872009277, 0.00019768625497817993, 0.0002076476812362671, 0.00021760910749435425, 0.0002275705337524414, 0.00023753196001052856, 0.0002474933862686157, 0.0002574548125267029, 0.00026741623878479004, 0.0002773776650428772, 0.00028733909130096436, 0.0002973005175590515, 0.00030726194381713867, 0.00031722337007522583, 0.000327184796333313, 0.00033714622259140015, 0.0003471076488494873, 0.00035706907510757446, 0.0003670305013656616, 0.0003769919276237488, 0.00038695335388183594]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 2.0, 11.0, 7.0, 18.0, 19.0, 27.0, 38.0, 87.0, 119.0, 216.0, 395.0, 798.0, 1809.0, 4710.0, 13877.0, 66152.0, 694381.0, 224928.0, 27903.0, 7735.0, 2881.0, 1228.0, 533.0, 279.0, 153.0, 99.0, 57.0, 41.0, 17.0, 19.0, 9.0, 6.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83056640625, -0.8016738891601562, -0.7727813720703125, -0.7438888549804688, -0.714996337890625, -0.6861038208007812, -0.6572113037109375, -0.6283187866210938, -0.59942626953125, -0.5705337524414062, -0.5416412353515625, -0.5127487182617188, -0.483856201171875, -0.45496368408203125, -0.4260711669921875, -0.39717864990234375, -0.3682861328125, -0.33939361572265625, -0.3105010986328125, -0.28160858154296875, -0.252716064453125, -0.22382354736328125, -0.1949310302734375, -0.16603851318359375, -0.13714599609375, -0.10825347900390625, -0.0793609619140625, -0.05046844482421875, -0.021575927734375, 0.00731658935546875, 0.0362091064453125, 0.06510162353515625, 0.093994140625, 0.12288665771484375, 0.1517791748046875, 0.18067169189453125, 0.209564208984375, 0.23845672607421875, 0.2673492431640625, 0.29624176025390625, 0.32513427734375, 0.35402679443359375, 0.3829193115234375, 0.41181182861328125, 0.440704345703125, 0.46959686279296875, 0.4984893798828125, 0.5273818969726562, 0.5562744140625, 0.5851669311523438, 0.6140594482421875, 0.6429519653320312, 0.671844482421875, 0.7007369995117188, 0.7296295166015625, 0.7585220336914062, 0.78741455078125, 0.8163070678710938, 0.8451995849609375, 0.8740921020507812, 0.902984619140625, 0.9318771362304688, 0.9607696533203125, 0.9896621704101562, 1.0185546875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 4.0, 9.0, 9.0, 12.0, 13.0, 29.0, 35.0, 61.0, 89.0, 119.0, 135.0, 111.0, 111.0, 79.0, 44.0, 39.0, 38.0, 13.0, 9.0, 8.0, 7.0, 10.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.42578125, -0.4150848388671875, -0.404388427734375, -0.3936920166015625, -0.38299560546875, -0.3722991943359375, -0.361602783203125, -0.3509063720703125, -0.3402099609375, -0.3295135498046875, -0.318817138671875, -0.3081207275390625, -0.29742431640625, -0.2867279052734375, -0.276031494140625, -0.2653350830078125, -0.254638671875, -0.2439422607421875, -0.233245849609375, -0.2225494384765625, -0.21185302734375, -0.2011566162109375, -0.190460205078125, -0.1797637939453125, -0.1690673828125, -0.1583709716796875, -0.147674560546875, -0.1369781494140625, -0.12628173828125, -0.1155853271484375, -0.104888916015625, -0.0941925048828125, -0.08349609375, -0.0727996826171875, -0.062103271484375, -0.0514068603515625, -0.04071044921875, -0.0300140380859375, -0.019317626953125, -0.0086212158203125, 0.0020751953125, 0.0127716064453125, 0.023468017578125, 0.0341644287109375, 0.04486083984375, 0.0555572509765625, 0.066253662109375, 0.0769500732421875, 0.087646484375, 0.0983428955078125, 0.109039306640625, 0.1197357177734375, 0.13043212890625, 0.1411285400390625, 0.151824951171875, 0.1625213623046875, 0.1732177734375, 0.1839141845703125, 0.194610595703125, 0.2053070068359375, 0.21600341796875, 0.2266998291015625, 0.237396240234375, 0.2480926513671875, 0.2587890625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 17.0, 27.0, 118.0, 295.0, 317.0, 127.0, 56.0, 23.0, 12.0, 8.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.660445213317871, -5.390282154083252, -5.120119571685791, -4.849956512451172, -4.579793453216553, -4.309630393981934, -4.039467811584473, -3.7693047523498535, -3.4991419315338135, -3.2289791107177734, -2.9588160514831543, -2.6886532306671143, -2.418490409851074, -2.148327350616455, -1.878164529800415, -1.6080015897750854, -1.3378386497497559, -1.0676757097244263, -0.7975128293037415, -0.5273499488830566, -0.25718700885772705, 0.012975931167602539, 0.2831387519836426, 0.5533016920089722, 0.8234646320343018, 1.0936275720596313, 1.363790512084961, 1.633953332901001, 1.9041162729263306, 2.17427921295166, 2.4444420337677, 2.7146048545837402, 2.9847679138183594, 3.2549307346343994, 3.5250937938690186, 3.7952566146850586, 4.065419673919678, 4.335582733154297, 4.605745315551758, 4.875908374786377, 5.146071434020996, 5.416234493255615, 5.686397075653076, 5.956560134887695, 6.2267231941223145, 6.496886253356934, 6.7670488357543945, 7.037211894989014, 7.307374477386475, 7.577537536621094, 7.847700119018555, 8.117862701416016, 8.388026237487793, 8.658188819885254, 8.928352355957031, 9.198514938354492, 9.468677520751953, 9.738840103149414, 10.009003639221191, 10.279166221618652, 10.549328804016113, 10.81949234008789, 11.089654922485352, 11.359817504882812, 11.62998104095459]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 9.0, 8.0, 6.0, 14.0, 19.0, 15.0, 18.0, 16.0, 21.0, 26.0, 37.0, 28.0, 38.0, 41.0, 40.0, 34.0, 48.0, 53.0, 54.0, 52.0, 46.0, 47.0, 44.0, 36.0, 40.0, 33.0, 31.0, 26.0, 24.0, 15.0, 18.0, 16.0, 11.0, 10.0, 6.0, 7.0, 6.0, 6.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8338738679885864, -1.777823805809021, -1.7217738628387451, -1.6657238006591797, -1.6096737384796143, -1.5536236763000488, -1.497573733329773, -1.4415236711502075, -1.3854737281799316, -1.3294236660003662, -1.2733737230300903, -1.217323660850525, -1.1612735986709595, -1.1052236557006836, -1.0491735935211182, -0.9931235313415527, -0.9370734691619873, -0.8810234665870667, -0.8249734044075012, -0.7689234018325806, -0.7128733396530151, -0.6568233370780945, -0.6007733345031738, -0.5447232723236084, -0.48867326974868774, -0.4326232373714447, -0.37657320499420166, -0.320523202419281, -0.26447317004203796, -0.20842313766479492, -0.15237313508987427, -0.09632310271263123, -0.040273189544677734, 0.01577683538198471, 0.07182686030864716, 0.127876877784729, 0.18392691016197205, 0.2399769425392151, 0.29602694511413574, 0.3520769774913788, 0.4081270098686218, 0.46417704224586487, 0.5202270746231079, 0.5762770771980286, 0.6323270797729492, 0.6883771419525146, 0.7444271445274353, 0.800477147102356, 0.8565272092819214, 0.912577211856842, 0.9686272740364075, 1.0246772766113281, 1.0807273387908936, 1.136777400970459, 1.1928273439407349, 1.2488774061203003, 1.3049273490905762, 1.3609774112701416, 1.4170273542404175, 1.473077416419983, 1.5291274785995483, 1.5851774215698242, 1.6412274837493896, 1.697277545928955, 1.7533276081085205]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 6.0, 5.0, 9.0, 9.0, 15.0, 11.0, 17.0, 17.0, 31.0, 36.0, 31.0, 33.0, 41.0, 46.0, 61.0, 72.0, 122.0, 497.0, 4153990.0, 38841.0, 219.0, 73.0, 35.0, 29.0, 20.0, 11.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.984375, -16.63641357421875, -16.2884521484375, -15.94049072265625, -15.592529296875, -15.24456787109375, -14.8966064453125, -14.54864501953125, -14.20068359375, -13.85272216796875, -13.5047607421875, -13.15679931640625, -12.808837890625, -12.46087646484375, -12.1129150390625, -11.76495361328125, -11.4169921875, -11.06903076171875, -10.7210693359375, -10.37310791015625, -10.025146484375, -9.67718505859375, -9.3292236328125, -8.98126220703125, -8.63330078125, -8.28533935546875, -7.9373779296875, -7.58941650390625, -7.241455078125, -6.89349365234375, -6.5455322265625, -6.19757080078125, -5.849609375, -5.50164794921875, -5.1536865234375, -4.80572509765625, -4.457763671875, -4.10980224609375, -3.7618408203125, -3.41387939453125, -3.06591796875, -2.71795654296875, -2.3699951171875, -2.02203369140625, -1.674072265625, -1.32611083984375, -0.9781494140625, -0.63018798828125, -0.2822265625, 0.06573486328125, 0.4136962890625, 0.76165771484375, 1.109619140625, 1.45758056640625, 1.8055419921875, 2.15350341796875, 2.50146484375, 2.84942626953125, 3.1973876953125, 3.54534912109375, 3.893310546875, 4.24127197265625, 4.5892333984375, 4.93719482421875, 5.28515625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 30.0, 112.0, 295.0, 341.0, 176.0, 47.0, 13.0, 4.0], "bins": [-0.489990234375, -0.4817051887512207, -0.4734201431274414, -0.4651350975036621, -0.4568500518798828, -0.4485650062561035, -0.4402799606323242, -0.4319949150085449, -0.4237098693847656, -0.41542482376098633, -0.40713977813720703, -0.39885473251342773, -0.39056968688964844, -0.38228464126586914, -0.37399959564208984, -0.36571455001831055, -0.35742950439453125, -0.34914445877075195, -0.34085941314697266, -0.33257436752319336, -0.32428932189941406, -0.31600427627563477, -0.30771923065185547, -0.29943418502807617, -0.2911491394042969, -0.2828640937805176, -0.2745790481567383, -0.266294002532959, -0.2580089569091797, -0.2497239112854004, -0.2414388656616211, -0.2331538200378418, -0.2248687744140625, -0.2165837287902832, -0.2082986831665039, -0.2000136375427246, -0.1917285919189453, -0.18344354629516602, -0.17515850067138672, -0.16687345504760742, -0.15858840942382812, -0.15030336380004883, -0.14201831817626953, -0.13373327255249023, -0.12544822692871094, -0.11716318130493164, -0.10887813568115234, -0.10059309005737305, -0.09230804443359375, -0.08402299880981445, -0.07573795318603516, -0.06745290756225586, -0.05916786193847656, -0.050882816314697266, -0.04259777069091797, -0.03431272506713867, -0.026027679443359375, -0.017742633819580078, -0.009457588195800781, -0.0011725425720214844, 0.0071125030517578125, 0.01539754867553711, 0.023682594299316406, 0.0319676399230957, 0.040252685546875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 6.0, 5.0, 8.0, 13.0, 21.0, 28.0, 27.0, 48.0, 48.0, 72.0, 108.0, 123.0, 156.0, 180.0, 929.0, 4137543.0, 53914.0, 428.0, 157.0, 106.0, 76.0, 50.0, 68.0, 58.0, 48.0, 18.0, 15.0, 13.0, 11.0, 8.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.40625, -18.683837890625, -17.96142578125, -17.239013671875, -16.5166015625, -15.794189453125, -15.07177734375, -14.349365234375, -13.626953125, -12.904541015625, -12.18212890625, -11.459716796875, -10.7373046875, -10.014892578125, -9.29248046875, -8.570068359375, -7.84765625, -7.125244140625, -6.40283203125, -5.680419921875, -4.9580078125, -4.235595703125, -3.51318359375, -2.790771484375, -2.068359375, -1.345947265625, -0.62353515625, 0.098876953125, 0.8212890625, 1.543701171875, 2.26611328125, 2.988525390625, 3.7109375, 4.433349609375, 5.15576171875, 5.878173828125, 6.6005859375, 7.322998046875, 8.04541015625, 8.767822265625, 9.490234375, 10.212646484375, 10.93505859375, 11.657470703125, 12.3798828125, 13.102294921875, 13.82470703125, 14.547119140625, 15.26953125, 15.991943359375, 16.71435546875, 17.436767578125, 18.1591796875, 18.881591796875, 19.60400390625, 20.326416015625, 21.048828125, 21.771240234375, 22.49365234375, 23.216064453125, 23.9384765625, 24.660888671875, 25.38330078125, 26.105712890625, 26.828125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 32.0, 129.0, 3463.0, 354.0, 75.0, 10.0, 9.0, 6.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.658203125, -2.6077423095703125, -2.557281494140625, -2.5068206787109375, -2.45635986328125, -2.4058990478515625, -2.355438232421875, -2.3049774169921875, -2.2545166015625, -2.2040557861328125, -2.153594970703125, -2.1031341552734375, -2.05267333984375, -2.0022125244140625, -1.951751708984375, -1.9012908935546875, -1.850830078125, -1.8003692626953125, -1.749908447265625, -1.6994476318359375, -1.64898681640625, -1.5985260009765625, -1.548065185546875, -1.4976043701171875, -1.4471435546875, -1.3966827392578125, -1.346221923828125, -1.2957611083984375, -1.24530029296875, -1.1948394775390625, -1.144378662109375, -1.0939178466796875, -1.04345703125, -0.9929962158203125, -0.942535400390625, -0.8920745849609375, -0.84161376953125, -0.7911529541015625, -0.740692138671875, -0.6902313232421875, -0.6397705078125, -0.5893096923828125, -0.538848876953125, -0.4883880615234375, -0.43792724609375, -0.3874664306640625, -0.337005615234375, -0.2865447998046875, -0.236083984375, -0.1856231689453125, -0.135162353515625, -0.0847015380859375, -0.03424072265625, 0.0162200927734375, 0.066680908203125, 0.1171417236328125, 0.1676025390625, 0.2180633544921875, 0.268524169921875, 0.3189849853515625, 0.36944580078125, 0.4199066162109375, 0.470367431640625, 0.5208282470703125, 0.5712890625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 5.0, 11.0, 66.0, 658.0, 227.0, 32.0, 8.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-61.27079772949219, -60.03901290893555, -58.80722427368164, -57.575439453125, -56.34365463256836, -55.11186599731445, -53.88008117675781, -52.648292541503906, -51.416507720947266, -50.184722900390625, -48.95293426513672, -47.72114944458008, -46.48936462402344, -45.25757598876953, -44.02579116821289, -42.79400634765625, -41.562217712402344, -40.3304328918457, -39.0986442565918, -37.866859436035156, -36.635074615478516, -35.40328598022461, -34.17150115966797, -32.93971252441406, -31.707931518554688, -30.476144790649414, -29.244359970092773, -28.0125732421875, -26.780786514282227, -25.548999786376953, -24.317214965820312, -23.08542823791504, -21.853641510009766, -20.621854782104492, -19.39006996154785, -18.158283233642578, -16.926496505737305, -15.694710731506348, -14.46292495727539, -13.231138229370117, -11.99935245513916, -10.767566680908203, -9.53577995300293, -8.303994178771973, -7.072207927703857, -5.840421676635742, -4.608635902404785, -3.3768491744995117, -2.1450634002685547, -0.913277268409729, 0.3185088634490967, 1.5502948760986328, 2.782081127166748, 4.013867378234863, 5.24565315246582, 6.477439880371094, 7.709225654602051, 8.941011428833008, 10.172798156738281, 11.404583930969238, 12.636369705200195, 13.868156433105469, 15.099942207336426, 16.331729888916016, 17.563514709472656]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 4.0, 7.0, 20.0, 36.0, 60.0, 102.0, 127.0, 149.0, 141.0, 117.0, 95.0, 68.0, 37.0, 22.0, 11.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.504648208618164, -8.22883415222168, -7.9530205726623535, -7.677206993103027, -7.401392936706543, -7.125579357147217, -6.849765777587891, -6.573951721191406, -6.298137664794922, -6.022324085235596, -5.746510028839111, -5.470696449279785, -5.194882392883301, -4.919068813323975, -4.643255233764648, -4.367441177368164, -4.091627597808838, -3.8158137798309326, -3.5399999618530273, -3.264186382293701, -2.988372325897217, -2.7125587463378906, -2.4367449283599854, -2.16093111038208, -1.8851172924041748, -1.6093034744262695, -1.3334896564483643, -1.0576759576797485, -0.7818621397018433, -0.506048321723938, -0.23023462295532227, 0.04557919502258301, 0.3213930130004883, 0.5972068309783936, 0.873020589351654, 1.1488343477249146, 1.4246481657028198, 1.700461983680725, 1.9762756824493408, 2.252089500427246, 2.5279033184051514, 2.8037171363830566, 3.079530954360962, 3.355344772338867, 3.6311583518981934, 3.9069724082946777, 4.182785987854004, 4.458600044250488, 4.7344136238098145, 5.010227203369141, 5.286041259765625, 5.561854839324951, 5.8376688957214355, 6.113482475280762, 6.389296531677246, 6.665110111236572, 6.940923690795898, 7.216737270355225, 7.492551326751709, 7.768364906311035, 8.04417896270752, 8.319993019104004, 8.595806121826172, 8.871620178222656, 9.14743423461914]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 7.0, 6.0, 20.0, 15.0, 23.0, 23.0, 36.0, 47.0, 74.0, 140.0, 280.0, 524.0, 1308.0, 4565.0, 40977.0, 834252.0, 151708.0, 10822.0, 2007.0, 793.0, 381.0, 187.0, 113.0, 67.0, 53.0, 32.0, 27.0, 13.0, 15.0, 10.0, 6.0, 7.0, 7.0, 2.0, 1.0, 4.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.16796875, -6.9420166015625, -6.716064453125, -6.4901123046875, -6.26416015625, -6.0382080078125, -5.812255859375, -5.5863037109375, -5.3603515625, -5.1343994140625, -4.908447265625, -4.6824951171875, -4.45654296875, -4.2305908203125, -4.004638671875, -3.7786865234375, -3.552734375, -3.3267822265625, -3.100830078125, -2.8748779296875, -2.64892578125, -2.4229736328125, -2.197021484375, -1.9710693359375, -1.7451171875, -1.5191650390625, -1.293212890625, -1.0672607421875, -0.84130859375, -0.6153564453125, -0.389404296875, -0.1634521484375, 0.0625, 0.2884521484375, 0.514404296875, 0.7403564453125, 0.96630859375, 1.1922607421875, 1.418212890625, 1.6441650390625, 1.8701171875, 2.0960693359375, 2.322021484375, 2.5479736328125, 2.77392578125, 2.9998779296875, 3.225830078125, 3.4517822265625, 3.677734375, 3.9036865234375, 4.129638671875, 4.3555908203125, 4.58154296875, 4.8074951171875, 5.033447265625, 5.2593994140625, 5.4853515625, 5.7113037109375, 5.937255859375, 6.1632080078125, 6.38916015625, 6.6151123046875, 6.841064453125, 7.0670166015625, 7.29296875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 4.0, 13.0, 23.0, 36.0, 78.0, 127.0, 172.0, 181.0, 147.0, 100.0, 63.0, 36.0, 15.0, 8.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.701171875, -0.6849327087402344, -0.6686935424804688, -0.6524543762207031, -0.6362152099609375, -0.6199760437011719, -0.6037368774414062, -0.5874977111816406, -0.571258544921875, -0.5550193786621094, -0.5387802124023438, -0.5225410461425781, -0.5063018798828125, -0.4900627136230469, -0.47382354736328125, -0.4575843811035156, -0.44134521484375, -0.4251060485839844, -0.40886688232421875, -0.3926277160644531, -0.3763885498046875, -0.3601493835449219, -0.34391021728515625, -0.3276710510253906, -0.311431884765625, -0.2951927185058594, -0.27895355224609375, -0.2627143859863281, -0.2464752197265625, -0.23023605346679688, -0.21399688720703125, -0.19775772094726562, -0.1815185546875, -0.16527938842773438, -0.14904022216796875, -0.13280105590820312, -0.1165618896484375, -0.10032272338867188, -0.08408355712890625, -0.06784439086914062, -0.051605224609375, -0.035366058349609375, -0.01912689208984375, -0.002887725830078125, 0.0133514404296875, 0.029590606689453125, 0.04582977294921875, 0.062068939208984375, 0.07830810546875, 0.09454727172851562, 0.11078643798828125, 0.12702560424804688, 0.1432647705078125, 0.15950393676757812, 0.17574310302734375, 0.19198226928710938, 0.208221435546875, 0.22446060180664062, 0.24069976806640625, 0.2569389343261719, 0.2731781005859375, 0.2894172668457031, 0.30565643310546875, 0.3218955993652344, 0.338134765625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 5.0, 11.0, 17.0, 19.0, 26.0, 32.0, 32.0, 90.0, 87.0, 135.0, 215.0, 382.0, 581.0, 1146.0, 2566.0, 6568.0, 19637.0, 75335.0, 538532.0, 326146.0, 52575.0, 14865.0, 5075.0, 2147.0, 917.0, 501.0, 278.0, 208.0, 141.0, 73.0, 69.0, 51.0, 28.0, 17.0, 11.0, 12.0, 9.0, 8.0, 2.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.32421875, -2.2575836181640625, -2.190948486328125, -2.1243133544921875, -2.05767822265625, -1.9910430908203125, -1.924407958984375, -1.8577728271484375, -1.7911376953125, -1.7245025634765625, -1.657867431640625, -1.5912322998046875, -1.52459716796875, -1.4579620361328125, -1.391326904296875, -1.3246917724609375, -1.258056640625, -1.1914215087890625, -1.124786376953125, -1.0581512451171875, -0.99151611328125, -0.9248809814453125, -0.858245849609375, -0.7916107177734375, -0.7249755859375, -0.6583404541015625, -0.591705322265625, -0.5250701904296875, -0.45843505859375, -0.3917999267578125, -0.325164794921875, -0.2585296630859375, -0.19189453125, -0.1252593994140625, -0.058624267578125, 0.0080108642578125, 0.07464599609375, 0.1412811279296875, 0.207916259765625, 0.2745513916015625, 0.3411865234375, 0.4078216552734375, 0.474456787109375, 0.5410919189453125, 0.60772705078125, 0.6743621826171875, 0.740997314453125, 0.8076324462890625, 0.874267578125, 0.9409027099609375, 1.007537841796875, 1.0741729736328125, 1.14080810546875, 1.2074432373046875, 1.274078369140625, 1.3407135009765625, 1.4073486328125, 1.4739837646484375, 1.540618896484375, 1.6072540283203125, 1.67388916015625, 1.7405242919921875, 1.807159423828125, 1.8737945556640625, 1.9404296875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 2.0, 2.0, 11.0, 4.0, 9.0, 13.0, 14.0, 15.0, 16.0, 26.0, 33.0, 25.0, 29.0, 57.0, 45.0, 50.0, 57.0, 60.0, 68.0, 57.0, 51.0, 39.0, 46.0, 52.0, 34.0, 26.0, 34.0, 20.0, 21.0, 16.0, 15.0, 16.0, 5.0, 12.0, 7.0, 3.0, 5.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80126953125, -0.775054931640625, -0.74884033203125, -0.722625732421875, -0.6964111328125, -0.670196533203125, -0.64398193359375, -0.617767333984375, -0.591552734375, -0.565338134765625, -0.53912353515625, -0.512908935546875, -0.4866943359375, -0.460479736328125, -0.43426513671875, -0.408050537109375, -0.3818359375, -0.355621337890625, -0.32940673828125, -0.303192138671875, -0.2769775390625, -0.250762939453125, -0.22454833984375, -0.198333740234375, -0.172119140625, -0.145904541015625, -0.11968994140625, -0.093475341796875, -0.0672607421875, -0.041046142578125, -0.01483154296875, 0.011383056640625, 0.03759765625, 0.063812255859375, 0.09002685546875, 0.116241455078125, 0.1424560546875, 0.168670654296875, 0.19488525390625, 0.221099853515625, 0.247314453125, 0.273529052734375, 0.29974365234375, 0.325958251953125, 0.3521728515625, 0.378387451171875, 0.40460205078125, 0.430816650390625, 0.45703125, 0.483245849609375, 0.50946044921875, 0.535675048828125, 0.5618896484375, 0.588104248046875, 0.61431884765625, 0.640533447265625, 0.666748046875, 0.692962646484375, 0.71917724609375, 0.745391845703125, 0.7716064453125, 0.797821044921875, 0.82403564453125, 0.850250244140625, 0.87646484375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 7.0, 1.0, 5.0, 2.0, 7.0, 6.0, 5.0, 22.0, 24.0, 47.0, 65.0, 120.0, 176.0, 344.0, 664.0, 1632.0, 4922.0, 25604.0, 723982.0, 267231.0, 17165.0, 3872.0, 1326.0, 573.0, 290.0, 183.0, 102.0, 66.0, 29.0, 27.0, 25.0, 16.0, 4.0, 5.0, 9.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0], "bins": [-4.08203125, -3.977081298828125, -3.87213134765625, -3.767181396484375, -3.6622314453125, -3.557281494140625, -3.45233154296875, -3.347381591796875, -3.242431640625, -3.137481689453125, -3.03253173828125, -2.927581787109375, -2.8226318359375, -2.717681884765625, -2.61273193359375, -2.507781982421875, -2.40283203125, -2.297882080078125, -2.19293212890625, -2.087982177734375, -1.9830322265625, -1.878082275390625, -1.77313232421875, -1.668182373046875, -1.563232421875, -1.458282470703125, -1.35333251953125, -1.248382568359375, -1.1434326171875, -1.038482666015625, -0.93353271484375, -0.828582763671875, -0.7236328125, -0.618682861328125, -0.51373291015625, -0.408782958984375, -0.3038330078125, -0.198883056640625, -0.09393310546875, 0.011016845703125, 0.115966796875, 0.220916748046875, 0.32586669921875, 0.430816650390625, 0.5357666015625, 0.640716552734375, 0.74566650390625, 0.850616455078125, 0.95556640625, 1.060516357421875, 1.16546630859375, 1.270416259765625, 1.3753662109375, 1.480316162109375, 1.58526611328125, 1.690216064453125, 1.795166015625, 1.900115966796875, 2.00506591796875, 2.110015869140625, 2.2149658203125, 2.319915771484375, 2.42486572265625, 2.529815673828125, 2.634765625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 5.0, 6.0, 17.0, 17.0, 25.0, 26.0, 74.0, 175.0, 290.0, 159.0, 82.0, 40.0, 17.0, 17.0, 10.0, 8.0, 10.0, 10.0, 7.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003447532653808594, -0.00033174455165863037, -0.00031873583793640137, -0.00030572712421417236, -0.00029271841049194336, -0.00027970969676971436, -0.00026670098304748535, -0.00025369226932525635, -0.00024068355560302734, -0.00022767484188079834, -0.00021466612815856934, -0.00020165741443634033, -0.00018864870071411133, -0.00017563998699188232, -0.00016263127326965332, -0.00014962255954742432, -0.0001366138458251953, -0.0001236051321029663, -0.0001105964183807373, -9.75877046585083e-05, -8.45789909362793e-05, -7.157027721405029e-05, -5.856156349182129e-05, -4.5552849769592285e-05, -3.254413604736328e-05, -1.9535422325134277e-05, -6.5267086029052734e-06, 6.4820051193237305e-06, 1.9490718841552734e-05, 3.249943256378174e-05, 4.550814628601074e-05, 5.8516860008239746e-05, 7.152557373046875e-05, 8.453428745269775e-05, 9.754300117492676e-05, 0.00011055171489715576, 0.00012356042861938477, 0.00013656914234161377, 0.00014957785606384277, 0.00016258656978607178, 0.00017559528350830078, 0.00018860399723052979, 0.0002016127109527588, 0.0002146214246749878, 0.0002276301383972168, 0.0002406388521194458, 0.0002536475658416748, 0.0002666562795639038, 0.0002796649932861328, 0.0002926737070083618, 0.0003056824207305908, 0.0003186911344528198, 0.00033169984817504883, 0.00034470856189727783, 0.00035771727561950684, 0.00037072598934173584, 0.00038373470306396484, 0.00039674341678619385, 0.00040975213050842285, 0.00042276084423065186, 0.00043576955795288086, 0.00044877827167510986, 0.00046178698539733887, 0.00047479569911956787, 0.0004878044128417969]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 8.0, 13.0, 16.0, 27.0, 30.0, 54.0, 114.0, 185.0, 370.0, 704.0, 1468.0, 3931.0, 12225.0, 58040.0, 739582.0, 195946.0, 24773.0, 6654.0, 2295.0, 1015.0, 466.0, 258.0, 144.0, 84.0, 47.0, 32.0, 25.0, 12.0, 13.0, 6.0, 4.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7197265625, -1.6554412841796875, -1.591156005859375, -1.5268707275390625, -1.46258544921875, -1.3983001708984375, -1.334014892578125, -1.2697296142578125, -1.2054443359375, -1.1411590576171875, -1.076873779296875, -1.0125885009765625, -0.94830322265625, -0.8840179443359375, -0.819732666015625, -0.7554473876953125, -0.691162109375, -0.6268768310546875, -0.562591552734375, -0.4983062744140625, -0.43402099609375, -0.3697357177734375, -0.305450439453125, -0.2411651611328125, -0.1768798828125, -0.1125946044921875, -0.048309326171875, 0.0159759521484375, 0.08026123046875, 0.1445465087890625, 0.208831787109375, 0.2731170654296875, 0.33740234375, 0.4016876220703125, 0.465972900390625, 0.5302581787109375, 0.59454345703125, 0.6588287353515625, 0.723114013671875, 0.7873992919921875, 0.8516845703125, 0.9159698486328125, 0.980255126953125, 1.0445404052734375, 1.10882568359375, 1.1731109619140625, 1.237396240234375, 1.3016815185546875, 1.365966796875, 1.4302520751953125, 1.494537353515625, 1.5588226318359375, 1.62310791015625, 1.6873931884765625, 1.751678466796875, 1.8159637451171875, 1.8802490234375, 1.9445343017578125, 2.008819580078125, 2.0731048583984375, 2.13739013671875, 2.2016754150390625, 2.265960693359375, 2.3302459716796875, 2.39453125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 5.0, 5.0, 2.0, 3.0, 4.0, 7.0, 12.0, 15.0, 14.0, 14.0, 20.0, 38.0, 39.0, 53.0, 95.0, 106.0, 126.0, 124.0, 96.0, 59.0, 51.0, 23.0, 18.0, 18.0, 12.0, 12.0, 6.0, 5.0, 6.0, 2.0, 6.0, 5.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61376953125, -0.5904693603515625, -0.567169189453125, -0.5438690185546875, -0.52056884765625, -0.4972686767578125, -0.473968505859375, -0.4506683349609375, -0.4273681640625, -0.4040679931640625, -0.380767822265625, -0.3574676513671875, -0.33416748046875, -0.3108673095703125, -0.287567138671875, -0.2642669677734375, -0.240966796875, -0.2176666259765625, -0.194366455078125, -0.1710662841796875, -0.14776611328125, -0.1244659423828125, -0.101165771484375, -0.0778656005859375, -0.0545654296875, -0.0312652587890625, -0.007965087890625, 0.0153350830078125, 0.03863525390625, 0.0619354248046875, 0.085235595703125, 0.1085357666015625, 0.1318359375, 0.1551361083984375, 0.178436279296875, 0.2017364501953125, 0.22503662109375, 0.2483367919921875, 0.271636962890625, 0.2949371337890625, 0.3182373046875, 0.3415374755859375, 0.364837646484375, 0.3881378173828125, 0.41143798828125, 0.4347381591796875, 0.458038330078125, 0.4813385009765625, 0.504638671875, 0.5279388427734375, 0.551239013671875, 0.5745391845703125, 0.59783935546875, 0.6211395263671875, 0.644439697265625, 0.6677398681640625, 0.6910400390625, 0.7143402099609375, 0.737640380859375, 0.7609405517578125, 0.78424072265625, 0.8075408935546875, 0.830841064453125, 0.8541412353515625, 0.87744140625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 18.0, 64.0, 270.0, 390.0, 183.0, 39.0, 21.0, 6.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.416507720947266, -29.623523712158203, -28.83053970336914, -28.037555694580078, -27.244569778442383, -26.45158576965332, -25.658601760864258, -24.865617752075195, -24.0726318359375, -23.279647827148438, -22.486663818359375, -21.693679809570312, -20.900693893432617, -20.107709884643555, -19.314725875854492, -18.52174186706543, -17.728757858276367, -16.935773849487305, -16.142789840698242, -15.349804878234863, -14.556819915771484, -13.763835906982422, -12.97085189819336, -12.177867889404297, -11.384882926940918, -10.591898918151855, -9.798913955688477, -9.005929946899414, -8.212945938110352, -7.419960975646973, -6.62697696685791, -5.8339924812316895, -5.041009902954102, -4.248025417327881, -3.4550411701202393, -2.6620569229125977, -1.869072437286377, -1.0760879516601562, -0.28310394287109375, 0.509880542755127, 1.3028650283813477, 2.0958495140075684, 2.88883376121521, 3.6818180084228516, 4.474802494049072, 5.267786979675293, 6.0607709884643555, 6.853755474090576, 7.646739959716797, 8.43972396850586, 9.232708930969238, 10.0256929397583, 10.81867790222168, 11.611661911010742, 12.404645919799805, 13.197629928588867, 13.990614891052246, 14.783598899841309, 15.576583862304688, 16.36956787109375, 17.162551879882812, 17.955535888671875, 18.748519897460938, 19.541505813598633, 20.334489822387695]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 5.0, 3.0, 1.0, 12.0, 15.0, 20.0, 17.0, 34.0, 34.0, 25.0, 31.0, 42.0, 55.0, 53.0, 49.0, 60.0, 54.0, 57.0, 47.0, 57.0, 52.0, 52.0, 31.0, 38.0, 25.0, 30.0, 22.0, 14.0, 17.0, 13.0, 7.0, 6.0, 4.0, 4.0, 3.0, 3.0, 3.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.527797222137451, -5.354232311248779, -5.180667400360107, -5.0071024894714355, -4.833537578582764, -4.659972667694092, -4.486408233642578, -4.312843322753906, -4.139278411865234, -3.9657135009765625, -3.7921485900878906, -3.6185836791992188, -3.445018768310547, -3.271453857421875, -3.0978891849517822, -2.9243242740631104, -2.7507591247558594, -2.5771942138671875, -2.4036293029785156, -2.2300643920898438, -2.056499481201172, -1.8829346895217896, -1.7093698978424072, -1.5358049869537354, -1.3622400760650635, -1.1886751651763916, -1.0151102542877197, -0.8415454626083374, -0.6679805517196655, -0.49441564083099365, -0.32085084915161133, -0.14728593826293945, 0.02627849578857422, 0.1998433768749237, 0.3734082579612732, 0.5469731092453003, 0.7205380201339722, 0.894102931022644, 1.0676677227020264, 1.2412326335906982, 1.4147975444793701, 1.588362455368042, 1.7619273662567139, 1.9354921579360962, 2.1090569496154785, 2.2826218605041504, 2.4561867713928223, 2.629751682281494, 2.803316593170166, 2.976881504058838, 3.1504464149475098, 3.3240113258361816, 3.4975762367248535, 3.6711411476135254, 3.844705820083618, 4.018270492553711, 4.191835403442383, 4.365400314331055, 4.538965225219727, 4.712530136108398, 4.88609504699707, 5.059659957885742, 5.233224868774414, 5.406789779663086, 5.580354690551758]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 3.0, 8.0, 4.0, 3.0, 4.0, 6.0, 10.0, 12.0, 12.0, 15.0, 14.0, 24.0, 13.0, 22.0, 42.0, 51.0, 60.0, 101.0, 153.0, 246.0, 413.0, 880.0, 2649.0, 10797.0, 91415.0, 4027789.0, 48474.0, 7985.0, 1905.0, 643.0, 263.0, 124.0, 72.0, 33.0, 18.0, 7.0, 7.0, 4.0, 3.0, 3.0, 1.0], "bins": [-13.5234375, -13.24383544921875, -12.9642333984375, -12.68463134765625, -12.405029296875, -12.12542724609375, -11.8458251953125, -11.56622314453125, -11.28662109375, -11.00701904296875, -10.7274169921875, -10.44781494140625, -10.168212890625, -9.88861083984375, -9.6090087890625, -9.32940673828125, -9.0498046875, -8.77020263671875, -8.4906005859375, -8.21099853515625, -7.931396484375, -7.65179443359375, -7.3721923828125, -7.09259033203125, -6.81298828125, -6.53338623046875, -6.2537841796875, -5.97418212890625, -5.694580078125, -5.41497802734375, -5.1353759765625, -4.85577392578125, -4.576171875, -4.29656982421875, -4.0169677734375, -3.73736572265625, -3.457763671875, -3.17816162109375, -2.8985595703125, -2.61895751953125, -2.33935546875, -2.05975341796875, -1.7801513671875, -1.50054931640625, -1.220947265625, -0.94134521484375, -0.6617431640625, -0.38214111328125, -0.1025390625, 0.17706298828125, 0.4566650390625, 0.73626708984375, 1.015869140625, 1.29547119140625, 1.5750732421875, 1.85467529296875, 2.13427734375, 2.41387939453125, 2.6934814453125, 2.97308349609375, 3.252685546875, 3.53228759765625, 3.8118896484375, 4.09149169921875, 4.37109375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 3.0, 8.0, 13.0, 24.0, 40.0, 76.0, 108.0, 141.0, 152.0, 143.0, 100.0, 80.0, 46.0, 37.0, 19.0, 8.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.69677734375, -0.68243408203125, -0.6680908203125, -0.65374755859375, -0.639404296875, -0.62506103515625, -0.6107177734375, -0.59637451171875, -0.58203125, -0.56768798828125, -0.5533447265625, -0.53900146484375, -0.524658203125, -0.51031494140625, -0.4959716796875, -0.48162841796875, -0.46728515625, -0.45294189453125, -0.4385986328125, -0.42425537109375, -0.409912109375, -0.39556884765625, -0.3812255859375, -0.36688232421875, -0.3525390625, -0.33819580078125, -0.3238525390625, -0.30950927734375, -0.295166015625, -0.28082275390625, -0.2664794921875, -0.25213623046875, -0.23779296875, -0.22344970703125, -0.2091064453125, -0.19476318359375, -0.180419921875, -0.16607666015625, -0.1517333984375, -0.13739013671875, -0.123046875, -0.10870361328125, -0.0943603515625, -0.08001708984375, -0.065673828125, -0.05133056640625, -0.0369873046875, -0.02264404296875, -0.00830078125, 0.00604248046875, 0.0203857421875, 0.03472900390625, 0.049072265625, 0.06341552734375, 0.0777587890625, 0.09210205078125, 0.1064453125, 0.12078857421875, 0.1351318359375, 0.14947509765625, 0.163818359375, 0.17816162109375, 0.1925048828125, 0.20684814453125, 0.22119140625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 5.0, 8.0, 15.0, 17.0, 21.0, 49.0, 81.0, 189.0, 391.0, 964.0, 2771.0, 14155.0, 1663164.0, 2493544.0, 14374.0, 2765.0, 952.0, 394.0, 201.0, 105.0, 43.0, 24.0, 22.0, 9.0, 5.0, 4.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.421875, -10.1060791015625, -9.790283203125, -9.4744873046875, -9.15869140625, -8.8428955078125, -8.527099609375, -8.2113037109375, -7.8955078125, -7.5797119140625, -7.263916015625, -6.9481201171875, -6.63232421875, -6.3165283203125, -6.000732421875, -5.6849365234375, -5.369140625, -5.0533447265625, -4.737548828125, -4.4217529296875, -4.10595703125, -3.7901611328125, -3.474365234375, -3.1585693359375, -2.8427734375, -2.5269775390625, -2.211181640625, -1.8953857421875, -1.57958984375, -1.2637939453125, -0.947998046875, -0.6322021484375, -0.31640625, -0.0006103515625, 0.315185546875, 0.6309814453125, 0.94677734375, 1.2625732421875, 1.578369140625, 1.8941650390625, 2.2099609375, 2.5257568359375, 2.841552734375, 3.1573486328125, 3.47314453125, 3.7889404296875, 4.104736328125, 4.4205322265625, 4.736328125, 5.0521240234375, 5.367919921875, 5.6837158203125, 5.99951171875, 6.3153076171875, 6.631103515625, 6.9468994140625, 7.2626953125, 7.5784912109375, 7.894287109375, 8.2100830078125, 8.52587890625, 8.8416748046875, 9.157470703125, 9.4732666015625, 9.7890625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 9.0, 7.0, 9.0, 17.0, 27.0, 46.0, 81.0, 192.0, 2326.0, 996.0, 155.0, 72.0, 46.0, 37.0, 17.0, 14.0, 5.0, 2.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1005859375, -1.06500244140625, -1.0294189453125, -0.99383544921875, -0.958251953125, -0.92266845703125, -0.8870849609375, -0.85150146484375, -0.81591796875, -0.78033447265625, -0.7447509765625, -0.70916748046875, -0.673583984375, -0.63800048828125, -0.6024169921875, -0.56683349609375, -0.53125, -0.49566650390625, -0.4600830078125, -0.42449951171875, -0.388916015625, -0.35333251953125, -0.3177490234375, -0.28216552734375, -0.24658203125, -0.21099853515625, -0.1754150390625, -0.13983154296875, -0.104248046875, -0.06866455078125, -0.0330810546875, 0.00250244140625, 0.0380859375, 0.07366943359375, 0.1092529296875, 0.14483642578125, 0.180419921875, 0.21600341796875, 0.2515869140625, 0.28717041015625, 0.32275390625, 0.35833740234375, 0.3939208984375, 0.42950439453125, 0.465087890625, 0.50067138671875, 0.5362548828125, 0.57183837890625, 0.607421875, 0.64300537109375, 0.6785888671875, 0.71417236328125, 0.749755859375, 0.78533935546875, 0.8209228515625, 0.85650634765625, 0.89208984375, 0.92767333984375, 0.9632568359375, 0.99884033203125, 1.034423828125, 1.07000732421875, 1.1055908203125, 1.14117431640625, 1.1767578125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 7.0, 10.0, 22.0, 78.0, 158.0, 333.0, 232.0, 85.0, 33.0, 17.0, 9.0, 3.0, 6.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.726259231567383, -11.406473159790039, -11.086686134338379, -10.766900062561035, -10.447113037109375, -10.127326965332031, -9.807539939880371, -9.487753868103027, -9.167966842651367, -8.848180770874023, -8.528393745422363, -8.20860767364502, -7.888820648193359, -7.569034576416016, -7.249248027801514, -6.929461479187012, -6.609675407409668, -6.289888858795166, -5.970102310180664, -5.650315761566162, -5.33052921295166, -5.010743141174316, -4.6909565925598145, -4.3711700439453125, -4.0513834953308105, -3.7315969467163086, -3.4118103981018066, -3.092024087905884, -2.772237539291382, -2.45245099067688, -2.132664680480957, -1.812878131866455, -1.4930925369262695, -1.1733059883117676, -0.8535195589065552, -0.533733069896698, -0.21394658088684082, 0.10583996772766113, 0.42562639713287354, 0.7454128265380859, 1.065199375152588, 1.3849859237670898, 1.7047723531723022, 2.0245587825775146, 2.3443453311920166, 2.6641318798065186, 2.9839181900024414, 3.3037047386169434, 3.6234912872314453, 3.9432778358459473, 4.263064384460449, 4.582850933074951, 4.902637481689453, 5.222423553466797, 5.542210102081299, 5.861996650695801, 6.181783199310303, 6.501569747924805, 6.821356296539307, 7.141142845153809, 7.460928916931152, 7.7807159423828125, 8.100502014160156, 8.4202880859375, 8.74007511138916]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 3.0, 9.0, 6.0, 14.0, 35.0, 40.0, 56.0, 83.0, 77.0, 102.0, 100.0, 103.0, 93.0, 80.0, 78.0, 39.0, 32.0, 20.0, 18.0, 7.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.785714626312256, -5.627998352050781, -5.470282077789307, -5.31256628036499, -5.154850006103516, -4.997133731842041, -4.839417457580566, -4.681701183319092, -4.523984909057617, -4.366268634796143, -4.208552360534668, -4.050836563110352, -3.893120288848877, -3.7354040145874023, -3.5776877403259277, -3.419971466064453, -3.2622556686401367, -3.104539394378662, -2.9468233585357666, -2.789107084274292, -2.6313910484313965, -2.473674774169922, -2.3159584999084473, -2.1582422256469727, -2.000526189804077, -1.842810034751892, -1.685093879699707, -1.5273776054382324, -1.3696614503860474, -1.2119452953338623, -1.0542290210723877, -0.8965128660202026, -0.7387971878051758, -0.5810810327529907, -0.4233648180961609, -0.26564863324165344, -0.107932448387146, 0.04978370666503906, 0.2074999213218689, 0.36521613597869873, 0.5229322910308838, 0.6806484460830688, 0.8383646607398987, 0.9960808753967285, 1.1537970304489136, 1.3115131855010986, 1.4692294597625732, 1.6269456148147583, 1.7846617698669434, 1.9423779249191284, 2.1000940799713135, 2.257810354232788, 2.4155263900756836, 2.573242664337158, 2.730958938598633, 2.8886752128601074, 3.046391248703003, 3.2041075229644775, 3.361823558807373, 3.5195398330688477, 3.6772561073303223, 3.8349721431732178, 3.9926884174346924, 4.150404453277588, 4.3081207275390625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 7.0, 10.0, 13.0, 13.0, 17.0, 25.0, 43.0, 30.0, 61.0, 91.0, 162.0, 275.0, 477.0, 1101.0, 2937.0, 12132.0, 85765.0, 810461.0, 114565.0, 14337.0, 3436.0, 1228.0, 534.0, 320.0, 162.0, 107.0, 79.0, 42.0, 38.0, 23.0, 15.0, 9.0, 7.0, 10.0, 9.0, 3.0, 8.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.20703125, -5.03662109375, -4.8662109375, -4.69580078125, -4.525390625, -4.35498046875, -4.1845703125, -4.01416015625, -3.84375, -3.67333984375, -3.5029296875, -3.33251953125, -3.162109375, -2.99169921875, -2.8212890625, -2.65087890625, -2.48046875, -2.31005859375, -2.1396484375, -1.96923828125, -1.798828125, -1.62841796875, -1.4580078125, -1.28759765625, -1.1171875, -0.94677734375, -0.7763671875, -0.60595703125, -0.435546875, -0.26513671875, -0.0947265625, 0.07568359375, 0.24609375, 0.41650390625, 0.5869140625, 0.75732421875, 0.927734375, 1.09814453125, 1.2685546875, 1.43896484375, 1.609375, 1.77978515625, 1.9501953125, 2.12060546875, 2.291015625, 2.46142578125, 2.6318359375, 2.80224609375, 2.97265625, 3.14306640625, 3.3134765625, 3.48388671875, 3.654296875, 3.82470703125, 3.9951171875, 4.16552734375, 4.3359375, 4.50634765625, 4.6767578125, 4.84716796875, 5.017578125, 5.18798828125, 5.3583984375, 5.52880859375, 5.69921875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 7.0, 16.0, 33.0, 47.0, 67.0, 101.0, 111.0, 134.0, 134.0, 93.0, 93.0, 56.0, 48.0, 23.0, 11.0, 12.0, 7.0, 5.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.669921875, -0.6526679992675781, -0.6354141235351562, -0.6181602478027344, -0.6009063720703125, -0.5836524963378906, -0.5663986206054688, -0.5491447448730469, -0.531890869140625, -0.5146369934082031, -0.49738311767578125, -0.4801292419433594, -0.4628753662109375, -0.4456214904785156, -0.42836761474609375, -0.4111137390136719, -0.39385986328125, -0.3766059875488281, -0.35935211181640625, -0.3420982360839844, -0.3248443603515625, -0.3075904846191406, -0.29033660888671875, -0.2730827331542969, -0.255828857421875, -0.23857498168945312, -0.22132110595703125, -0.20406723022460938, -0.1868133544921875, -0.16955947875976562, -0.15230560302734375, -0.13505172729492188, -0.1177978515625, -0.10054397583007812, -0.08329010009765625, -0.06603622436523438, -0.0487823486328125, -0.031528472900390625, -0.01427459716796875, 0.002979278564453125, 0.020233154296875, 0.037487030029296875, 0.05474090576171875, 0.07199478149414062, 0.0892486572265625, 0.10650253295898438, 0.12375640869140625, 0.14101028442382812, 0.15826416015625, 0.17551803588867188, 0.19277191162109375, 0.21002578735351562, 0.2272796630859375, 0.24453353881835938, 0.26178741455078125, 0.2790412902832031, 0.296295166015625, 0.3135490417480469, 0.33080291748046875, 0.3480567932128906, 0.3653106689453125, 0.3825645446777344, 0.39981842041015625, 0.4170722961425781, 0.434326171875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 3.0, 5.0, 7.0, 11.0, 15.0, 12.0, 25.0, 31.0, 42.0, 52.0, 71.0, 86.0, 139.0, 224.0, 329.0, 606.0, 936.0, 1542.0, 3063.0, 6208.0, 15810.0, 48743.0, 214347.0, 546753.0, 148557.0, 36889.0, 12501.0, 5305.0, 2515.0, 1319.0, 857.0, 477.0, 336.0, 201.0, 154.0, 105.0, 76.0, 54.0, 33.0, 18.0, 21.0, 16.0, 12.0, 13.0, 11.0, 7.0, 5.0, 7.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.8291015625, -1.7708282470703125, -1.712554931640625, -1.6542816162109375, -1.59600830078125, -1.5377349853515625, -1.479461669921875, -1.4211883544921875, -1.3629150390625, -1.3046417236328125, -1.246368408203125, -1.1880950927734375, -1.12982177734375, -1.0715484619140625, -1.013275146484375, -0.9550018310546875, -0.896728515625, -0.8384552001953125, -0.780181884765625, -0.7219085693359375, -0.66363525390625, -0.6053619384765625, -0.547088623046875, -0.4888153076171875, -0.4305419921875, -0.3722686767578125, -0.313995361328125, -0.2557220458984375, -0.19744873046875, -0.1391754150390625, -0.080902099609375, -0.0226287841796875, 0.03564453125, 0.0939178466796875, 0.152191162109375, 0.2104644775390625, 0.26873779296875, 0.3270111083984375, 0.385284423828125, 0.4435577392578125, 0.5018310546875, 0.5601043701171875, 0.618377685546875, 0.6766510009765625, 0.73492431640625, 0.7931976318359375, 0.851470947265625, 0.9097442626953125, 0.968017578125, 1.0262908935546875, 1.084564208984375, 1.1428375244140625, 1.20111083984375, 1.2593841552734375, 1.317657470703125, 1.3759307861328125, 1.4342041015625, 1.4924774169921875, 1.550750732421875, 1.6090240478515625, 1.66729736328125, 1.7255706787109375, 1.783843994140625, 1.8421173095703125, 1.900390625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 7.0, 5.0, 7.0, 7.0, 9.0, 8.0, 16.0, 14.0, 21.0, 24.0, 27.0, 23.0, 33.0, 31.0, 33.0, 45.0, 45.0, 43.0, 44.0, 53.0, 46.0, 60.0, 45.0, 34.0, 39.0, 45.0, 32.0, 31.0, 32.0, 26.0, 17.0, 20.0, 15.0, 14.0, 13.0, 9.0, 5.0, 5.0, 7.0, 3.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.91943359375, -0.8886947631835938, -0.8579559326171875, -0.8272171020507812, -0.796478271484375, -0.7657394409179688, -0.7350006103515625, -0.7042617797851562, -0.67352294921875, -0.6427841186523438, -0.6120452880859375, -0.5813064575195312, -0.550567626953125, -0.5198287963867188, -0.4890899658203125, -0.45835113525390625, -0.4276123046875, -0.39687347412109375, -0.3661346435546875, -0.33539581298828125, -0.304656982421875, -0.27391815185546875, -0.2431793212890625, -0.21244049072265625, -0.18170166015625, -0.15096282958984375, -0.1202239990234375, -0.08948516845703125, -0.058746337890625, -0.02800750732421875, 0.0027313232421875, 0.03347015380859375, 0.064208984375, 0.09494781494140625, 0.1256866455078125, 0.15642547607421875, 0.187164306640625, 0.21790313720703125, 0.2486419677734375, 0.27938079833984375, 0.31011962890625, 0.34085845947265625, 0.3715972900390625, 0.40233612060546875, 0.433074951171875, 0.46381378173828125, 0.4945526123046875, 0.5252914428710938, 0.5560302734375, 0.5867691040039062, 0.6175079345703125, 0.6482467651367188, 0.678985595703125, 0.7097244262695312, 0.7404632568359375, 0.7712020874023438, 0.80194091796875, 0.8326797485351562, 0.8634185791015625, 0.8941574096679688, 0.924896240234375, 0.9556350708007812, 0.9863739013671875, 1.0171127319335938, 1.0478515625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 5.0, 8.0, 7.0, 10.0, 8.0, 24.0, 27.0, 42.0, 74.0, 97.0, 169.0, 286.0, 509.0, 880.0, 1555.0, 2991.0, 6199.0, 15060.0, 48313.0, 315412.0, 550825.0, 70717.0, 19475.0, 7892.0, 3662.0, 1816.0, 1067.0, 545.0, 375.0, 196.0, 100.0, 58.0, 46.0, 42.0, 11.0, 21.0, 5.0, 7.0, 9.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2099609375, -1.17230224609375, -1.1346435546875, -1.09698486328125, -1.059326171875, -1.02166748046875, -0.9840087890625, -0.94635009765625, -0.90869140625, -0.87103271484375, -0.8333740234375, -0.79571533203125, -0.758056640625, -0.72039794921875, -0.6827392578125, -0.64508056640625, -0.607421875, -0.56976318359375, -0.5321044921875, -0.49444580078125, -0.456787109375, -0.41912841796875, -0.3814697265625, -0.34381103515625, -0.30615234375, -0.26849365234375, -0.2308349609375, -0.19317626953125, -0.155517578125, -0.11785888671875, -0.0802001953125, -0.04254150390625, -0.0048828125, 0.03277587890625, 0.0704345703125, 0.10809326171875, 0.145751953125, 0.18341064453125, 0.2210693359375, 0.25872802734375, 0.29638671875, 0.33404541015625, 0.3717041015625, 0.40936279296875, 0.447021484375, 0.48468017578125, 0.5223388671875, 0.55999755859375, 0.59765625, 0.63531494140625, 0.6729736328125, 0.71063232421875, 0.748291015625, 0.78594970703125, 0.8236083984375, 0.86126708984375, 0.89892578125, 0.93658447265625, 0.9742431640625, 1.01190185546875, 1.049560546875, 1.08721923828125, 1.1248779296875, 1.16253662109375, 1.2001953125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 4.0, 2.0, 3.0, 3.0, 5.0, 8.0, 12.0, 22.0, 33.0, 61.0, 89.0, 179.0, 231.0, 131.0, 86.0, 36.0, 33.0, 15.0, 18.0, 5.0, 5.0, 2.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003745555877685547, -0.0003632940351963043, -0.00035203248262405396, -0.0003407709300518036, -0.0003295093774795532, -0.00031824782490730286, -0.0003069862723350525, -0.0002957247197628021, -0.00028446316719055176, -0.0002732016146183014, -0.000261940062046051, -0.00025067850947380066, -0.0002394169569015503, -0.00022815540432929993, -0.00021689385175704956, -0.0002056322991847992, -0.00019437074661254883, -0.00018310919404029846, -0.0001718476414680481, -0.00016058608889579773, -0.00014932453632354736, -0.000138062983751297, -0.00012680143117904663, -0.00011553987860679626, -0.0001042783260345459, -9.301677346229553e-05, -8.175522089004517e-05, -7.04936683177948e-05, -5.9232115745544434e-05, -4.797056317329407e-05, -3.67090106010437e-05, -2.5447458028793335e-05, -1.4185905456542969e-05, -2.9243528842926025e-06, 8.337199687957764e-06, 1.959875226020813e-05, 3.0860304832458496e-05, 4.212185740470886e-05, 5.338340997695923e-05, 6.46449625492096e-05, 7.590651512145996e-05, 8.716806769371033e-05, 9.84296202659607e-05, 0.00010969117283821106, 0.00012095272541046143, 0.0001322142779827118, 0.00014347583055496216, 0.00015473738312721252, 0.0001659989356994629, 0.00017726048827171326, 0.00018852204084396362, 0.000199783593416214, 0.00021104514598846436, 0.00022230669856071472, 0.0002335682511329651, 0.00024482980370521545, 0.0002560913562774658, 0.0002673529088497162, 0.00027861446142196655, 0.0002898760139942169, 0.0003011375665664673, 0.00031239911913871765, 0.000323660671710968, 0.0003349222242832184, 0.00034618377685546875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 7.0, 6.0, 15.0, 17.0, 24.0, 18.0, 30.0, 44.0, 37.0, 65.0, 94.0, 148.0, 217.0, 354.0, 529.0, 897.0, 1419.0, 2759.0, 5124.0, 11047.0, 27588.0, 101388.0, 615886.0, 207744.0, 42559.0, 15382.0, 6800.0, 3406.0, 1855.0, 1089.0, 637.0, 451.0, 282.0, 197.0, 119.0, 102.0, 59.0, 47.0, 24.0, 20.0, 14.0, 16.0, 11.0, 10.0, 7.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-1.00390625, -0.97222900390625, -0.9405517578125, -0.90887451171875, -0.877197265625, -0.84552001953125, -0.8138427734375, -0.78216552734375, -0.75048828125, -0.71881103515625, -0.6871337890625, -0.65545654296875, -0.623779296875, -0.59210205078125, -0.5604248046875, -0.52874755859375, -0.4970703125, -0.46539306640625, -0.4337158203125, -0.40203857421875, -0.370361328125, -0.33868408203125, -0.3070068359375, -0.27532958984375, -0.24365234375, -0.21197509765625, -0.1802978515625, -0.14862060546875, -0.116943359375, -0.08526611328125, -0.0535888671875, -0.02191162109375, 0.009765625, 0.04144287109375, 0.0731201171875, 0.10479736328125, 0.136474609375, 0.16815185546875, 0.1998291015625, 0.23150634765625, 0.26318359375, 0.29486083984375, 0.3265380859375, 0.35821533203125, 0.389892578125, 0.42156982421875, 0.4532470703125, 0.48492431640625, 0.5166015625, 0.54827880859375, 0.5799560546875, 0.61163330078125, 0.643310546875, 0.67498779296875, 0.7066650390625, 0.73834228515625, 0.77001953125, 0.80169677734375, 0.8333740234375, 0.86505126953125, 0.896728515625, 0.92840576171875, 0.9600830078125, 0.99176025390625, 1.0234375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 6.0, 3.0, 10.0, 6.0, 11.0, 12.0, 18.0, 28.0, 38.0, 43.0, 59.0, 84.0, 128.0, 129.0, 99.0, 76.0, 62.0, 37.0, 33.0, 21.0, 18.0, 15.0, 15.0, 10.0, 3.0, 7.0, 10.0, 7.0, 5.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56640625, -0.545562744140625, -0.52471923828125, -0.503875732421875, -0.4830322265625, -0.462188720703125, -0.44134521484375, -0.420501708984375, -0.399658203125, -0.378814697265625, -0.35797119140625, -0.337127685546875, -0.3162841796875, -0.295440673828125, -0.27459716796875, -0.253753662109375, -0.23291015625, -0.212066650390625, -0.19122314453125, -0.170379638671875, -0.1495361328125, -0.128692626953125, -0.10784912109375, -0.087005615234375, -0.066162109375, -0.045318603515625, -0.02447509765625, -0.003631591796875, 0.0172119140625, 0.038055419921875, 0.05889892578125, 0.079742431640625, 0.1005859375, 0.121429443359375, 0.14227294921875, 0.163116455078125, 0.1839599609375, 0.204803466796875, 0.22564697265625, 0.246490478515625, 0.267333984375, 0.288177490234375, 0.30902099609375, 0.329864501953125, 0.3507080078125, 0.371551513671875, 0.39239501953125, 0.413238525390625, 0.43408203125, 0.454925537109375, 0.47576904296875, 0.496612548828125, 0.5174560546875, 0.538299560546875, 0.55914306640625, 0.579986572265625, 0.600830078125, 0.621673583984375, 0.64251708984375, 0.663360595703125, 0.6842041015625, 0.705047607421875, 0.72589111328125, 0.746734619140625, 0.767578125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 8.0, 9.0, 20.0, 25.0, 47.0, 83.0, 138.0, 148.0, 178.0, 132.0, 90.0, 53.0, 27.0, 16.0, 9.0, 8.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-15.609170913696289, -15.20824146270752, -14.80731201171875, -14.40638256072998, -14.005453109741211, -13.604522705078125, -13.203594207763672, -12.802663803100586, -12.401734352111816, -12.000804901123047, -11.599875450134277, -11.198945999145508, -10.798016548156738, -10.397087097167969, -9.996156692504883, -9.595227241516113, -9.194297790527344, -8.793368339538574, -8.392438888549805, -7.991509437561035, -7.590579509735107, -7.189650058746338, -6.788720607757568, -6.387790679931641, -5.9868621826171875, -5.585932731628418, -5.185003280639648, -4.784073829650879, -4.383143901824951, -3.9822144508361816, -3.581284999847412, -3.1803553104400635, -2.779425621032715, -2.3784961700439453, -1.9775664806365967, -1.5766370296478271, -1.175707459449768, -0.774777889251709, -0.37384843826293945, 0.02708125114440918, 0.4280107021331787, 0.8289402723312378, 1.2298698425292969, 1.6307992935180664, 2.031728744506836, 2.4326584339141846, 2.833587884902954, 3.2345175743103027, 3.6354470252990723, 4.036376476287842, 4.437305927276611, 4.838235855102539, 5.239165306091309, 5.640094757080078, 6.041024208068848, 6.441953659057617, 6.842883110046387, 7.243812561035156, 7.644742012023926, 8.045671463012695, 8.446600914001465, 8.847530364990234, 9.24846076965332, 9.64939022064209, 10.05031967163086]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 4.0, 7.0, 11.0, 6.0, 7.0, 12.0, 10.0, 10.0, 12.0, 14.0, 19.0, 23.0, 24.0, 34.0, 36.0, 25.0, 25.0, 37.0, 38.0, 41.0, 49.0, 41.0, 63.0, 48.0, 34.0, 32.0, 33.0, 35.0, 27.0, 34.0, 24.0, 31.0, 18.0, 23.0, 19.0, 13.0, 12.0, 13.0, 12.0, 8.0, 3.0, 5.0, 8.0, 4.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.402581691741943, -5.239711761474609, -5.076841831207275, -4.913971900939941, -4.751101493835449, -4.588231563568115, -4.425361633300781, -4.262491703033447, -4.099621772766113, -3.9367518424987793, -3.7738819122314453, -3.6110117435455322, -3.4481418132781982, -3.2852718830108643, -3.122401714324951, -2.959531784057617, -2.796661853790283, -2.633791923522949, -2.4709219932556152, -2.308051824569702, -2.145181894302368, -1.9823119640350342, -1.8194419145584106, -1.656571865081787, -1.4937019348144531, -1.3308320045471191, -1.1679619550704956, -1.005091905593872, -0.8422219753265381, -0.6793519854545593, -0.5164819955825806, -0.35361194610595703, -0.19074153900146484, -0.027871549129486084, 0.13499844074249268, 0.29786843061447144, 0.4607384204864502, 0.623608410358429, 0.7864784002304077, 0.9493484497070312, 1.1122183799743652, 1.2750883102416992, 1.4379583597183228, 1.6008284091949463, 1.7636983394622803, 1.9265682697296143, 2.0894384384155273, 2.2523083686828613, 2.4151782989501953, 2.5780482292175293, 2.7409181594848633, 2.9037883281707764, 3.0666582584381104, 3.2295281887054443, 3.3923983573913574, 3.5552682876586914, 3.7181382179260254, 3.8810081481933594, 4.043878078460693, 4.206748008728027, 4.3696184158325195, 4.5324883460998535, 4.6953582763671875, 4.8582282066345215, 5.0210981369018555]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 3.0, 3.0, 4.0, 5.0, 10.0, 9.0, 10.0, 16.0, 20.0, 21.0, 22.0, 35.0, 40.0, 56.0, 66.0, 121.0, 179.0, 282.0, 576.0, 1322.0, 3963.0, 16061.0, 186964.0, 3938151.0, 34802.0, 7438.0, 2260.0, 889.0, 451.0, 205.0, 119.0, 72.0, 50.0, 19.0, 17.0, 10.0, 5.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8828125, -8.667236328125, -8.45166015625, -8.236083984375, -8.0205078125, -7.804931640625, -7.58935546875, -7.373779296875, -7.158203125, -6.942626953125, -6.72705078125, -6.511474609375, -6.2958984375, -6.080322265625, -5.86474609375, -5.649169921875, -5.43359375, -5.218017578125, -5.00244140625, -4.786865234375, -4.5712890625, -4.355712890625, -4.14013671875, -3.924560546875, -3.708984375, -3.493408203125, -3.27783203125, -3.062255859375, -2.8466796875, -2.631103515625, -2.41552734375, -2.199951171875, -1.984375, -1.768798828125, -1.55322265625, -1.337646484375, -1.1220703125, -0.906494140625, -0.69091796875, -0.475341796875, -0.259765625, -0.044189453125, 0.17138671875, 0.386962890625, 0.6025390625, 0.818115234375, 1.03369140625, 1.249267578125, 1.46484375, 1.680419921875, 1.89599609375, 2.111572265625, 2.3271484375, 2.542724609375, 2.75830078125, 2.973876953125, 3.189453125, 3.405029296875, 3.62060546875, 3.836181640625, 4.0517578125, 4.267333984375, 4.48291015625, 4.698486328125, 4.9140625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 6.0, 2.0, 10.0, 27.0, 29.0, 60.0, 80.0, 96.0, 101.0, 120.0, 104.0, 91.0, 87.0, 65.0, 39.0, 31.0, 19.0, 16.0, 9.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65576171875, -0.6397018432617188, -0.6236419677734375, -0.6075820922851562, -0.591522216796875, -0.5754623413085938, -0.5594024658203125, -0.5433425903320312, -0.52728271484375, -0.5112228393554688, -0.4951629638671875, -0.47910308837890625, -0.463043212890625, -0.44698333740234375, -0.4309234619140625, -0.41486358642578125, -0.3988037109375, -0.38274383544921875, -0.3666839599609375, -0.35062408447265625, -0.334564208984375, -0.31850433349609375, -0.3024444580078125, -0.28638458251953125, -0.27032470703125, -0.25426483154296875, -0.2382049560546875, -0.22214508056640625, -0.206085205078125, -0.19002532958984375, -0.1739654541015625, -0.15790557861328125, -0.141845703125, -0.12578582763671875, -0.1097259521484375, -0.09366607666015625, -0.077606201171875, -0.06154632568359375, -0.0454864501953125, -0.02942657470703125, -0.01336669921875, 0.00269317626953125, 0.0187530517578125, 0.03481292724609375, 0.050872802734375, 0.06693267822265625, 0.0829925537109375, 0.09905242919921875, 0.1151123046875, 0.13117218017578125, 0.1472320556640625, 0.16329193115234375, 0.179351806640625, 0.19541168212890625, 0.2114715576171875, 0.22753143310546875, 0.24359130859375, 0.25965118408203125, 0.2757110595703125, 0.29177093505859375, 0.307830810546875, 0.32389068603515625, 0.3399505615234375, 0.35601043701171875, 0.3720703125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 9.0, 11.0, 11.0, 18.0, 16.0, 30.0, 45.0, 56.0, 79.0, 122.0, 298.0, 1090.0, 10176.0, 4111846.0, 67019.0, 2654.0, 440.0, 138.0, 68.0, 62.0, 32.0, 15.0, 17.0, 9.0, 11.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.8359375, -14.3961181640625, -13.956298828125, -13.5164794921875, -13.07666015625, -12.6368408203125, -12.197021484375, -11.7572021484375, -11.3173828125, -10.8775634765625, -10.437744140625, -9.9979248046875, -9.55810546875, -9.1182861328125, -8.678466796875, -8.2386474609375, -7.798828125, -7.3590087890625, -6.919189453125, -6.4793701171875, -6.03955078125, -5.5997314453125, -5.159912109375, -4.7200927734375, -4.2802734375, -3.8404541015625, -3.400634765625, -2.9608154296875, -2.52099609375, -2.0811767578125, -1.641357421875, -1.2015380859375, -0.76171875, -0.3218994140625, 0.117919921875, 0.5577392578125, 0.99755859375, 1.4373779296875, 1.877197265625, 2.3170166015625, 2.7568359375, 3.1966552734375, 3.636474609375, 4.0762939453125, 4.51611328125, 4.9559326171875, 5.395751953125, 5.8355712890625, 6.275390625, 6.7152099609375, 7.155029296875, 7.5948486328125, 8.03466796875, 8.4744873046875, 8.914306640625, 9.3541259765625, 9.7939453125, 10.2337646484375, 10.673583984375, 11.1134033203125, 11.55322265625, 11.9930419921875, 12.432861328125, 12.8726806640625, 13.3125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 6.0, 3.0, 2.0, 7.0, 22.0, 42.0, 112.0, 1352.0, 2305.0, 133.0, 50.0, 24.0, 14.0, 10.0, 3.0, 4.0, 1.0, 0.0, 1.0], "bins": [-3.515625, -3.4493331909179688, -3.3830413818359375, -3.3167495727539062, -3.250457763671875, -3.1841659545898438, -3.1178741455078125, -3.0515823364257812, -2.98529052734375, -2.9189987182617188, -2.8527069091796875, -2.7864151000976562, -2.720123291015625, -2.6538314819335938, -2.5875396728515625, -2.5212478637695312, -2.4549560546875, -2.3886642456054688, -2.3223724365234375, -2.2560806274414062, -2.189788818359375, -2.1234970092773438, -2.0572052001953125, -1.9909133911132812, -1.92462158203125, -1.8583297729492188, -1.7920379638671875, -1.7257461547851562, -1.659454345703125, -1.5931625366210938, -1.5268707275390625, -1.4605789184570312, -1.394287109375, -1.3279953002929688, -1.2617034912109375, -1.1954116821289062, -1.129119873046875, -1.0628280639648438, -0.9965362548828125, -0.9302444458007812, -0.86395263671875, -0.7976608276367188, -0.7313690185546875, -0.6650772094726562, -0.598785400390625, -0.5324935913085938, -0.4662017822265625, -0.39990997314453125, -0.3336181640625, -0.26732635498046875, -0.2010345458984375, -0.13474273681640625, -0.068450927734375, -0.00215911865234375, 0.0641326904296875, 0.13042449951171875, 0.19671630859375, 0.26300811767578125, 0.3292999267578125, 0.39559173583984375, 0.461883544921875, 0.5281753540039062, 0.5944671630859375, 0.6607589721679688, 0.72705078125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 8.0, 19.0, 55.0, 254.0, 466.0, 144.0, 35.0, 6.0, 7.0, 5.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-26.899240493774414, -26.384647369384766, -25.870054244995117, -25.3554630279541, -24.840869903564453, -24.326276779174805, -23.811683654785156, -23.29709243774414, -22.782499313354492, -22.267906188964844, -21.753313064575195, -21.23872184753418, -20.72412872314453, -20.209535598754883, -19.694942474365234, -19.18035125732422, -18.665756225585938, -18.15116310119629, -17.63656997680664, -17.121978759765625, -16.607385635375977, -16.092792510986328, -15.57819938659668, -15.063607215881348, -14.549015045166016, -14.034421920776367, -13.519829750061035, -13.005236625671387, -12.490644454956055, -11.976051330566406, -11.461458206176758, -10.946866035461426, -10.432273864746094, -9.917680740356445, -9.403088569641113, -8.888495445251465, -8.373903274536133, -7.859310150146484, -7.344717502593994, -6.830124855041504, -6.315532207489014, -5.800939559936523, -5.286346912384033, -4.771754264831543, -4.2571611404418945, -3.7425687313079834, -3.227975845336914, -2.713383197784424, -2.1987905502319336, -1.6841979026794434, -1.1696051359176636, -0.6550123691558838, -0.14041972160339355, 0.3741729259490967, 0.888765811920166, 1.4033584594726562, 1.9179511070251465, 2.4325437545776367, 2.947136402130127, 3.4617292881011963, 3.9763219356536865, 4.490914344787598, 5.005507469177246, 5.520100116729736, 6.034692764282227]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 8.0, 15.0, 9.0, 13.0, 19.0, 34.0, 31.0, 34.0, 53.0, 53.0, 63.0, 86.0, 75.0, 71.0, 65.0, 54.0, 69.0, 52.0, 41.0, 36.0, 36.0, 20.0, 14.0, 15.0, 12.0, 7.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.8861656188964844, -3.759521484375, -3.6328773498535156, -3.506232976913452, -3.3795888423919678, -3.2529447078704834, -3.12630033493042, -2.9996562004089355, -2.873012065887451, -2.746367931365967, -2.6197237968444824, -2.493079423904419, -2.3664352893829346, -2.23979115486145, -2.1131467819213867, -1.9865026473999023, -1.859858512878418, -1.7332143783569336, -1.6065701246261597, -1.4799258708953857, -1.3532817363739014, -1.226637601852417, -1.099993348121643, -0.9733491539955139, -0.8467049598693848, -0.7200607657432556, -0.5934165716171265, -0.4667723774909973, -0.34012818336486816, -0.213483989238739, -0.08683979511260986, 0.03980439901351929, 0.16644906997680664, 0.2930932641029358, 0.41973745822906494, 0.5463816523551941, 0.6730258464813232, 0.7996700406074524, 0.9263142347335815, 1.0529584884643555, 1.1796026229858398, 1.3062467575073242, 1.4328910112380981, 1.559535264968872, 1.6861793994903564, 1.8128235340118408, 1.9394677877426147, 2.0661120414733887, 2.192756175994873, 2.3194003105163574, 2.446044445037842, 2.5726888179779053, 2.6993329524993896, 2.825977087020874, 2.9526214599609375, 3.079265594482422, 3.2059097290039062, 3.3325538635253906, 3.459197998046875, 3.5858423709869385, 3.712486505508423, 3.8391306400299072, 3.9657750129699707, 4.092419147491455, 4.2190632820129395]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 6.0, 0.0, 3.0, 10.0, 4.0, 9.0, 19.0, 24.0, 62.0, 116.0, 258.0, 587.0, 1871.0, 12264.0, 667875.0, 353899.0, 8927.0, 1653.0, 528.0, 212.0, 111.0, 52.0, 30.0, 17.0, 11.0, 4.0, 7.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.953125, -8.6436767578125, -8.334228515625, -8.0247802734375, -7.71533203125, -7.4058837890625, -7.096435546875, -6.7869873046875, -6.4775390625, -6.1680908203125, -5.858642578125, -5.5491943359375, -5.23974609375, -4.9302978515625, -4.620849609375, -4.3114013671875, -4.001953125, -3.6925048828125, -3.383056640625, -3.0736083984375, -2.76416015625, -2.4547119140625, -2.145263671875, -1.8358154296875, -1.5263671875, -1.2169189453125, -0.907470703125, -0.5980224609375, -0.28857421875, 0.0208740234375, 0.330322265625, 0.6397705078125, 0.94921875, 1.2586669921875, 1.568115234375, 1.8775634765625, 2.18701171875, 2.4964599609375, 2.805908203125, 3.1153564453125, 3.4248046875, 3.7342529296875, 4.043701171875, 4.3531494140625, 4.66259765625, 4.9720458984375, 5.281494140625, 5.5909423828125, 5.900390625, 6.2098388671875, 6.519287109375, 6.8287353515625, 7.13818359375, 7.4476318359375, 7.757080078125, 8.0665283203125, 8.3759765625, 8.6854248046875, 8.994873046875, 9.3043212890625, 9.61376953125, 9.9232177734375, 10.232666015625, 10.5421142578125, 10.8515625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 4.0, 15.0, 11.0, 26.0, 41.0, 54.0, 59.0, 79.0, 98.0, 106.0, 76.0, 86.0, 87.0, 77.0, 48.0, 39.0, 34.0, 22.0, 13.0, 6.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.69873046875, -0.6817626953125, -0.664794921875, -0.6478271484375, -0.630859375, -0.6138916015625, -0.596923828125, -0.5799560546875, -0.56298828125, -0.5460205078125, -0.529052734375, -0.5120849609375, -0.4951171875, -0.4781494140625, -0.461181640625, -0.4442138671875, -0.42724609375, -0.4102783203125, -0.393310546875, -0.3763427734375, -0.359375, -0.3424072265625, -0.325439453125, -0.3084716796875, -0.29150390625, -0.2745361328125, -0.257568359375, -0.2406005859375, -0.2236328125, -0.2066650390625, -0.189697265625, -0.1727294921875, -0.15576171875, -0.1387939453125, -0.121826171875, -0.1048583984375, -0.087890625, -0.0709228515625, -0.053955078125, -0.0369873046875, -0.02001953125, -0.0030517578125, 0.013916015625, 0.0308837890625, 0.0478515625, 0.0648193359375, 0.081787109375, 0.0987548828125, 0.11572265625, 0.1326904296875, 0.149658203125, 0.1666259765625, 0.18359375, 0.2005615234375, 0.217529296875, 0.2344970703125, 0.25146484375, 0.2684326171875, 0.285400390625, 0.3023681640625, 0.3193359375, 0.3363037109375, 0.353271484375, 0.3702392578125, 0.38720703125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 6.0, 9.0, 4.0, 8.0, 15.0, 11.0, 8.0, 24.0, 23.0, 41.0, 52.0, 92.0, 136.0, 254.0, 444.0, 810.0, 1520.0, 3266.0, 9410.0, 37143.0, 258293.0, 621390.0, 87902.0, 17537.0, 5412.0, 2346.0, 994.0, 543.0, 295.0, 182.0, 121.0, 83.0, 55.0, 35.0, 23.0, 23.0, 15.0, 12.0, 6.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.189453125, -3.084014892578125, -2.97857666015625, -2.873138427734375, -2.7677001953125, -2.662261962890625, -2.55682373046875, -2.451385498046875, -2.345947265625, -2.240509033203125, -2.13507080078125, -2.029632568359375, -1.9241943359375, -1.818756103515625, -1.71331787109375, -1.607879638671875, -1.50244140625, -1.397003173828125, -1.29156494140625, -1.186126708984375, -1.0806884765625, -0.975250244140625, -0.86981201171875, -0.764373779296875, -0.658935546875, -0.553497314453125, -0.44805908203125, -0.342620849609375, -0.2371826171875, -0.131744384765625, -0.02630615234375, 0.079132080078125, 0.1845703125, 0.290008544921875, 0.39544677734375, 0.500885009765625, 0.6063232421875, 0.711761474609375, 0.81719970703125, 0.922637939453125, 1.028076171875, 1.133514404296875, 1.23895263671875, 1.344390869140625, 1.4498291015625, 1.555267333984375, 1.66070556640625, 1.766143798828125, 1.87158203125, 1.977020263671875, 2.08245849609375, 2.187896728515625, 2.2933349609375, 2.398773193359375, 2.50421142578125, 2.609649658203125, 2.715087890625, 2.820526123046875, 2.92596435546875, 3.031402587890625, 3.1368408203125, 3.242279052734375, 3.34771728515625, 3.453155517578125, 3.55859375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 3.0, 6.0, 3.0, 11.0, 11.0, 22.0, 21.0, 35.0, 28.0, 44.0, 57.0, 61.0, 43.0, 64.0, 82.0, 70.0, 77.0, 65.0, 61.0, 48.0, 41.0, 31.0, 27.0, 22.0, 18.0, 20.0, 8.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-2.44140625, -2.3791046142578125, -2.316802978515625, -2.2545013427734375, -2.19219970703125, -2.1298980712890625, -2.067596435546875, -2.0052947998046875, -1.9429931640625, -1.8806915283203125, -1.818389892578125, -1.7560882568359375, -1.69378662109375, -1.6314849853515625, -1.569183349609375, -1.5068817138671875, -1.444580078125, -1.3822784423828125, -1.319976806640625, -1.2576751708984375, -1.19537353515625, -1.1330718994140625, -1.070770263671875, -1.0084686279296875, -0.9461669921875, -0.8838653564453125, -0.821563720703125, -0.7592620849609375, -0.69696044921875, -0.6346588134765625, -0.572357177734375, -0.5100555419921875, -0.44775390625, -0.3854522705078125, -0.323150634765625, -0.2608489990234375, -0.19854736328125, -0.1362457275390625, -0.073944091796875, -0.0116424560546875, 0.0506591796875, 0.1129608154296875, 0.175262451171875, 0.2375640869140625, 0.29986572265625, 0.3621673583984375, 0.424468994140625, 0.4867706298828125, 0.549072265625, 0.6113739013671875, 0.673675537109375, 0.7359771728515625, 0.79827880859375, 0.8605804443359375, 0.922882080078125, 0.9851837158203125, 1.0474853515625, 1.1097869873046875, 1.172088623046875, 1.2343902587890625, 1.29669189453125, 1.3589935302734375, 1.421295166015625, 1.4835968017578125, 1.5458984375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 3.0, 4.0, 6.0, 4.0, 9.0, 17.0, 19.0, 29.0, 35.0, 57.0, 71.0, 101.0, 183.0, 300.0, 465.0, 745.0, 1437.0, 2671.0, 6208.0, 19175.0, 126395.0, 800061.0, 66395.0, 13974.0, 4884.0, 2249.0, 1198.0, 696.0, 384.0, 241.0, 183.0, 113.0, 70.0, 59.0, 34.0, 24.0, 14.0, 16.0, 10.0, 8.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.375, -2.3038330078125, -2.232666015625, -2.1614990234375, -2.09033203125, -2.0191650390625, -1.947998046875, -1.8768310546875, -1.8056640625, -1.7344970703125, -1.663330078125, -1.5921630859375, -1.52099609375, -1.4498291015625, -1.378662109375, -1.3074951171875, -1.236328125, -1.1651611328125, -1.093994140625, -1.0228271484375, -0.95166015625, -0.8804931640625, -0.809326171875, -0.7381591796875, -0.6669921875, -0.5958251953125, -0.524658203125, -0.4534912109375, -0.38232421875, -0.3111572265625, -0.239990234375, -0.1688232421875, -0.09765625, -0.0264892578125, 0.044677734375, 0.1158447265625, 0.18701171875, 0.2581787109375, 0.329345703125, 0.4005126953125, 0.4716796875, 0.5428466796875, 0.614013671875, 0.6851806640625, 0.75634765625, 0.8275146484375, 0.898681640625, 0.9698486328125, 1.041015625, 1.1121826171875, 1.183349609375, 1.2545166015625, 1.32568359375, 1.3968505859375, 1.468017578125, 1.5391845703125, 1.6103515625, 1.6815185546875, 1.752685546875, 1.8238525390625, 1.89501953125, 1.9661865234375, 2.037353515625, 2.1085205078125, 2.1796875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 2.0, 2.0, 8.0, 5.0, 11.0, 16.0, 16.0, 35.0, 59.0, 123.0, 255.0, 221.0, 109.0, 45.0, 28.0, 18.0, 9.0, 11.0, 8.0, 7.0, 6.0, 0.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00044918060302734375, -0.00043366849422454834, -0.00041815638542175293, -0.0004026442766189575, -0.0003871321678161621, -0.0003716200590133667, -0.0003561079502105713, -0.0003405958414077759, -0.00032508373260498047, -0.00030957162380218506, -0.00029405951499938965, -0.00027854740619659424, -0.00026303529739379883, -0.0002475231885910034, -0.000232011079788208, -0.0002164989709854126, -0.0002009868621826172, -0.00018547475337982178, -0.00016996264457702637, -0.00015445053577423096, -0.00013893842697143555, -0.00012342631816864014, -0.00010791420936584473, -9.240210056304932e-05, -7.68899917602539e-05, -6.13778829574585e-05, -4.5865774154663086e-05, -3.0353665351867676e-05, -1.4841556549072266e-05, 6.705522537231445e-07, 1.6182661056518555e-05, 3.1694769859313965e-05, 4.7206878662109375e-05, 6.271898746490479e-05, 7.82310962677002e-05, 9.37432050704956e-05, 0.00010925531387329102, 0.00012476742267608643, 0.00014027953147888184, 0.00015579164028167725, 0.00017130374908447266, 0.00018681585788726807, 0.00020232796669006348, 0.0002178400754928589, 0.0002333521842956543, 0.0002488642930984497, 0.0002643764019012451, 0.00027988851070404053, 0.00029540061950683594, 0.00031091272830963135, 0.00032642483711242676, 0.00034193694591522217, 0.0003574490547180176, 0.000372961163520813, 0.0003884732723236084, 0.0004039853811264038, 0.0004194974899291992, 0.00043500959873199463, 0.00045052170753479004, 0.00046603381633758545, 0.00048154592514038086, 0.0004970580339431763, 0.0005125701427459717, 0.0005280822515487671, 0.0005435943603515625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 0.0, 0.0, 4.0, 1.0, 8.0, 11.0, 18.0, 22.0, 41.0, 44.0, 64.0, 88.0, 156.0, 251.0, 417.0, 881.0, 1967.0, 5147.0, 18020.0, 170499.0, 792113.0, 43599.0, 9419.0, 3022.0, 1225.0, 623.0, 356.0, 194.0, 104.0, 92.0, 46.0, 39.0, 19.0, 16.0, 19.0, 6.0, 10.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-2.36328125, -2.28765869140625, -2.2120361328125, -2.13641357421875, -2.060791015625, -1.98516845703125, -1.9095458984375, -1.83392333984375, -1.75830078125, -1.68267822265625, -1.6070556640625, -1.53143310546875, -1.455810546875, -1.38018798828125, -1.3045654296875, -1.22894287109375, -1.1533203125, -1.07769775390625, -1.0020751953125, -0.92645263671875, -0.850830078125, -0.77520751953125, -0.6995849609375, -0.62396240234375, -0.54833984375, -0.47271728515625, -0.3970947265625, -0.32147216796875, -0.245849609375, -0.17022705078125, -0.0946044921875, -0.01898193359375, 0.056640625, 0.13226318359375, 0.2078857421875, 0.28350830078125, 0.359130859375, 0.43475341796875, 0.5103759765625, 0.58599853515625, 0.66162109375, 0.73724365234375, 0.8128662109375, 0.88848876953125, 0.964111328125, 1.03973388671875, 1.1153564453125, 1.19097900390625, 1.2666015625, 1.34222412109375, 1.4178466796875, 1.49346923828125, 1.569091796875, 1.64471435546875, 1.7203369140625, 1.79595947265625, 1.87158203125, 1.94720458984375, 2.0228271484375, 2.09844970703125, 2.174072265625, 2.24969482421875, 2.3253173828125, 2.40093994140625, 2.4765625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 7.0, 2.0, 4.0, 8.0, 6.0, 3.0, 9.0, 20.0, 21.0, 45.0, 83.0, 150.0, 205.0, 164.0, 122.0, 54.0, 31.0, 15.0, 13.0, 12.0, 7.0, 6.0, 4.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96044921875, -0.9158096313476562, -0.8711700439453125, -0.8265304565429688, -0.781890869140625, -0.7372512817382812, -0.6926116943359375, -0.6479721069335938, -0.60333251953125, -0.5586929321289062, -0.5140533447265625, -0.46941375732421875, -0.424774169921875, -0.38013458251953125, -0.3354949951171875, -0.29085540771484375, -0.2462158203125, -0.20157623291015625, -0.1569366455078125, -0.11229705810546875, -0.067657470703125, -0.02301788330078125, 0.0216217041015625, 0.06626129150390625, 0.11090087890625, 0.15554046630859375, 0.2001800537109375, 0.24481964111328125, 0.289459228515625, 0.33409881591796875, 0.3787384033203125, 0.42337799072265625, 0.468017578125, 0.5126571655273438, 0.5572967529296875, 0.6019363403320312, 0.646575927734375, 0.6912155151367188, 0.7358551025390625, 0.7804946899414062, 0.82513427734375, 0.8697738647460938, 0.9144134521484375, 0.9590530395507812, 1.003692626953125, 1.0483322143554688, 1.0929718017578125, 1.1376113891601562, 1.1822509765625, 1.2268905639648438, 1.2715301513671875, 1.3161697387695312, 1.360809326171875, 1.4054489135742188, 1.4500885009765625, 1.4947280883789062, 1.53936767578125, 1.5840072631835938, 1.6286468505859375, 1.6732864379882812, 1.717926025390625, 1.7625656127929688, 1.8072052001953125, 1.8518447875976562, 1.896484375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 8.0, 19.0, 38.0, 64.0, 144.0, 250.0, 231.0, 138.0, 47.0, 30.0, 20.0, 5.0, 9.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-44.38673400878906, -43.478458404541016, -42.57018280029297, -41.66191101074219, -40.75363540649414, -39.845359802246094, -38.93708419799805, -38.02880859375, -37.12053298950195, -36.212257385253906, -35.30398178100586, -34.39570617675781, -33.48743438720703, -32.579158782958984, -31.670883178710938, -30.76260757446289, -29.854333877563477, -28.94605827331543, -28.037784576416016, -27.12950897216797, -26.221233367919922, -25.312957763671875, -24.40468406677246, -23.496408462524414, -22.588134765625, -21.679859161376953, -20.77158546447754, -19.863309860229492, -18.955034255981445, -18.04676055908203, -17.138484954833984, -16.230209350585938, -15.321932792663574, -14.413658142089844, -13.505382537841797, -12.597107887268066, -11.688833236694336, -10.780557632446289, -9.872282981872559, -8.964008331298828, -8.055732727050781, -7.147457599639893, -6.239182472229004, -5.330907821655273, -4.422632694244385, -3.514357566833496, -2.6060829162597656, -1.697807788848877, -0.7895326614379883, 0.11874234676361084, 1.02701735496521, 1.9352922439575195, 2.843567371368408, 3.751842498779297, 4.660117149353027, 5.568392276763916, 6.476667404174805, 7.384942531585693, 8.293217658996582, 9.201492309570312, 10.10976791381836, 11.01804256439209, 11.92631721496582, 12.834592819213867, 13.742867469787598]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 7.0, 8.0, 12.0, 12.0, 14.0, 11.0, 15.0, 14.0, 23.0, 18.0, 26.0, 32.0, 42.0, 49.0, 42.0, 35.0, 55.0, 44.0, 46.0, 47.0, 54.0, 41.0, 48.0, 32.0, 33.0, 36.0, 38.0, 37.0, 15.0, 26.0, 20.0, 16.0, 13.0, 16.0, 7.0, 4.0, 6.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.869426727294922, -8.569880485534668, -8.270334243774414, -7.97078800201416, -7.671241760253906, -7.371695518493652, -7.072149276733398, -6.7726030349731445, -6.473056793212891, -6.173510551452637, -5.873964309692383, -5.574418067932129, -5.274871826171875, -4.975325584411621, -4.675779342651367, -4.376233100891113, -4.076687335968018, -3.7771410942077637, -3.4775948524475098, -3.178048610687256, -2.878502368927002, -2.578956127166748, -2.2794101238250732, -1.9798638820648193, -1.6803176403045654, -1.3807713985443115, -1.0812251567840576, -0.7816790342330933, -0.48213279247283936, -0.18258655071258545, 0.1169595718383789, 0.4165058135986328, 0.7160520553588867, 1.0155982971191406, 1.3151445388793945, 1.6146906614303589, 1.9142369031906128, 2.2137832641601562, 2.513329267501831, 2.812875509262085, 3.112421751022339, 3.4119679927825928, 3.7115142345428467, 4.0110602378845215, 4.310606479644775, 4.610152721405029, 4.909698963165283, 5.209245204925537, 5.508791446685791, 5.808337688446045, 6.107883930206299, 6.407430171966553, 6.706976413726807, 7.0065226554870605, 7.306068420410156, 7.60561466217041, 7.905160903930664, 8.204707145690918, 8.504253387451172, 8.803799629211426, 9.10334587097168, 9.402892112731934, 9.702438354492188, 10.001984596252441, 10.301530838012695]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 5.0, 4.0, 3.0, 6.0, 9.0, 11.0, 10.0, 18.0, 16.0, 23.0, 22.0, 33.0, 39.0, 45.0, 63.0, 81.0, 115.0, 133.0, 206.0, 260.0, 493.0, 1017.0, 2409.0, 7017.0, 24340.0, 156591.0, 3862252.0, 107200.0, 21274.0, 6185.0, 2174.0, 1011.0, 533.0, 298.0, 165.0, 104.0, 46.0, 32.0, 18.0, 13.0, 5.0, 2.0, 3.0, 1.0, 5.0], "bins": [-7.75, -7.579376220703125, -7.40875244140625, -7.238128662109375, -7.0675048828125, -6.896881103515625, -6.72625732421875, -6.555633544921875, -6.385009765625, -6.214385986328125, -6.04376220703125, -5.873138427734375, -5.7025146484375, -5.531890869140625, -5.36126708984375, -5.190643310546875, -5.02001953125, -4.849395751953125, -4.67877197265625, -4.508148193359375, -4.3375244140625, -4.166900634765625, -3.99627685546875, -3.825653076171875, -3.655029296875, -3.484405517578125, -3.31378173828125, -3.143157958984375, -2.9725341796875, -2.801910400390625, -2.63128662109375, -2.460662841796875, -2.2900390625, -2.119415283203125, -1.94879150390625, -1.778167724609375, -1.6075439453125, -1.436920166015625, -1.26629638671875, -1.095672607421875, -0.925048828125, -0.754425048828125, -0.58380126953125, -0.413177490234375, -0.2425537109375, -0.071929931640625, 0.09869384765625, 0.269317626953125, 0.43994140625, 0.610565185546875, 0.78118896484375, 0.951812744140625, 1.1224365234375, 1.293060302734375, 1.46368408203125, 1.634307861328125, 1.804931640625, 1.975555419921875, 2.14617919921875, 2.316802978515625, 2.4874267578125, 2.658050537109375, 2.82867431640625, 2.999298095703125, 3.169921875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 6.0, 4.0, 8.0, 15.0, 14.0, 35.0, 37.0, 54.0, 51.0, 71.0, 88.0, 100.0, 94.0, 85.0, 68.0, 80.0, 58.0, 37.0, 29.0, 16.0, 13.0, 17.0, 14.0, 3.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.69677734375, -0.680267333984375, -0.66375732421875, -0.647247314453125, -0.6307373046875, -0.614227294921875, -0.59771728515625, -0.581207275390625, -0.564697265625, -0.548187255859375, -0.53167724609375, -0.515167236328125, -0.4986572265625, -0.482147216796875, -0.46563720703125, -0.449127197265625, -0.4326171875, -0.416107177734375, -0.39959716796875, -0.383087158203125, -0.3665771484375, -0.350067138671875, -0.33355712890625, -0.317047119140625, -0.300537109375, -0.284027099609375, -0.26751708984375, -0.251007080078125, -0.2344970703125, -0.217987060546875, -0.20147705078125, -0.184967041015625, -0.16845703125, -0.151947021484375, -0.13543701171875, -0.118927001953125, -0.1024169921875, -0.085906982421875, -0.06939697265625, -0.052886962890625, -0.036376953125, -0.019866943359375, -0.00335693359375, 0.013153076171875, 0.0296630859375, 0.046173095703125, 0.06268310546875, 0.079193115234375, 0.095703125, 0.112213134765625, 0.12872314453125, 0.145233154296875, 0.1617431640625, 0.178253173828125, 0.19476318359375, 0.211273193359375, 0.227783203125, 0.244293212890625, 0.26080322265625, 0.277313232421875, 0.2938232421875, 0.310333251953125, 0.32684326171875, 0.343353271484375, 0.35986328125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 11.0, 16.0, 26.0, 43.0, 68.0, 124.0, 196.0, 448.0, 855.0, 1999.0, 5697.0, 28428.0, 3828884.0, 305658.0, 15278.0, 3875.0, 1409.0, 618.0, 306.0, 138.0, 73.0, 42.0, 26.0, 13.0, 19.0, 10.0, 5.0, 3.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.7890625, -8.4735107421875, -8.157958984375, -7.8424072265625, -7.52685546875, -7.2113037109375, -6.895751953125, -6.5802001953125, -6.2646484375, -5.9490966796875, -5.633544921875, -5.3179931640625, -5.00244140625, -4.6868896484375, -4.371337890625, -4.0557861328125, -3.740234375, -3.4246826171875, -3.109130859375, -2.7935791015625, -2.47802734375, -2.1624755859375, -1.846923828125, -1.5313720703125, -1.2158203125, -0.9002685546875, -0.584716796875, -0.2691650390625, 0.04638671875, 0.3619384765625, 0.677490234375, 0.9930419921875, 1.30859375, 1.6241455078125, 1.939697265625, 2.2552490234375, 2.57080078125, 2.8863525390625, 3.201904296875, 3.5174560546875, 3.8330078125, 4.1485595703125, 4.464111328125, 4.7796630859375, 5.09521484375, 5.4107666015625, 5.726318359375, 6.0418701171875, 6.357421875, 6.6729736328125, 6.988525390625, 7.3040771484375, 7.61962890625, 7.9351806640625, 8.250732421875, 8.5662841796875, 8.8818359375, 9.1973876953125, 9.512939453125, 9.8284912109375, 10.14404296875, 10.4595947265625, 10.775146484375, 11.0906982421875, 11.40625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 2.0, 4.0, 3.0, 7.0, 15.0, 14.0, 24.0, 39.0, 43.0, 79.0, 117.0, 344.0, 2361.0, 621.0, 188.0, 76.0, 51.0, 20.0, 20.0, 7.0, 11.0, 5.0, 3.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.267578125, -2.2057342529296875, -2.143890380859375, -2.0820465087890625, -2.02020263671875, -1.9583587646484375, -1.896514892578125, -1.8346710205078125, -1.7728271484375, -1.7109832763671875, -1.649139404296875, -1.5872955322265625, -1.52545166015625, -1.4636077880859375, -1.401763916015625, -1.3399200439453125, -1.278076171875, -1.2162322998046875, -1.154388427734375, -1.0925445556640625, -1.03070068359375, -0.9688568115234375, -0.907012939453125, -0.8451690673828125, -0.7833251953125, -0.7214813232421875, -0.659637451171875, -0.5977935791015625, -0.53594970703125, -0.4741058349609375, -0.412261962890625, -0.3504180908203125, -0.28857421875, -0.2267303466796875, -0.164886474609375, -0.1030426025390625, -0.04119873046875, 0.0206451416015625, 0.082489013671875, 0.1443328857421875, 0.2061767578125, 0.2680206298828125, 0.329864501953125, 0.3917083740234375, 0.45355224609375, 0.5153961181640625, 0.577239990234375, 0.6390838623046875, 0.700927734375, 0.7627716064453125, 0.824615478515625, 0.8864593505859375, 0.94830322265625, 1.0101470947265625, 1.071990966796875, 1.1338348388671875, 1.1956787109375, 1.2575225830078125, 1.319366455078125, 1.3812103271484375, 1.44305419921875, 1.5048980712890625, 1.566741943359375, 1.6285858154296875, 1.6904296875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 10.0, 19.0, 45.0, 184.0, 478.0, 209.0, 37.0, 19.0, 5.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-57.367347717285156, -56.31603240966797, -55.264713287353516, -54.21339797973633, -53.162078857421875, -52.11076354980469, -51.059444427490234, -50.00812911987305, -48.956809997558594, -47.905494689941406, -46.85417556762695, -45.802860260009766, -44.75154113769531, -43.700225830078125, -42.64890670776367, -41.597591400146484, -40.5462760925293, -39.49496078491211, -38.443641662597656, -37.39232635498047, -36.341007232666016, -35.28969192504883, -34.238372802734375, -33.18705749511719, -32.1357421875, -31.08442497253418, -30.03310775756836, -28.98179054260254, -27.93047332763672, -26.87915802001953, -25.82784080505371, -24.77652359008789, -23.725204467773438, -22.673887252807617, -21.622570037841797, -20.571252822875977, -19.519935607910156, -18.46862030029297, -17.41730308532715, -16.365985870361328, -15.314667701721191, -14.263350486755371, -13.212034225463867, -12.160717010498047, -11.109399795532227, -10.058082580566406, -9.006765365600586, -7.955449104309082, -6.904131889343262, -5.852814674377441, -4.801497936248779, -3.750180959701538, -2.698863983154297, -1.6475467681884766, -0.5962300300598145, 0.45508670806884766, 1.506403923034668, 2.557720899581909, 3.6090378761291504, 4.6603546142578125, 5.711671829223633, 6.762989044189453, 7.814305782318115, 8.865622520446777, 9.916939735412598]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 7.0, 9.0, 14.0, 14.0, 20.0, 39.0, 55.0, 58.0, 65.0, 96.0, 96.0, 88.0, 80.0, 84.0, 59.0, 63.0, 52.0, 29.0, 31.0, 8.0, 10.0, 11.0, 4.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.166707992553711, -9.867802619934082, -9.568897247314453, -9.269991874694824, -8.971086502075195, -8.67218017578125, -8.373274803161621, -8.074369430541992, -7.775464057922363, -7.476558685302734, -7.1776533126831055, -6.878747463226318, -6.5798420906066895, -6.2809367179870605, -5.982030868530273, -5.6831254959106445, -5.384220123291016, -5.085314750671387, -4.786409378051758, -4.487503528594971, -4.188598155975342, -3.889692783355713, -3.590787172317505, -3.291881561279297, -2.992976188659668, -2.694070816040039, -2.395165205001831, -2.096259593963623, -1.7973542213439941, -1.4984487295150757, -1.1995432376861572, -0.9006376266479492, -0.6017322540283203, -0.30282676219940186, -0.0039212703704833984, 0.29498422145843506, 0.5938897132873535, 0.892795205116272, 1.1917006969451904, 1.4906063079833984, 1.7895116806030273, 2.0884170532226562, 2.3873226642608643, 2.6862282752990723, 2.985133647918701, 3.28403902053833, 3.582944631576538, 3.881850242614746, 4.180755615234375, 4.479660987854004, 4.778566360473633, 5.07747220993042, 5.376377582550049, 5.675282955169678, 5.974188804626465, 6.273094177246094, 6.571999549865723, 6.870904922485352, 7.1698102951049805, 7.468716144561768, 7.7676215171813965, 8.066527366638184, 8.365432739257812, 8.664338111877441, 8.96324348449707]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 7.0, 5.0, 5.0, 5.0, 3.0, 12.0, 11.0, 19.0, 32.0, 40.0, 45.0, 77.0, 130.0, 218.0, 416.0, 812.0, 2364.0, 9486.0, 87165.0, 790110.0, 140076.0, 12812.0, 2707.0, 946.0, 439.0, 215.0, 127.0, 85.0, 59.0, 30.0, 28.0, 17.0, 13.0, 14.0, 5.0, 7.0, 8.0, 5.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7421875, -3.57647705078125, -3.4107666015625, -3.24505615234375, -3.079345703125, -2.91363525390625, -2.7479248046875, -2.58221435546875, -2.41650390625, -2.25079345703125, -2.0850830078125, -1.91937255859375, -1.753662109375, -1.58795166015625, -1.4222412109375, -1.25653076171875, -1.0908203125, -0.92510986328125, -0.7593994140625, -0.59368896484375, -0.427978515625, -0.26226806640625, -0.0965576171875, 0.06915283203125, 0.23486328125, 0.40057373046875, 0.5662841796875, 0.73199462890625, 0.897705078125, 1.06341552734375, 1.2291259765625, 1.39483642578125, 1.560546875, 1.72625732421875, 1.8919677734375, 2.05767822265625, 2.223388671875, 2.38909912109375, 2.5548095703125, 2.72052001953125, 2.88623046875, 3.05194091796875, 3.2176513671875, 3.38336181640625, 3.549072265625, 3.71478271484375, 3.8804931640625, 4.04620361328125, 4.2119140625, 4.37762451171875, 4.5433349609375, 4.70904541015625, 4.874755859375, 5.04046630859375, 5.2061767578125, 5.37188720703125, 5.53759765625, 5.70330810546875, 5.8690185546875, 6.03472900390625, 6.200439453125, 6.36614990234375, 6.5318603515625, 6.69757080078125, 6.86328125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 13.0, 12.0, 29.0, 37.0, 66.0, 106.0, 99.0, 120.0, 138.0, 97.0, 89.0, 65.0, 48.0, 35.0, 19.0, 12.0, 6.0, 4.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.98974609375, -0.9662857055664062, -0.9428253173828125, -0.9193649291992188, -0.895904541015625, -0.8724441528320312, -0.8489837646484375, -0.8255233764648438, -0.80206298828125, -0.7786026000976562, -0.7551422119140625, -0.7316818237304688, -0.708221435546875, -0.6847610473632812, -0.6613006591796875, -0.6378402709960938, -0.6143798828125, -0.5909194946289062, -0.5674591064453125, -0.5439987182617188, -0.520538330078125, -0.49707794189453125, -0.4736175537109375, -0.45015716552734375, -0.42669677734375, -0.40323638916015625, -0.3797760009765625, -0.35631561279296875, -0.332855224609375, -0.30939483642578125, -0.2859344482421875, -0.26247406005859375, -0.239013671875, -0.21555328369140625, -0.1920928955078125, -0.16863250732421875, -0.145172119140625, -0.12171173095703125, -0.0982513427734375, -0.07479095458984375, -0.05133056640625, -0.02787017822265625, -0.0044097900390625, 0.01905059814453125, 0.042510986328125, 0.06597137451171875, 0.0894317626953125, 0.11289215087890625, 0.1363525390625, 0.15981292724609375, 0.1832733154296875, 0.20673370361328125, 0.230194091796875, 0.25365447998046875, 0.2771148681640625, 0.30057525634765625, 0.32403564453125, 0.34749603271484375, 0.3709564208984375, 0.39441680908203125, 0.417877197265625, 0.44133758544921875, 0.4647979736328125, 0.48825836181640625, 0.51171875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 6.0, 11.0, 12.0, 14.0, 24.0, 33.0, 43.0, 40.0, 103.0, 132.0, 191.0, 275.0, 465.0, 894.0, 1690.0, 3513.0, 8029.0, 20142.0, 57391.0, 188221.0, 421010.0, 233075.0, 71778.0, 23980.0, 9101.0, 4025.0, 1883.0, 954.0, 514.0, 339.0, 215.0, 127.0, 86.0, 60.0, 43.0, 35.0, 25.0, 18.0, 22.0, 12.0, 15.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0], "bins": [-1.7919921875, -1.74432373046875, -1.6966552734375, -1.64898681640625, -1.601318359375, -1.55364990234375, -1.5059814453125, -1.45831298828125, -1.41064453125, -1.36297607421875, -1.3153076171875, -1.26763916015625, -1.219970703125, -1.17230224609375, -1.1246337890625, -1.07696533203125, -1.029296875, -0.98162841796875, -0.9339599609375, -0.88629150390625, -0.838623046875, -0.79095458984375, -0.7432861328125, -0.69561767578125, -0.64794921875, -0.60028076171875, -0.5526123046875, -0.50494384765625, -0.457275390625, -0.40960693359375, -0.3619384765625, -0.31427001953125, -0.2666015625, -0.21893310546875, -0.1712646484375, -0.12359619140625, -0.075927734375, -0.02825927734375, 0.0194091796875, 0.06707763671875, 0.11474609375, 0.16241455078125, 0.2100830078125, 0.25775146484375, 0.305419921875, 0.35308837890625, 0.4007568359375, 0.44842529296875, 0.49609375, 0.54376220703125, 0.5914306640625, 0.63909912109375, 0.686767578125, 0.73443603515625, 0.7821044921875, 0.82977294921875, 0.87744140625, 0.92510986328125, 0.9727783203125, 1.02044677734375, 1.068115234375, 1.11578369140625, 1.1634521484375, 1.21112060546875, 1.2587890625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 8.0, 6.0, 4.0, 7.0, 10.0, 10.0, 16.0, 13.0, 20.0, 20.0, 23.0, 28.0, 27.0, 35.0, 42.0, 40.0, 31.0, 54.0, 32.0, 37.0, 51.0, 38.0, 48.0, 44.0, 43.0, 39.0, 36.0, 30.0, 40.0, 21.0, 20.0, 18.0, 25.0, 17.0, 22.0, 11.0, 8.0, 9.0, 10.0, 4.0, 7.0, 3.0, 0.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.310546875, -1.2704010009765625, -1.230255126953125, -1.1901092529296875, -1.14996337890625, -1.1098175048828125, -1.069671630859375, -1.0295257568359375, -0.9893798828125, -0.9492340087890625, -0.909088134765625, -0.8689422607421875, -0.82879638671875, -0.7886505126953125, -0.748504638671875, -0.7083587646484375, -0.668212890625, -0.6280670166015625, -0.587921142578125, -0.5477752685546875, -0.50762939453125, -0.4674835205078125, -0.427337646484375, -0.3871917724609375, -0.3470458984375, -0.3069000244140625, -0.266754150390625, -0.2266082763671875, -0.18646240234375, -0.1463165283203125, -0.106170654296875, -0.0660247802734375, -0.02587890625, 0.0142669677734375, 0.054412841796875, 0.0945587158203125, 0.13470458984375, 0.1748504638671875, 0.214996337890625, 0.2551422119140625, 0.2952880859375, 0.3354339599609375, 0.375579833984375, 0.4157257080078125, 0.45587158203125, 0.4960174560546875, 0.536163330078125, 0.5763092041015625, 0.616455078125, 0.6566009521484375, 0.696746826171875, 0.7368927001953125, 0.77703857421875, 0.8171844482421875, 0.857330322265625, 0.8974761962890625, 0.9376220703125, 0.9777679443359375, 1.017913818359375, 1.0580596923828125, 1.09820556640625, 1.1383514404296875, 1.178497314453125, 1.2186431884765625, 1.2587890625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 5.0, 10.0, 10.0, 9.0, 13.0, 26.0, 34.0, 44.0, 65.0, 86.0, 108.0, 201.0, 265.0, 379.0, 582.0, 981.0, 1533.0, 2858.0, 5213.0, 10182.0, 22290.0, 59310.0, 204650.0, 448147.0, 191976.0, 56135.0, 21428.0, 9899.0, 4994.0, 2861.0, 1556.0, 931.0, 640.0, 349.0, 244.0, 179.0, 110.0, 73.0, 46.0, 37.0, 26.0, 18.0, 16.0, 13.0, 7.0, 2.0, 6.0, 3.0, 1.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.81787109375, -0.7926864624023438, -0.7675018310546875, -0.7423171997070312, -0.717132568359375, -0.6919479370117188, -0.6667633056640625, -0.6415786743164062, -0.61639404296875, -0.5912094116210938, -0.5660247802734375, -0.5408401489257812, -0.515655517578125, -0.49047088623046875, -0.4652862548828125, -0.44010162353515625, -0.4149169921875, -0.38973236083984375, -0.3645477294921875, -0.33936309814453125, -0.314178466796875, -0.28899383544921875, -0.2638092041015625, -0.23862457275390625, -0.21343994140625, -0.18825531005859375, -0.1630706787109375, -0.13788604736328125, -0.112701416015625, -0.08751678466796875, -0.0623321533203125, -0.03714752197265625, -0.011962890625, 0.01322174072265625, 0.0384063720703125, 0.06359100341796875, 0.088775634765625, 0.11396026611328125, 0.1391448974609375, 0.16432952880859375, 0.18951416015625, 0.21469879150390625, 0.2398834228515625, 0.26506805419921875, 0.290252685546875, 0.31543731689453125, 0.3406219482421875, 0.36580657958984375, 0.3909912109375, 0.41617584228515625, 0.4413604736328125, 0.46654510498046875, 0.491729736328125, 0.5169143676757812, 0.5420989990234375, 0.5672836303710938, 0.59246826171875, 0.6176528930664062, 0.6428375244140625, 0.6680221557617188, 0.693206787109375, 0.7183914184570312, 0.7435760498046875, 0.7687606811523438, 0.7939453125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 10.0, 7.0, 11.0, 21.0, 32.0, 52.0, 75.0, 119.0, 151.0, 145.0, 114.0, 105.0, 46.0, 37.0, 21.0, 25.0, 9.0, 6.0, 3.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0003209114074707031, -0.00030991435050964355, -0.000298917293548584, -0.0002879202365875244, -0.00027692317962646484, -0.0002659261226654053, -0.0002549290657043457, -0.00024393200874328613, -0.00023293495178222656, -0.000221937894821167, -0.00021094083786010742, -0.00019994378089904785, -0.00018894672393798828, -0.0001779496669769287, -0.00016695261001586914, -0.00015595555305480957, -0.00014495849609375, -0.00013396143913269043, -0.00012296438217163086, -0.00011196732521057129, -0.00010097026824951172, -8.997321128845215e-05, -7.897615432739258e-05, -6.797909736633301e-05, -5.698204040527344e-05, -4.598498344421387e-05, -3.49879264831543e-05, -2.3990869522094727e-05, -1.2993812561035156e-05, -1.996755599975586e-06, 9.000301361083984e-06, 1.9997358322143555e-05, 3.0994415283203125e-05, 4.1991472244262695e-05, 5.2988529205322266e-05, 6.398558616638184e-05, 7.49826431274414e-05, 8.597970008850098e-05, 9.697675704956055e-05, 0.00010797381401062012, 0.00011897087097167969, 0.00012996792793273926, 0.00014096498489379883, 0.0001519620418548584, 0.00016295909881591797, 0.00017395615577697754, 0.0001849532127380371, 0.00019595026969909668, 0.00020694732666015625, 0.00021794438362121582, 0.0002289414405822754, 0.00023993849754333496, 0.00025093555450439453, 0.0002619326114654541, 0.00027292966842651367, 0.00028392672538757324, 0.0002949237823486328, 0.0003059208393096924, 0.00031691789627075195, 0.0003279149532318115, 0.0003389120101928711, 0.00034990906715393066, 0.00036090612411499023, 0.0003719031810760498, 0.0003829002380371094]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 6.0, 9.0, 8.0, 14.0, 14.0, 20.0, 35.0, 46.0, 48.0, 78.0, 97.0, 167.0, 281.0, 402.0, 692.0, 1148.0, 2154.0, 4263.0, 9638.0, 25249.0, 86978.0, 382394.0, 397731.0, 91468.0, 25939.0, 9817.0, 4418.0, 2299.0, 1178.0, 697.0, 435.0, 275.0, 182.0, 105.0, 86.0, 43.0, 45.0, 28.0, 17.0, 17.0, 16.0, 5.0, 3.0, 3.0, 1.0, 6.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.9677734375, -0.9375457763671875, -0.907318115234375, -0.8770904541015625, -0.84686279296875, -0.8166351318359375, -0.786407470703125, -0.7561798095703125, -0.7259521484375, -0.6957244873046875, -0.665496826171875, -0.6352691650390625, -0.60504150390625, -0.5748138427734375, -0.544586181640625, -0.5143585205078125, -0.484130859375, -0.4539031982421875, -0.423675537109375, -0.3934478759765625, -0.36322021484375, -0.3329925537109375, -0.302764892578125, -0.2725372314453125, -0.2423095703125, -0.2120819091796875, -0.181854248046875, -0.1516265869140625, -0.12139892578125, -0.0911712646484375, -0.060943603515625, -0.0307159423828125, -0.00048828125, 0.0297393798828125, 0.059967041015625, 0.0901947021484375, 0.12042236328125, 0.1506500244140625, 0.180877685546875, 0.2111053466796875, 0.2413330078125, 0.2715606689453125, 0.301788330078125, 0.3320159912109375, 0.36224365234375, 0.3924713134765625, 0.422698974609375, 0.4529266357421875, 0.483154296875, 0.5133819580078125, 0.543609619140625, 0.5738372802734375, 0.60406494140625, 0.6342926025390625, 0.664520263671875, 0.6947479248046875, 0.7249755859375, 0.7552032470703125, 0.785430908203125, 0.8156585693359375, 0.84588623046875, 0.8761138916015625, 0.906341552734375, 0.9365692138671875, 0.966796875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 3.0, 1.0, 5.0, 6.0, 9.0, 10.0, 9.0, 13.0, 23.0, 27.0, 39.0, 42.0, 82.0, 91.0, 106.0, 101.0, 98.0, 87.0, 65.0, 45.0, 39.0, 23.0, 26.0, 14.0, 13.0, 8.0, 7.0, 6.0, 4.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69580078125, -0.6661300659179688, -0.6364593505859375, -0.6067886352539062, -0.577117919921875, -0.5474472045898438, -0.5177764892578125, -0.48810577392578125, -0.45843505859375, -0.42876434326171875, -0.3990936279296875, -0.36942291259765625, -0.339752197265625, -0.31008148193359375, -0.2804107666015625, -0.25074005126953125, -0.2210693359375, -0.19139862060546875, -0.1617279052734375, -0.13205718994140625, -0.102386474609375, -0.07271575927734375, -0.0430450439453125, -0.01337432861328125, 0.01629638671875, 0.04596710205078125, 0.0756378173828125, 0.10530853271484375, 0.134979248046875, 0.16464996337890625, 0.1943206787109375, 0.22399139404296875, 0.253662109375, 0.28333282470703125, 0.3130035400390625, 0.34267425537109375, 0.372344970703125, 0.40201568603515625, 0.4316864013671875, 0.46135711669921875, 0.49102783203125, 0.5206985473632812, 0.5503692626953125, 0.5800399780273438, 0.609710693359375, 0.6393814086914062, 0.6690521240234375, 0.6987228393554688, 0.7283935546875, 0.7580642700195312, 0.7877349853515625, 0.8174057006835938, 0.847076416015625, 0.8767471313476562, 0.9064178466796875, 0.9360885620117188, 0.96575927734375, 0.9954299926757812, 1.0251007080078125, 1.0547714233398438, 1.084442138671875, 1.1141128540039062, 1.1437835693359375, 1.1734542846679688, 1.203125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 23.0, 46.0, 95.0, 151.0, 199.0, 204.0, 136.0, 61.0, 52.0, 19.0, 7.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-28.24990463256836, -27.64635467529297, -27.042802810668945, -26.439252853393555, -25.835702896118164, -25.23215103149414, -24.62860107421875, -24.02505111694336, -23.42150115966797, -22.817951202392578, -22.214399337768555, -21.610849380493164, -21.007299423217773, -20.40374755859375, -19.80019760131836, -19.19664764404297, -18.593095779418945, -17.989545822143555, -17.38599395751953, -16.78244400024414, -16.17889404296875, -15.575343132019043, -14.971792221069336, -14.368242263793945, -13.764691352844238, -13.161140441894531, -12.55759048461914, -11.954039573669434, -11.350488662719727, -10.746938705444336, -10.143387794494629, -9.539836883544922, -8.936286926269531, -8.332736015319824, -7.729186058044434, -7.125635147094727, -6.522084712982178, -5.918534278869629, -5.314983367919922, -4.711432933807373, -4.107882499694824, -3.5043320655822754, -2.9007813930511475, -2.2972307205200195, -1.6936802864074707, -1.0901298522949219, -0.48657917976379395, 0.11697149276733398, 0.7205219268798828, 1.3240724802017212, 1.9276230335235596, 2.5311737060546875, 3.1347241401672363, 3.738274574279785, 4.341825485229492, 4.945375919342041, 5.54892635345459, 6.152476787567139, 6.7560272216796875, 7.3595781326293945, 7.963128566741943, 8.566679000854492, 9.1702299118042, 9.773780822753906, 10.377330780029297]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 2.0, 4.0, 3.0, 5.0, 7.0, 9.0, 8.0, 12.0, 13.0, 20.0, 22.0, 16.0, 27.0, 24.0, 44.0, 24.0, 36.0, 35.0, 42.0, 33.0, 38.0, 41.0, 39.0, 46.0, 38.0, 38.0, 41.0, 31.0, 35.0, 28.0, 27.0, 27.0, 19.0, 26.0, 22.0, 17.0, 21.0, 10.0, 13.0, 8.0, 12.0, 4.0, 6.0, 4.0, 6.0, 5.0, 1.0, 2.0, 7.0, 2.0, 3.0, 1.0], "bins": [-7.423919677734375, -7.210368633270264, -6.996817588806152, -6.783266544342041, -6.56971549987793, -6.356164932250977, -6.142613410949707, -5.929062843322754, -5.715511798858643, -5.501960754394531, -5.28840970993042, -5.074858665466309, -4.861307621002197, -4.647756576538086, -4.434206008911133, -4.2206549644470215, -4.00710391998291, -3.793552875518799, -3.5800018310546875, -3.366450786590576, -3.152899980545044, -2.9393489360809326, -2.7257978916168213, -2.512247085571289, -2.2986955642700195, -2.085144519805908, -1.8715935945510864, -1.658042550086975, -1.4444916248321533, -1.230940580368042, -1.0173895359039307, -0.8038386106491089, -0.5902876853942871, -0.37673670053482056, -0.16318568587303162, 0.050365328788757324, 0.2639163136482239, 0.47746729850769043, 0.6910183429718018, 0.9045692682266235, 1.1181203126907349, 1.3316713571548462, 1.545222282409668, 1.7587733268737793, 1.9723243713378906, 2.185875415802002, 2.3994264602661133, 2.6129772663116455, 2.826528310775757, 3.040079355239868, 3.2536303997039795, 3.4671812057495117, 3.680732250213623, 3.8942832946777344, 4.107834339141846, 4.321385383605957, 4.534936428070068, 4.74848747253418, 4.962038516998291, 5.175589561462402, 5.389140605926514, 5.602691650390625, 5.816242218017578, 6.0297932624816895, 6.243344306945801]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 4.0, 5.0, 5.0, 7.0, 7.0, 6.0, 11.0, 10.0, 10.0, 17.0, 12.0, 22.0, 24.0, 29.0, 36.0, 54.0, 63.0, 95.0, 132.0, 222.0, 449.0, 989.0, 3148.0, 12507.0, 106025.0, 4005151.0, 51866.0, 8685.0, 2549.0, 947.0, 485.0, 276.0, 146.0, 104.0, 49.0, 58.0, 27.0, 19.0, 12.0, 7.0, 7.0, 2.0, 0.0, 4.0, 1.0], "bins": [-8.7109375, -8.514617919921875, -8.31829833984375, -8.121978759765625, -7.9256591796875, -7.729339599609375, -7.53302001953125, -7.336700439453125, -7.140380859375, -6.944061279296875, -6.74774169921875, -6.551422119140625, -6.3551025390625, -6.158782958984375, -5.96246337890625, -5.766143798828125, -5.56982421875, -5.373504638671875, -5.17718505859375, -4.980865478515625, -4.7845458984375, -4.588226318359375, -4.39190673828125, -4.195587158203125, -3.999267578125, -3.802947998046875, -3.60662841796875, -3.410308837890625, -3.2139892578125, -3.017669677734375, -2.82135009765625, -2.625030517578125, -2.4287109375, -2.232391357421875, -2.03607177734375, -1.839752197265625, -1.6434326171875, -1.447113037109375, -1.25079345703125, -1.054473876953125, -0.858154296875, -0.661834716796875, -0.46551513671875, -0.269195556640625, -0.0728759765625, 0.123443603515625, 0.31976318359375, 0.516082763671875, 0.71240234375, 0.908721923828125, 1.10504150390625, 1.301361083984375, 1.4976806640625, 1.694000244140625, 1.89031982421875, 2.086639404296875, 2.282958984375, 2.479278564453125, 2.67559814453125, 2.871917724609375, 3.0682373046875, 3.264556884765625, 3.46087646484375, 3.657196044921875, 3.853515625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 13.0, 12.0, 17.0, 52.0, 60.0, 76.0, 97.0, 107.0, 103.0, 135.0, 105.0, 81.0, 43.0, 40.0, 20.0, 24.0, 6.0, 6.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.041015625, -1.0170974731445312, -0.9931793212890625, -0.9692611694335938, -0.945343017578125, -0.9214248657226562, -0.8975067138671875, -0.8735885620117188, -0.84967041015625, -0.8257522583007812, -0.8018341064453125, -0.7779159545898438, -0.753997802734375, -0.7300796508789062, -0.7061614990234375, -0.6822433471679688, -0.6583251953125, -0.6344070434570312, -0.6104888916015625, -0.5865707397460938, -0.562652587890625, -0.5387344360351562, -0.5148162841796875, -0.49089813232421875, -0.46697998046875, -0.44306182861328125, -0.4191436767578125, -0.39522552490234375, -0.371307373046875, -0.34738922119140625, -0.3234710693359375, -0.29955291748046875, -0.275634765625, -0.25171661376953125, -0.2277984619140625, -0.20388031005859375, -0.179962158203125, -0.15604400634765625, -0.1321258544921875, -0.10820770263671875, -0.08428955078125, -0.06037139892578125, -0.0364532470703125, -0.01253509521484375, 0.011383056640625, 0.03530120849609375, 0.0592193603515625, 0.08313751220703125, 0.1070556640625, 0.13097381591796875, 0.1548919677734375, 0.17881011962890625, 0.202728271484375, 0.22664642333984375, 0.2505645751953125, 0.27448272705078125, 0.29840087890625, 0.32231903076171875, 0.3462371826171875, 0.37015533447265625, 0.394073486328125, 0.41799163818359375, 0.4419097900390625, 0.46582794189453125, 0.48974609375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 1.0, 5.0, 6.0, 6.0, 13.0, 15.0, 32.0, 40.0, 57.0, 98.0, 151.0, 263.0, 449.0, 926.0, 2181.0, 5780.0, 19682.0, 116889.0, 3861350.0, 152711.0, 22342.0, 6542.0, 2492.0, 1046.0, 518.0, 282.0, 160.0, 91.0, 51.0, 37.0, 18.0, 13.0, 9.0, 7.0, 7.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.548828125, -3.424530029296875, -3.30023193359375, -3.175933837890625, -3.0516357421875, -2.927337646484375, -2.80303955078125, -2.678741455078125, -2.554443359375, -2.430145263671875, -2.30584716796875, -2.181549072265625, -2.0572509765625, -1.932952880859375, -1.80865478515625, -1.684356689453125, -1.56005859375, -1.435760498046875, -1.31146240234375, -1.187164306640625, -1.0628662109375, -0.938568115234375, -0.81427001953125, -0.689971923828125, -0.565673828125, -0.441375732421875, -0.31707763671875, -0.192779541015625, -0.0684814453125, 0.055816650390625, 0.18011474609375, 0.304412841796875, 0.4287109375, 0.553009033203125, 0.67730712890625, 0.801605224609375, 0.9259033203125, 1.050201416015625, 1.17449951171875, 1.298797607421875, 1.423095703125, 1.547393798828125, 1.67169189453125, 1.795989990234375, 1.9202880859375, 2.044586181640625, 2.16888427734375, 2.293182373046875, 2.41748046875, 2.541778564453125, 2.66607666015625, 2.790374755859375, 2.9146728515625, 3.038970947265625, 3.16326904296875, 3.287567138671875, 3.411865234375, 3.536163330078125, 3.66046142578125, 3.784759521484375, 3.9090576171875, 4.033355712890625, 4.15765380859375, 4.281951904296875, 4.40625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 6.0, 6.0, 15.0, 18.0, 19.0, 17.0, 45.0, 62.0, 119.0, 309.0, 2358.0, 664.0, 185.0, 83.0, 56.0, 31.0, 23.0, 10.0, 10.0, 12.0, 6.0, 6.0, 2.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4931640625, -1.4546279907226562, -1.4160919189453125, -1.3775558471679688, -1.339019775390625, -1.3004837036132812, -1.2619476318359375, -1.2234115600585938, -1.18487548828125, -1.1463394165039062, -1.1078033447265625, -1.0692672729492188, -1.030731201171875, -0.9921951293945312, -0.9536590576171875, -0.9151229858398438, -0.8765869140625, -0.8380508422851562, -0.7995147705078125, -0.7609786987304688, -0.722442626953125, -0.6839065551757812, -0.6453704833984375, -0.6068344116210938, -0.56829833984375, -0.5297622680664062, -0.4912261962890625, -0.45269012451171875, -0.414154052734375, -0.37561798095703125, -0.3370819091796875, -0.29854583740234375, -0.260009765625, -0.22147369384765625, -0.1829376220703125, -0.14440155029296875, -0.105865478515625, -0.06732940673828125, -0.0287933349609375, 0.00974273681640625, 0.04827880859375, 0.08681488037109375, 0.1253509521484375, 0.16388702392578125, 0.202423095703125, 0.24095916748046875, 0.2794952392578125, 0.31803131103515625, 0.3565673828125, 0.39510345458984375, 0.4336395263671875, 0.47217559814453125, 0.510711669921875, 0.5492477416992188, 0.5877838134765625, 0.6263198852539062, 0.66485595703125, 0.7033920288085938, 0.7419281005859375, 0.7804641723632812, 0.819000244140625, 0.8575363159179688, 0.8960723876953125, 0.9346084594726562, 0.97314453125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 9.0, 8.0, 33.0, 71.0, 168.0, 297.0, 232.0, 105.0, 40.0, 16.0, 14.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.675071716308594, -7.304558277130127, -6.934044361114502, -6.563530921936035, -6.193017482757568, -5.822504043579102, -5.451990127563477, -5.08147668838501, -4.710963249206543, -4.340449810028076, -3.9699361324310303, -3.5994224548339844, -3.2289090156555176, -2.8583953380584717, -2.487881660461426, -2.117368221282959, -1.746854305267334, -1.3763407468795776, -1.0058271884918213, -0.6353135108947754, -0.26479995250701904, 0.1057136058807373, 0.4762272834777832, 0.84674072265625, 1.217254400253296, 1.5877679586410522, 1.9582815170288086, 2.3287951946258545, 2.6993088722229004, 3.069822311401367, 3.440335988998413, 3.81084942817688, 4.181363105773926, 4.551876544952393, 4.922390460968018, 5.292903900146484, 5.663417339324951, 6.033930778503418, 6.404444694519043, 6.77495813369751, 7.145471572875977, 7.515985012054443, 7.886498928070068, 8.257012367248535, 8.62752628326416, 8.998039245605469, 9.368553161621094, 9.739067077636719, 10.109580993652344, 10.480094909667969, 10.850607872009277, 11.221121788024902, 11.591635704040527, 11.962148666381836, 12.332662582397461, 12.703176498413086, 13.073689460754395, 13.44420337677002, 13.814716339111328, 14.185230255126953, 14.555744171142578, 14.926257133483887, 15.296771049499512, 15.66728401184082, 16.037797927856445]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 6.0, 9.0, 18.0, 14.0, 21.0, 26.0, 24.0, 26.0, 32.0, 29.0, 20.0, 42.0, 54.0, 36.0, 58.0, 49.0, 63.0, 54.0, 59.0, 39.0, 50.0, 36.0, 37.0, 37.0, 35.0, 25.0, 24.0, 10.0, 14.0, 10.0, 13.0, 7.0, 1.0, 6.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.039074420928955, -2.9304943084716797, -2.8219144344329834, -2.713334321975708, -2.6047542095184326, -2.4961743354797363, -2.387594223022461, -2.2790141105651855, -2.1704342365264893, -2.061854124069214, -1.953274130821228, -1.8446941375732422, -1.7361141443252563, -1.6275341510772705, -1.5189540386199951, -1.4103740453720093, -1.3017939329147339, -1.193213939666748, -1.0846338272094727, -0.9760538339614868, -0.867473840713501, -0.7588937878608704, -0.6503137350082397, -0.5417337417602539, -0.4331536889076233, -0.32457366585731506, -0.21599362790584564, -0.10741358995437622, 0.0011664330959320068, 0.10974645614624023, 0.21832650899887085, 0.3269065022468567, 0.4354865550994873, 0.5440666079521179, 0.6526466012001038, 0.7612266540527344, 0.8698066473007202, 0.9783867001533508, 1.0869667530059814, 1.1955467462539673, 1.3041267395019531, 1.412706732749939, 1.5212868452072144, 1.6298668384552002, 1.738446831703186, 1.8470268249511719, 1.9556069374084473, 2.0641870498657227, 2.172767162322998, 2.2813472747802734, 2.3899271488189697, 2.498507261276245, 2.6070873737335205, 2.715667247772217, 2.824247360229492, 2.9328274726867676, 3.041407346725464, 3.1499874591827393, 3.2585673332214355, 3.367147445678711, 3.4757275581359863, 3.5843074321746826, 3.692887544631958, 3.8014674186706543, 3.9100475311279297]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 3.0, 2.0, 7.0, 8.0, 7.0, 13.0, 23.0, 24.0, 34.0, 49.0, 81.0, 149.0, 240.0, 435.0, 1043.0, 2901.0, 12247.0, 102217.0, 762841.0, 145207.0, 15297.0, 3480.0, 1124.0, 469.0, 235.0, 140.0, 74.0, 62.0, 48.0, 17.0, 17.0, 16.0, 13.0, 9.0, 8.0, 4.0, 0.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.66015625, -4.5076904296875, -4.355224609375, -4.2027587890625, -4.05029296875, -3.8978271484375, -3.745361328125, -3.5928955078125, -3.4404296875, -3.2879638671875, -3.135498046875, -2.9830322265625, -2.83056640625, -2.6781005859375, -2.525634765625, -2.3731689453125, -2.220703125, -2.0682373046875, -1.915771484375, -1.7633056640625, -1.61083984375, -1.4583740234375, -1.305908203125, -1.1534423828125, -1.0009765625, -0.8485107421875, -0.696044921875, -0.5435791015625, -0.39111328125, -0.2386474609375, -0.086181640625, 0.0662841796875, 0.21875, 0.3712158203125, 0.523681640625, 0.6761474609375, 0.82861328125, 0.9810791015625, 1.133544921875, 1.2860107421875, 1.4384765625, 1.5909423828125, 1.743408203125, 1.8958740234375, 2.04833984375, 2.2008056640625, 2.353271484375, 2.5057373046875, 2.658203125, 2.8106689453125, 2.963134765625, 3.1156005859375, 3.26806640625, 3.4205322265625, 3.572998046875, 3.7254638671875, 3.8779296875, 4.0303955078125, 4.182861328125, 4.3353271484375, 4.48779296875, 4.6402587890625, 4.792724609375, 4.9451904296875, 5.09765625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 6.0, 7.0, 8.0, 28.0, 36.0, 46.0, 64.0, 72.0, 73.0, 93.0, 114.0, 106.0, 90.0, 69.0, 62.0, 44.0, 28.0, 23.0, 12.0, 6.0, 8.0, 3.0, 0.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0], "bins": [-0.90234375, -0.8811302185058594, -0.8599166870117188, -0.8387031555175781, -0.8174896240234375, -0.7962760925292969, -0.7750625610351562, -0.7538490295410156, -0.732635498046875, -0.7114219665527344, -0.6902084350585938, -0.6689949035644531, -0.6477813720703125, -0.6265678405761719, -0.6053543090820312, -0.5841407775878906, -0.56292724609375, -0.5417137145996094, -0.5205001831054688, -0.4992866516113281, -0.4780731201171875, -0.4568595886230469, -0.43564605712890625, -0.4144325256347656, -0.393218994140625, -0.3720054626464844, -0.35079193115234375, -0.3295783996582031, -0.3083648681640625, -0.2871513366699219, -0.26593780517578125, -0.24472427368164062, -0.2235107421875, -0.20229721069335938, -0.18108367919921875, -0.15987014770507812, -0.1386566162109375, -0.11744308471679688, -0.09622955322265625, -0.07501602172851562, -0.053802490234375, -0.032588958740234375, -0.01137542724609375, 0.009838104248046875, 0.0310516357421875, 0.052265167236328125, 0.07347869873046875, 0.09469223022460938, 0.11590576171875, 0.13711929321289062, 0.15833282470703125, 0.17954635620117188, 0.2007598876953125, 0.22197341918945312, 0.24318695068359375, 0.2644004821777344, 0.285614013671875, 0.3068275451660156, 0.32804107666015625, 0.3492546081542969, 0.3704681396484375, 0.3916816711425781, 0.41289520263671875, 0.4341087341308594, 0.455322265625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 1.0, 6.0, 4.0, 5.0, 11.0, 21.0, 22.0, 21.0, 35.0, 54.0, 64.0, 100.0, 156.0, 248.0, 445.0, 820.0, 1541.0, 3230.0, 7169.0, 17611.0, 51246.0, 170467.0, 426730.0, 250961.0, 74951.0, 24746.0, 9565.0, 4006.0, 1895.0, 985.0, 537.0, 340.0, 188.0, 105.0, 76.0, 53.0, 42.0, 27.0, 18.0, 10.0, 11.0, 11.0, 6.0, 9.0, 7.0, 1.0, 0.0, 1.0, 3.0], "bins": [-1.9873046875, -1.934539794921875, -1.88177490234375, -1.829010009765625, -1.7762451171875, -1.723480224609375, -1.67071533203125, -1.617950439453125, -1.565185546875, -1.512420654296875, -1.45965576171875, -1.406890869140625, -1.3541259765625, -1.301361083984375, -1.24859619140625, -1.195831298828125, -1.14306640625, -1.090301513671875, -1.03753662109375, -0.984771728515625, -0.9320068359375, -0.879241943359375, -0.82647705078125, -0.773712158203125, -0.720947265625, -0.668182373046875, -0.61541748046875, -0.562652587890625, -0.5098876953125, -0.457122802734375, -0.40435791015625, -0.351593017578125, -0.298828125, -0.246063232421875, -0.19329833984375, -0.140533447265625, -0.0877685546875, -0.035003662109375, 0.01776123046875, 0.070526123046875, 0.123291015625, 0.176055908203125, 0.22882080078125, 0.281585693359375, 0.3343505859375, 0.387115478515625, 0.43988037109375, 0.492645263671875, 0.54541015625, 0.598175048828125, 0.65093994140625, 0.703704833984375, 0.7564697265625, 0.809234619140625, 0.86199951171875, 0.914764404296875, 0.967529296875, 1.020294189453125, 1.07305908203125, 1.125823974609375, 1.1785888671875, 1.231353759765625, 1.28411865234375, 1.336883544921875, 1.3896484375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 4.0, 5.0, 9.0, 11.0, 11.0, 15.0, 9.0, 18.0, 20.0, 29.0, 30.0, 22.0, 38.0, 41.0, 48.0, 38.0, 57.0, 50.0, 44.0, 49.0, 39.0, 42.0, 53.0, 42.0, 41.0, 26.0, 25.0, 21.0, 24.0, 34.0, 24.0, 17.0, 13.0, 8.0, 12.0, 5.0, 6.0, 7.0, 2.0, 4.0, 7.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.3056640625, -1.260833740234375, -1.21600341796875, -1.171173095703125, -1.1263427734375, -1.081512451171875, -1.03668212890625, -0.991851806640625, -0.947021484375, -0.902191162109375, -0.85736083984375, -0.812530517578125, -0.7677001953125, -0.722869873046875, -0.67803955078125, -0.633209228515625, -0.58837890625, -0.543548583984375, -0.49871826171875, -0.453887939453125, -0.4090576171875, -0.364227294921875, -0.31939697265625, -0.274566650390625, -0.229736328125, -0.184906005859375, -0.14007568359375, -0.095245361328125, -0.0504150390625, -0.005584716796875, 0.03924560546875, 0.084075927734375, 0.12890625, 0.173736572265625, 0.21856689453125, 0.263397216796875, 0.3082275390625, 0.353057861328125, 0.39788818359375, 0.442718505859375, 0.487548828125, 0.532379150390625, 0.57720947265625, 0.622039794921875, 0.6668701171875, 0.711700439453125, 0.75653076171875, 0.801361083984375, 0.84619140625, 0.891021728515625, 0.93585205078125, 0.980682373046875, 1.0255126953125, 1.070343017578125, 1.11517333984375, 1.160003662109375, 1.204833984375, 1.249664306640625, 1.29449462890625, 1.339324951171875, 1.3841552734375, 1.428985595703125, 1.47381591796875, 1.518646240234375, 1.5634765625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 10.0, 7.0, 15.0, 12.0, 34.0, 46.0, 73.0, 133.0, 246.0, 535.0, 1459.0, 5475.0, 50779.0, 891175.0, 88520.0, 7051.0, 1705.0, 646.0, 260.0, 150.0, 79.0, 50.0, 41.0, 19.0, 9.0, 6.0, 4.0, 1.0, 4.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.837890625, -2.7643280029296875, -2.690765380859375, -2.6172027587890625, -2.54364013671875, -2.4700775146484375, -2.396514892578125, -2.3229522705078125, -2.2493896484375, -2.1758270263671875, -2.102264404296875, -2.0287017822265625, -1.95513916015625, -1.8815765380859375, -1.808013916015625, -1.7344512939453125, -1.660888671875, -1.5873260498046875, -1.513763427734375, -1.4402008056640625, -1.36663818359375, -1.2930755615234375, -1.219512939453125, -1.1459503173828125, -1.0723876953125, -0.9988250732421875, -0.925262451171875, -0.8516998291015625, -0.77813720703125, -0.7045745849609375, -0.631011962890625, -0.5574493408203125, -0.48388671875, -0.4103240966796875, -0.336761474609375, -0.2631988525390625, -0.18963623046875, -0.1160736083984375, -0.042510986328125, 0.0310516357421875, 0.1046142578125, 0.1781768798828125, 0.251739501953125, 0.3253021240234375, 0.39886474609375, 0.4724273681640625, 0.545989990234375, 0.6195526123046875, 0.693115234375, 0.7666778564453125, 0.840240478515625, 0.9138031005859375, 0.98736572265625, 1.0609283447265625, 1.134490966796875, 1.2080535888671875, 1.2816162109375, 1.3551788330078125, 1.428741455078125, 1.5023040771484375, 1.57586669921875, 1.6494293212890625, 1.722991943359375, 1.7965545654296875, 1.8701171875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 3.0, 9.0, 8.0, 10.0, 16.0, 14.0, 26.0, 35.0, 57.0, 82.0, 116.0, 127.0, 116.0, 113.0, 63.0, 51.0, 52.0, 35.0, 20.0, 12.0, 19.0, 7.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022149085998535156, -0.0002142973244190216, -0.00020710378885269165, -0.0001999102532863617, -0.00019271671772003174, -0.00018552318215370178, -0.00017832964658737183, -0.00017113611102104187, -0.00016394257545471191, -0.00015674903988838196, -0.000149555504322052, -0.00014236196875572205, -0.0001351684331893921, -0.00012797489762306213, -0.00012078136205673218, -0.00011358782649040222, -0.00010639429092407227, -9.920075535774231e-05, -9.200721979141235e-05, -8.48136842250824e-05, -7.762014865875244e-05, -7.042661309242249e-05, -6.323307752609253e-05, -5.603954195976257e-05, -4.884600639343262e-05, -4.165247082710266e-05, -3.4458935260772705e-05, -2.726539969444275e-05, -2.0071864128112793e-05, -1.2878328561782837e-05, -5.684792995452881e-06, 1.5087425708770752e-06, 8.702278137207031e-06, 1.5895813703536987e-05, 2.3089349269866943e-05, 3.02828848361969e-05, 3.7476420402526855e-05, 4.466995596885681e-05, 5.186349153518677e-05, 5.9057027101516724e-05, 6.625056266784668e-05, 7.344409823417664e-05, 8.063763380050659e-05, 8.783116936683655e-05, 9.50247049331665e-05, 0.00010221824049949646, 0.00010941177606582642, 0.00011660531163215637, 0.00012379884719848633, 0.00013099238276481628, 0.00013818591833114624, 0.0001453794538974762, 0.00015257298946380615, 0.0001597665250301361, 0.00016696006059646606, 0.00017415359616279602, 0.00018134713172912598, 0.00018854066729545593, 0.0001957342028617859, 0.00020292773842811584, 0.0002101212739944458, 0.00021731480956077576, 0.0002245083451271057, 0.00023170188069343567, 0.00023889541625976562]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 6.0, 8.0, 10.0, 16.0, 21.0, 37.0, 62.0, 100.0, 151.0, 259.0, 409.0, 726.0, 1594.0, 3957.0, 12580.0, 69465.0, 661724.0, 258902.0, 26593.0, 6951.0, 2478.0, 1080.0, 561.0, 297.0, 197.0, 139.0, 68.0, 50.0, 33.0, 17.0, 16.0, 11.0, 5.0, 2.0, 8.0, 2.0, 4.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4619140625, -1.4172821044921875, -1.372650146484375, -1.3280181884765625, -1.28338623046875, -1.2387542724609375, -1.194122314453125, -1.1494903564453125, -1.1048583984375, -1.0602264404296875, -1.015594482421875, -0.9709625244140625, -0.92633056640625, -0.8816986083984375, -0.837066650390625, -0.7924346923828125, -0.747802734375, -0.7031707763671875, -0.658538818359375, -0.6139068603515625, -0.56927490234375, -0.5246429443359375, -0.480010986328125, -0.4353790283203125, -0.3907470703125, -0.3461151123046875, -0.301483154296875, -0.2568511962890625, -0.21221923828125, -0.1675872802734375, -0.122955322265625, -0.0783233642578125, -0.03369140625, 0.0109405517578125, 0.055572509765625, 0.1002044677734375, 0.14483642578125, 0.1894683837890625, 0.234100341796875, 0.2787322998046875, 0.3233642578125, 0.3679962158203125, 0.412628173828125, 0.4572601318359375, 0.50189208984375, 0.5465240478515625, 0.591156005859375, 0.6357879638671875, 0.680419921875, 0.7250518798828125, 0.769683837890625, 0.8143157958984375, 0.85894775390625, 0.9035797119140625, 0.948211669921875, 0.9928436279296875, 1.0374755859375, 1.0821075439453125, 1.126739501953125, 1.1713714599609375, 1.21600341796875, 1.2606353759765625, 1.305267333984375, 1.3498992919921875, 1.39453125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 5.0, 10.0, 9.0, 6.0, 12.0, 14.0, 21.0, 38.0, 65.0, 108.0, 141.0, 153.0, 145.0, 90.0, 68.0, 41.0, 31.0, 10.0, 10.0, 7.0, 7.0, 7.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.091796875, -1.055908203125, -1.02001953125, -0.984130859375, -0.9482421875, -0.912353515625, -0.87646484375, -0.840576171875, -0.8046875, -0.768798828125, -0.73291015625, -0.697021484375, -0.6611328125, -0.625244140625, -0.58935546875, -0.553466796875, -0.517578125, -0.481689453125, -0.44580078125, -0.409912109375, -0.3740234375, -0.338134765625, -0.30224609375, -0.266357421875, -0.23046875, -0.194580078125, -0.15869140625, -0.122802734375, -0.0869140625, -0.051025390625, -0.01513671875, 0.020751953125, 0.056640625, 0.092529296875, 0.12841796875, 0.164306640625, 0.2001953125, 0.236083984375, 0.27197265625, 0.307861328125, 0.34375, 0.379638671875, 0.41552734375, 0.451416015625, 0.4873046875, 0.523193359375, 0.55908203125, 0.594970703125, 0.630859375, 0.666748046875, 0.70263671875, 0.738525390625, 0.7744140625, 0.810302734375, 0.84619140625, 0.882080078125, 0.91796875, 0.953857421875, 0.98974609375, 1.025634765625, 1.0615234375, 1.097412109375, 1.13330078125, 1.169189453125, 1.205078125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 13.0, 16.0, 18.0, 49.0, 111.0, 133.0, 196.0, 170.0, 128.0, 78.0, 35.0, 24.0, 15.0, 8.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.58957290649414, -13.040345191955566, -12.491117477416992, -11.941890716552734, -11.39266300201416, -10.843435287475586, -10.294207572937012, -9.744979858398438, -9.19575309753418, -8.646525382995605, -8.097297668457031, -7.548070430755615, -6.998843193054199, -6.449615478515625, -5.900387763977051, -5.351160049438477, -4.801932334899902, -4.252704620361328, -3.703477382659912, -3.154249668121338, -2.6050221920013428, -2.0557947158813477, -1.5065670013427734, -0.9573395252227783, -0.4081120491027832, 0.1411154866218567, 0.6903430223464966, 1.2395706176757812, 1.7887980937957764, 2.3380255699157715, 2.8872532844543457, 3.436480760574341, 3.985708236694336, 4.53493595123291, 5.084163188934326, 5.6333909034729, 6.182618141174316, 6.731845855712891, 7.281073570251465, 7.830301284790039, 8.379528045654297, 8.928755760192871, 9.477983474731445, 10.027210235595703, 10.576437950134277, 11.125665664672852, 11.674893379211426, 12.22412109375, 12.773348808288574, 13.322576522827148, 13.871804237365723, 14.421031951904297, 14.970258712768555, 15.519486427307129, 16.068714141845703, 16.61794090270996, 17.16716957092285, 17.71639633178711, 18.265625, 18.814851760864258, 19.36408042907715, 19.913307189941406, 20.462535858154297, 21.011762619018555, 21.560989379882812]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 1.0, 0.0, 6.0, 2.0, 5.0, 6.0, 8.0, 11.0, 15.0, 13.0, 13.0, 20.0, 20.0, 25.0, 30.0, 30.0, 25.0, 32.0, 32.0, 38.0, 32.0, 42.0, 49.0, 35.0, 44.0, 44.0, 41.0, 41.0, 29.0, 46.0, 31.0, 34.0, 18.0, 28.0, 25.0, 22.0, 20.0, 16.0, 15.0, 12.0, 13.0, 9.0, 7.0, 6.0, 1.0, 3.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-7.248810768127441, -7.030357360839844, -6.811903953552246, -6.593450546264648, -6.374996662139893, -6.156543254852295, -5.938089847564697, -5.7196364402771, -5.501183032989502, -5.282729625701904, -5.064276218414307, -4.845822334289551, -4.627368927001953, -4.4089155197143555, -4.190462112426758, -3.97200870513916, -3.7535550594329834, -3.5351016521453857, -3.316648006439209, -3.0981945991516113, -2.8797411918640137, -2.661287784576416, -2.4428341388702393, -2.2243807315826416, -2.005927085876465, -1.7874735593795776, -1.56902015209198, -1.3505666255950928, -1.1321132183074951, -0.9136596918106079, -0.6952061653137207, -0.47675275802612305, -0.2582993507385254, -0.039845868945121765, 0.17860761284828186, 0.3970611095428467, 0.6155145764350891, 0.8339680433273315, 1.0524215698242188, 1.2708749771118164, 1.4893285036087036, 1.7077820301055908, 1.9262354373931885, 2.1446890830993652, 2.363142490386963, 2.5815958976745605, 2.800049304962158, 3.018502712249756, 3.2369563579559326, 3.4554097652435303, 3.673863410949707, 3.8923168182373047, 4.110770225524902, 4.3292236328125, 4.547677040100098, 4.766130447387695, 4.984584331512451, 5.203037738800049, 5.4214911460876465, 5.639945030212402, 5.8583984375, 6.076851844787598, 6.295305252075195, 6.513758659362793, 6.732212066650391]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 3.0, 3.0, 5.0, 3.0, 8.0, 9.0, 12.0, 10.0, 14.0, 14.0, 16.0, 20.0, 25.0, 26.0, 36.0, 46.0, 57.0, 83.0, 138.0, 200.0, 396.0, 737.0, 1872.0, 5180.0, 18483.0, 131368.0, 3929517.0, 83059.0, 14351.0, 4510.0, 1836.0, 891.0, 501.0, 282.0, 185.0, 129.0, 80.0, 58.0, 44.0, 26.0, 18.0, 8.0, 6.0, 8.0, 4.0, 2.0, 2.0, 2.0], "bins": [-6.15234375, -6.007293701171875, -5.86224365234375, -5.717193603515625, -5.5721435546875, -5.427093505859375, -5.28204345703125, -5.136993408203125, -4.991943359375, -4.846893310546875, -4.70184326171875, -4.556793212890625, -4.4117431640625, -4.266693115234375, -4.12164306640625, -3.976593017578125, -3.83154296875, -3.686492919921875, -3.54144287109375, -3.396392822265625, -3.2513427734375, -3.106292724609375, -2.96124267578125, -2.816192626953125, -2.671142578125, -2.526092529296875, -2.38104248046875, -2.235992431640625, -2.0909423828125, -1.945892333984375, -1.80084228515625, -1.655792236328125, -1.5107421875, -1.365692138671875, -1.22064208984375, -1.075592041015625, -0.9305419921875, -0.785491943359375, -0.64044189453125, -0.495391845703125, -0.350341796875, -0.205291748046875, -0.06024169921875, 0.084808349609375, 0.2298583984375, 0.374908447265625, 0.51995849609375, 0.665008544921875, 0.81005859375, 0.955108642578125, 1.10015869140625, 1.245208740234375, 1.3902587890625, 1.535308837890625, 1.68035888671875, 1.825408935546875, 1.970458984375, 2.115509033203125, 2.26055908203125, 2.405609130859375, 2.5506591796875, 2.695709228515625, 2.84075927734375, 2.985809326171875, 3.130859375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 3.0, 7.0, 14.0, 16.0, 30.0, 44.0, 54.0, 49.0, 68.0, 69.0, 81.0, 83.0, 88.0, 84.0, 50.0, 66.0, 58.0, 38.0, 39.0, 20.0, 11.0, 12.0, 6.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.78173828125, -0.7620773315429688, -0.7424163818359375, -0.7227554321289062, -0.703094482421875, -0.6834335327148438, -0.6637725830078125, -0.6441116333007812, -0.62445068359375, -0.6047897338867188, -0.5851287841796875, -0.5654678344726562, -0.545806884765625, -0.5261459350585938, -0.5064849853515625, -0.48682403564453125, -0.4671630859375, -0.44750213623046875, -0.4278411865234375, -0.40818023681640625, -0.388519287109375, -0.36885833740234375, -0.3491973876953125, -0.32953643798828125, -0.30987548828125, -0.29021453857421875, -0.2705535888671875, -0.25089263916015625, -0.231231689453125, -0.21157073974609375, -0.1919097900390625, -0.17224884033203125, -0.152587890625, -0.13292694091796875, -0.1132659912109375, -0.09360504150390625, -0.073944091796875, -0.05428314208984375, -0.0346221923828125, -0.01496124267578125, 0.00469970703125, 0.02436065673828125, 0.0440216064453125, 0.06368255615234375, 0.083343505859375, 0.10300445556640625, 0.1226654052734375, 0.14232635498046875, 0.1619873046875, 0.18164825439453125, 0.2013092041015625, 0.22097015380859375, 0.240631103515625, 0.26029205322265625, 0.2799530029296875, 0.29961395263671875, 0.31927490234375, 0.33893585205078125, 0.3585968017578125, 0.37825775146484375, 0.397918701171875, 0.41757965087890625, 0.4372406005859375, 0.45690155029296875, 0.4765625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 5.0, 1.0, 11.0, 3.0, 10.0, 24.0, 32.0, 29.0, 29.0, 58.0, 71.0, 139.0, 218.0, 343.0, 522.0, 854.0, 1541.0, 2951.0, 5967.0, 13736.0, 38934.0, 189077.0, 3628309.0, 239203.0, 43597.0, 14728.0, 6505.0, 3149.0, 1673.0, 944.0, 561.0, 371.0, 205.0, 152.0, 92.0, 72.0, 49.0, 35.0, 23.0, 14.0, 11.0, 8.0, 3.0, 10.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0], "bins": [-2.572265625, -2.488067626953125, -2.40386962890625, -2.319671630859375, -2.2354736328125, -2.151275634765625, -2.06707763671875, -1.982879638671875, -1.898681640625, -1.814483642578125, -1.73028564453125, -1.646087646484375, -1.5618896484375, -1.477691650390625, -1.39349365234375, -1.309295654296875, -1.22509765625, -1.140899658203125, -1.05670166015625, -0.972503662109375, -0.8883056640625, -0.804107666015625, -0.71990966796875, -0.635711669921875, -0.551513671875, -0.467315673828125, -0.38311767578125, -0.298919677734375, -0.2147216796875, -0.130523681640625, -0.04632568359375, 0.037872314453125, 0.1220703125, 0.206268310546875, 0.29046630859375, 0.374664306640625, 0.4588623046875, 0.543060302734375, 0.62725830078125, 0.711456298828125, 0.795654296875, 0.879852294921875, 0.96405029296875, 1.048248291015625, 1.1324462890625, 1.216644287109375, 1.30084228515625, 1.385040283203125, 1.46923828125, 1.553436279296875, 1.63763427734375, 1.721832275390625, 1.8060302734375, 1.890228271484375, 1.97442626953125, 2.058624267578125, 2.142822265625, 2.227020263671875, 2.31121826171875, 2.395416259765625, 2.4796142578125, 2.563812255859375, 2.64801025390625, 2.732208251953125, 2.81640625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 11.0, 8.0, 8.0, 10.0, 9.0, 20.0, 19.0, 23.0, 45.0, 43.0, 94.0, 156.0, 433.0, 2076.0, 617.0, 210.0, 90.0, 65.0, 32.0, 29.0, 21.0, 10.0, 14.0, 8.0, 5.0, 2.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0419921875, -1.004241943359375, -0.96649169921875, -0.928741455078125, -0.8909912109375, -0.853240966796875, -0.81549072265625, -0.777740478515625, -0.739990234375, -0.702239990234375, -0.66448974609375, -0.626739501953125, -0.5889892578125, -0.551239013671875, -0.51348876953125, -0.475738525390625, -0.43798828125, -0.400238037109375, -0.36248779296875, -0.324737548828125, -0.2869873046875, -0.249237060546875, -0.21148681640625, -0.173736572265625, -0.135986328125, -0.098236083984375, -0.06048583984375, -0.022735595703125, 0.0150146484375, 0.052764892578125, 0.09051513671875, 0.128265380859375, 0.166015625, 0.203765869140625, 0.24151611328125, 0.279266357421875, 0.3170166015625, 0.354766845703125, 0.39251708984375, 0.430267333984375, 0.468017578125, 0.505767822265625, 0.54351806640625, 0.581268310546875, 0.6190185546875, 0.656768798828125, 0.69451904296875, 0.732269287109375, 0.77001953125, 0.807769775390625, 0.84552001953125, 0.883270263671875, 0.9210205078125, 0.958770751953125, 0.99652099609375, 1.034271240234375, 1.072021484375, 1.109771728515625, 1.14752197265625, 1.185272216796875, 1.2230224609375, 1.260772705078125, 1.29852294921875, 1.336273193359375, 1.3740234375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 11.0, 14.0, 41.0, 57.0, 155.0, 233.0, 210.0, 141.0, 82.0, 24.0, 11.0, 7.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.101417541503906, -10.718205451965332, -10.334993362426758, -9.951781272888184, -9.56856918334961, -9.185358047485352, -8.802145004272461, -8.418933868408203, -8.035721778869629, -7.652509689331055, -7.2692975997924805, -6.886085510253906, -6.50287389755249, -6.119661808013916, -5.736449718475342, -5.353238105773926, -4.970025539398193, -4.586813449859619, -4.203601360321045, -3.82038950920105, -3.4371776580810547, -3.0539655685424805, -2.6707534790039062, -2.287541627883911, -1.904329538345337, -1.5211175680160522, -1.1379055976867676, -0.7546935081481934, -0.3714815378189087, 0.011730432510375977, 0.3949425220489502, 0.7781543731689453, 1.1613664627075195, 1.5445784330368042, 1.9277904033660889, 2.311002492904663, 2.694214344024658, 3.0774264335632324, 3.4606385231018066, 3.8438503742218018, 4.227062225341797, 4.610274314880371, 4.993486404418945, 5.3766984939575195, 5.7599101066589355, 6.14312219619751, 6.526334285736084, 6.9095458984375, 7.292758464813232, 7.675970554351807, 8.059182167053223, 8.442394256591797, 8.825606346130371, 9.208818435668945, 9.59203052520752, 9.975242614746094, 10.358454704284668, 10.741666793823242, 11.124878883361816, 11.50809097290039, 11.891303062438965, 12.274515151977539, 12.657726287841797, 13.040938377380371, 13.424150466918945]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 3.0, 4.0, 5.0, 4.0, 7.0, 11.0, 13.0, 12.0, 21.0, 19.0, 22.0, 29.0, 43.0, 27.0, 55.0, 45.0, 50.0, 65.0, 38.0, 53.0, 55.0, 50.0, 49.0, 44.0, 47.0, 28.0, 36.0, 34.0, 24.0, 26.0, 19.0, 13.0, 13.0, 9.0, 5.0, 9.0, 2.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.616724967956543, -4.49234676361084, -4.3679680824279785, -4.243589878082275, -4.119211196899414, -3.994832992553711, -3.8704545497894287, -3.7460761070251465, -3.6216976642608643, -3.497319221496582, -3.3729407787323, -3.2485623359680176, -3.1241841316223145, -2.999805450439453, -2.87542724609375, -2.7510488033294678, -2.6266703605651855, -2.5022919178009033, -2.377913475036621, -2.253535032272339, -2.1291565895080566, -2.0047783851623535, -1.8803999423980713, -1.756021499633789, -1.6316430568695068, -1.5072646141052246, -1.3828861713409424, -1.2585078477859497, -1.1341294050216675, -1.0097509622573853, -0.8853725790977478, -0.7609941959381104, -0.6366157531738281, -0.5122373104095459, -0.38785892724990845, -0.2634805142879486, -0.13910210132598877, -0.014723658561706543, 0.10965472459793091, 0.23403310775756836, 0.3584115505218506, 0.4827899634838104, 0.6071683764457703, 0.7315467596054077, 0.8559252023696899, 0.9803036451339722, 1.1046819686889648, 1.229060411453247, 1.3534388542175293, 1.4778172969818115, 1.6021957397460938, 1.7265740633010864, 1.8509525060653687, 1.9753309488296509, 2.0997092723846436, 2.224087715148926, 2.348466157913208, 2.4728446006774902, 2.5972230434417725, 2.7216014862060547, 2.845979690551758, 2.970358371734619, 3.0947365760803223, 3.2191150188446045, 3.3434934616088867]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 6.0, 9.0, 9.0, 18.0, 28.0, 44.0, 59.0, 116.0, 185.0, 335.0, 756.0, 1914.0, 6699.0, 40514.0, 623709.0, 341231.0, 25147.0, 4973.0, 1541.0, 600.0, 279.0, 135.0, 92.0, 53.0, 24.0, 21.0, 10.0, 9.0, 12.0, 4.0, 6.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.31640625, -4.149658203125, -3.98291015625, -3.816162109375, -3.6494140625, -3.482666015625, -3.31591796875, -3.149169921875, -2.982421875, -2.815673828125, -2.64892578125, -2.482177734375, -2.3154296875, -2.148681640625, -1.98193359375, -1.815185546875, -1.6484375, -1.481689453125, -1.31494140625, -1.148193359375, -0.9814453125, -0.814697265625, -0.64794921875, -0.481201171875, -0.314453125, -0.147705078125, 0.01904296875, 0.185791015625, 0.3525390625, 0.519287109375, 0.68603515625, 0.852783203125, 1.01953125, 1.186279296875, 1.35302734375, 1.519775390625, 1.6865234375, 1.853271484375, 2.02001953125, 2.186767578125, 2.353515625, 2.520263671875, 2.68701171875, 2.853759765625, 3.0205078125, 3.187255859375, 3.35400390625, 3.520751953125, 3.6875, 3.854248046875, 4.02099609375, 4.187744140625, 4.3544921875, 4.521240234375, 4.68798828125, 4.854736328125, 5.021484375, 5.188232421875, 5.35498046875, 5.521728515625, 5.6884765625, 5.855224609375, 6.02197265625, 6.188720703125, 6.35546875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 7.0, 6.0, 19.0, 13.0, 28.0, 34.0, 48.0, 57.0, 55.0, 70.0, 89.0, 67.0, 81.0, 74.0, 63.0, 65.0, 54.0, 45.0, 36.0, 22.0, 11.0, 17.0, 14.0, 6.0, 6.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.70458984375, -0.685577392578125, -0.66656494140625, -0.647552490234375, -0.6285400390625, -0.609527587890625, -0.59051513671875, -0.571502685546875, -0.552490234375, -0.533477783203125, -0.51446533203125, -0.495452880859375, -0.4764404296875, -0.457427978515625, -0.43841552734375, -0.419403076171875, -0.400390625, -0.381378173828125, -0.36236572265625, -0.343353271484375, -0.3243408203125, -0.305328369140625, -0.28631591796875, -0.267303466796875, -0.248291015625, -0.229278564453125, -0.21026611328125, -0.191253662109375, -0.1722412109375, -0.153228759765625, -0.13421630859375, -0.115203857421875, -0.09619140625, -0.077178955078125, -0.05816650390625, -0.039154052734375, -0.0201416015625, -0.001129150390625, 0.01788330078125, 0.036895751953125, 0.055908203125, 0.074920654296875, 0.09393310546875, 0.112945556640625, 0.1319580078125, 0.150970458984375, 0.16998291015625, 0.188995361328125, 0.2080078125, 0.227020263671875, 0.24603271484375, 0.265045166015625, 0.2840576171875, 0.303070068359375, 0.32208251953125, 0.341094970703125, 0.360107421875, 0.379119873046875, 0.39813232421875, 0.417144775390625, 0.4361572265625, 0.455169677734375, 0.47418212890625, 0.493194580078125, 0.51220703125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 6.0, 2.0, 0.0, 3.0, 2.0, 1.0, 7.0, 6.0, 8.0, 10.0, 20.0, 15.0, 23.0, 49.0, 69.0, 93.0, 149.0, 248.0, 423.0, 717.0, 1506.0, 3702.0, 9828.0, 33455.0, 146670.0, 540915.0, 237175.0, 50172.0, 14276.0, 4922.0, 1861.0, 891.0, 482.0, 285.0, 176.0, 116.0, 72.0, 60.0, 38.0, 32.0, 25.0, 13.0, 13.0, 10.0, 6.0, 4.0, 4.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.03125, -1.9649658203125, -1.898681640625, -1.8323974609375, -1.76611328125, -1.6998291015625, -1.633544921875, -1.5672607421875, -1.5009765625, -1.4346923828125, -1.368408203125, -1.3021240234375, -1.23583984375, -1.1695556640625, -1.103271484375, -1.0369873046875, -0.970703125, -0.9044189453125, -0.838134765625, -0.7718505859375, -0.70556640625, -0.6392822265625, -0.572998046875, -0.5067138671875, -0.4404296875, -0.3741455078125, -0.307861328125, -0.2415771484375, -0.17529296875, -0.1090087890625, -0.042724609375, 0.0235595703125, 0.08984375, 0.1561279296875, 0.222412109375, 0.2886962890625, 0.35498046875, 0.4212646484375, 0.487548828125, 0.5538330078125, 0.6201171875, 0.6864013671875, 0.752685546875, 0.8189697265625, 0.88525390625, 0.9515380859375, 1.017822265625, 1.0841064453125, 1.150390625, 1.2166748046875, 1.282958984375, 1.3492431640625, 1.41552734375, 1.4818115234375, 1.548095703125, 1.6143798828125, 1.6806640625, 1.7469482421875, 1.813232421875, 1.8795166015625, 1.94580078125, 2.0120849609375, 2.078369140625, 2.1446533203125, 2.2109375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 3.0, 1.0, 9.0, 3.0, 12.0, 5.0, 9.0, 12.0, 11.0, 19.0, 24.0, 25.0, 27.0, 43.0, 48.0, 41.0, 40.0, 35.0, 49.0, 46.0, 44.0, 39.0, 42.0, 49.0, 43.0, 56.0, 35.0, 47.0, 22.0, 25.0, 24.0, 6.0, 19.0, 17.0, 23.0, 11.0, 12.0, 4.0, 9.0, 7.0, 8.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5068359375, -1.455352783203125, -1.40386962890625, -1.352386474609375, -1.3009033203125, -1.249420166015625, -1.19793701171875, -1.146453857421875, -1.094970703125, -1.043487548828125, -0.99200439453125, -0.940521240234375, -0.8890380859375, -0.837554931640625, -0.78607177734375, -0.734588623046875, -0.68310546875, -0.631622314453125, -0.58013916015625, -0.528656005859375, -0.4771728515625, -0.425689697265625, -0.37420654296875, -0.322723388671875, -0.271240234375, -0.219757080078125, -0.16827392578125, -0.116790771484375, -0.0653076171875, -0.013824462890625, 0.03765869140625, 0.089141845703125, 0.140625, 0.192108154296875, 0.24359130859375, 0.295074462890625, 0.3465576171875, 0.398040771484375, 0.44952392578125, 0.501007080078125, 0.552490234375, 0.603973388671875, 0.65545654296875, 0.706939697265625, 0.7584228515625, 0.809906005859375, 0.86138916015625, 0.912872314453125, 0.96435546875, 1.015838623046875, 1.06732177734375, 1.118804931640625, 1.1702880859375, 1.221771240234375, 1.27325439453125, 1.324737548828125, 1.376220703125, 1.427703857421875, 1.47918701171875, 1.530670166015625, 1.5821533203125, 1.633636474609375, 1.68511962890625, 1.736602783203125, 1.7880859375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 4.0, 7.0, 7.0, 7.0, 18.0, 20.0, 31.0, 77.0, 137.0, 258.0, 602.0, 1628.0, 5745.0, 50144.0, 864004.0, 113535.0, 8737.0, 2154.0, 755.0, 331.0, 154.0, 75.0, 40.0, 33.0, 12.0, 13.0, 12.0, 4.0, 4.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.04296875, -1.9739990234375, -1.905029296875, -1.8360595703125, -1.76708984375, -1.6981201171875, -1.629150390625, -1.5601806640625, -1.4912109375, -1.4222412109375, -1.353271484375, -1.2843017578125, -1.21533203125, -1.1463623046875, -1.077392578125, -1.0084228515625, -0.939453125, -0.8704833984375, -0.801513671875, -0.7325439453125, -0.66357421875, -0.5946044921875, -0.525634765625, -0.4566650390625, -0.3876953125, -0.3187255859375, -0.249755859375, -0.1807861328125, -0.11181640625, -0.0428466796875, 0.026123046875, 0.0950927734375, 0.1640625, 0.2330322265625, 0.302001953125, 0.3709716796875, 0.43994140625, 0.5089111328125, 0.577880859375, 0.6468505859375, 0.7158203125, 0.7847900390625, 0.853759765625, 0.9227294921875, 0.99169921875, 1.0606689453125, 1.129638671875, 1.1986083984375, 1.267578125, 1.3365478515625, 1.405517578125, 1.4744873046875, 1.54345703125, 1.6124267578125, 1.681396484375, 1.7503662109375, 1.8193359375, 1.8883056640625, 1.957275390625, 2.0262451171875, 2.09521484375, 2.1641845703125, 2.233154296875, 2.3021240234375, 2.37109375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 8.0, 7.0, 8.0, 14.0, 28.0, 37.0, 55.0, 87.0, 175.0, 160.0, 163.0, 91.0, 59.0, 36.0, 27.0, 13.0, 9.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003418922424316406, -0.00033226609230041504, -0.00032263994216918945, -0.00031301379203796387, -0.0003033876419067383, -0.0002937614917755127, -0.0002841353416442871, -0.0002745091915130615, -0.00026488304138183594, -0.00025525689125061035, -0.00024563074111938477, -0.00023600459098815918, -0.0002263784408569336, -0.000216752290725708, -0.00020712614059448242, -0.00019749999046325684, -0.00018787384033203125, -0.00017824769020080566, -0.00016862154006958008, -0.0001589953899383545, -0.0001493692398071289, -0.00013974308967590332, -0.00013011693954467773, -0.00012049078941345215, -0.00011086463928222656, -0.00010123848915100098, -9.161233901977539e-05, -8.19861888885498e-05, -7.236003875732422e-05, -6.273388862609863e-05, -5.310773849487305e-05, -4.348158836364746e-05, -3.3855438232421875e-05, -2.422928810119629e-05, -1.4603137969970703e-05, -4.976987838745117e-06, 4.649162292480469e-06, 1.4275312423706055e-05, 2.390146255493164e-05, 3.3527612686157227e-05, 4.315376281738281e-05, 5.27799129486084e-05, 6.240606307983398e-05, 7.203221321105957e-05, 8.165836334228516e-05, 9.128451347351074e-05, 0.00010091066360473633, 0.00011053681373596191, 0.0001201629638671875, 0.00012978911399841309, 0.00013941526412963867, 0.00014904141426086426, 0.00015866756439208984, 0.00016829371452331543, 0.00017791986465454102, 0.0001875460147857666, 0.0001971721649169922, 0.00020679831504821777, 0.00021642446517944336, 0.00022605061531066895, 0.00023567676544189453, 0.0002453029155731201, 0.0002549290657043457, 0.0002645552158355713, 0.0002741813659667969]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 5.0, 7.0, 13.0, 23.0, 40.0, 76.0, 114.0, 211.0, 501.0, 1953.0, 22671.0, 980118.0, 39086.0, 2591.0, 565.0, 234.0, 125.0, 93.0, 55.0, 29.0, 18.0, 8.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.8203125, -3.706512451171875, -3.59271240234375, -3.478912353515625, -3.3651123046875, -3.251312255859375, -3.13751220703125, -3.023712158203125, -2.909912109375, -2.796112060546875, -2.68231201171875, -2.568511962890625, -2.4547119140625, -2.340911865234375, -2.22711181640625, -2.113311767578125, -1.99951171875, -1.885711669921875, -1.77191162109375, -1.658111572265625, -1.5443115234375, -1.430511474609375, -1.31671142578125, -1.202911376953125, -1.089111328125, -0.975311279296875, -0.86151123046875, -0.747711181640625, -0.6339111328125, -0.520111083984375, -0.40631103515625, -0.292510986328125, -0.1787109375, -0.064910888671875, 0.04888916015625, 0.162689208984375, 0.2764892578125, 0.390289306640625, 0.50408935546875, 0.617889404296875, 0.731689453125, 0.845489501953125, 0.95928955078125, 1.073089599609375, 1.1868896484375, 1.300689697265625, 1.41448974609375, 1.528289794921875, 1.64208984375, 1.755889892578125, 1.86968994140625, 1.983489990234375, 2.0972900390625, 2.211090087890625, 2.32489013671875, 2.438690185546875, 2.552490234375, 2.666290283203125, 2.78009033203125, 2.893890380859375, 3.0076904296875, 3.121490478515625, 3.23529052734375, 3.349090576171875, 3.462890625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 7.0, 13.0, 18.0, 48.0, 99.0, 177.0, 228.0, 193.0, 113.0, 50.0, 28.0, 11.0, 10.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8857421875, -1.8241424560546875, -1.762542724609375, -1.7009429931640625, -1.63934326171875, -1.5777435302734375, -1.516143798828125, -1.4545440673828125, -1.3929443359375, -1.3313446044921875, -1.269744873046875, -1.2081451416015625, -1.14654541015625, -1.0849456787109375, -1.023345947265625, -0.9617462158203125, -0.900146484375, -0.8385467529296875, -0.776947021484375, -0.7153472900390625, -0.65374755859375, -0.5921478271484375, -0.530548095703125, -0.4689483642578125, -0.4073486328125, -0.3457489013671875, -0.284149169921875, -0.2225494384765625, -0.16094970703125, -0.0993499755859375, -0.037750244140625, 0.0238494873046875, 0.08544921875, 0.1470489501953125, 0.208648681640625, 0.2702484130859375, 0.33184814453125, 0.3934478759765625, 0.455047607421875, 0.5166473388671875, 0.5782470703125, 0.6398468017578125, 0.701446533203125, 0.7630462646484375, 0.82464599609375, 0.8862457275390625, 0.947845458984375, 1.0094451904296875, 1.071044921875, 1.1326446533203125, 1.194244384765625, 1.2558441162109375, 1.31744384765625, 1.3790435791015625, 1.440643310546875, 1.5022430419921875, 1.5638427734375, 1.6254425048828125, 1.687042236328125, 1.7486419677734375, 1.81024169921875, 1.8718414306640625, 1.933441162109375, 1.9950408935546875, 2.056640625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 12.0, 31.0, 113.0, 272.0, 291.0, 178.0, 61.0, 29.0, 12.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.77569580078125, -41.7070198059082, -40.63833999633789, -39.569664001464844, -38.50098419189453, -37.432308197021484, -36.36362838745117, -35.294952392578125, -34.22627258300781, -33.157596588134766, -32.08891677856445, -31.020238876342773, -29.951560974121094, -28.882884979248047, -27.814207077026367, -26.745529174804688, -25.67685317993164, -24.60817527770996, -23.53949737548828, -22.4708194732666, -21.402141571044922, -20.333465576171875, -19.264787673950195, -18.196109771728516, -17.127431869506836, -16.058753967285156, -14.990076065063477, -13.921399116516113, -12.852721214294434, -11.784043312072754, -10.71536636352539, -9.646688461303711, -8.578006744384766, -7.509328842163086, -6.4406514167785645, -5.371973991394043, -4.303296089172363, -3.2346181869506836, -2.165940761566162, -1.0972633361816406, -0.028585433959960938, 1.0400922298431396, 2.1087698936462402, 3.177447557449341, 4.246125221252441, 5.314803123474121, 6.383480548858643, 7.452157974243164, 8.520835876464844, 9.589513778686523, 10.658191680908203, 11.726868629455566, 12.795546531677246, 13.864224433898926, 14.932901382446289, 16.00157928466797, 17.07025718688965, 18.138935089111328, 19.207612991333008, 20.276290893554688, 21.344966888427734, 22.413646697998047, 23.482322692871094, 24.551000595092773, 25.619678497314453]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 3.0, 5.0, 6.0, 9.0, 11.0, 21.0, 19.0, 11.0, 21.0, 28.0, 28.0, 40.0, 52.0, 41.0, 53.0, 56.0, 54.0, 44.0, 58.0, 62.0, 41.0, 56.0, 49.0, 39.0, 33.0, 28.0, 19.0, 19.0, 18.0, 12.0, 16.0, 11.0, 12.0, 9.0, 8.0, 5.0, 4.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.453246116638184, -8.151788711547852, -7.8503313064575195, -7.548873424530029, -7.247416019439697, -6.945958614349365, -6.644500732421875, -6.343043327331543, -6.041585922241211, -5.740128517150879, -5.438671112060547, -5.137213230133057, -4.835755825042725, -4.534298419952393, -4.232840538024902, -3.9313831329345703, -3.6299257278442383, -3.3284683227539062, -3.027010679244995, -2.725553035736084, -2.424095630645752, -2.12263822555542, -1.8211805820465088, -1.5197229385375977, -1.2182655334472656, -0.916808009147644, -0.6153504848480225, -0.3138929605484009, -0.012435436248779297, 0.2890220880508423, 0.5904796123504639, 0.891937255859375, 1.193394660949707, 1.4948521852493286, 1.7963097095489502, 2.0977673530578613, 2.3992247581481934, 2.7006821632385254, 3.0021398067474365, 3.3035974502563477, 3.6050548553466797, 3.9065122604370117, 4.207969665527344, 4.509427547454834, 4.810884952545166, 5.112342357635498, 5.413800239562988, 5.71525764465332, 6.016715049743652, 6.318172454833984, 6.619629859924316, 6.921087741851807, 7.222545146942139, 7.524002552032471, 7.825460433959961, 8.126917839050293, 8.428375244140625, 8.729832649230957, 9.031290054321289, 9.332747459411621, 9.634204864501953, 9.935663223266602, 10.237120628356934, 10.538578033447266, 10.840035438537598]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 6.0, 1.0, 7.0, 8.0, 7.0, 7.0, 14.0, 17.0, 24.0, 29.0, 46.0, 58.0, 98.0, 231.0, 418.0, 1048.0, 3076.0, 13262.0, 197128.0, 3945447.0, 25011.0, 5053.0, 1708.0, 686.0, 366.0, 183.0, 128.0, 75.0, 38.0, 43.0, 22.0, 15.0, 8.0, 2.0, 2.0, 6.0, 2.0, 2.0, 1.0, 2.0], "bins": [-8.4296875, -8.23443603515625, -8.0391845703125, -7.84393310546875, -7.648681640625, -7.45343017578125, -7.2581787109375, -7.06292724609375, -6.86767578125, -6.67242431640625, -6.4771728515625, -6.28192138671875, -6.086669921875, -5.89141845703125, -5.6961669921875, -5.50091552734375, -5.3056640625, -5.11041259765625, -4.9151611328125, -4.71990966796875, -4.524658203125, -4.32940673828125, -4.1341552734375, -3.93890380859375, -3.74365234375, -3.54840087890625, -3.3531494140625, -3.15789794921875, -2.962646484375, -2.76739501953125, -2.5721435546875, -2.37689208984375, -2.181640625, -1.98638916015625, -1.7911376953125, -1.59588623046875, -1.400634765625, -1.20538330078125, -1.0101318359375, -0.81488037109375, -0.61962890625, -0.42437744140625, -0.2291259765625, -0.03387451171875, 0.161376953125, 0.35662841796875, 0.5518798828125, 0.74713134765625, 0.9423828125, 1.13763427734375, 1.3328857421875, 1.52813720703125, 1.723388671875, 1.91864013671875, 2.1138916015625, 2.30914306640625, 2.50439453125, 2.69964599609375, 2.8948974609375, 3.09014892578125, 3.285400390625, 3.48065185546875, 3.6759033203125, 3.87115478515625, 4.06640625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 7.0, 2.0, 2.0, 7.0, 15.0, 34.0, 27.0, 39.0, 38.0, 80.0, 54.0, 80.0, 89.0, 84.0, 75.0, 85.0, 62.0, 70.0, 41.0, 30.0, 32.0, 14.0, 13.0, 6.0, 7.0, 1.0, 7.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.71826171875, -0.6954193115234375, -0.672576904296875, -0.6497344970703125, -0.62689208984375, -0.6040496826171875, -0.581207275390625, -0.5583648681640625, -0.5355224609375, -0.5126800537109375, -0.489837646484375, -0.4669952392578125, -0.44415283203125, -0.4213104248046875, -0.398468017578125, -0.3756256103515625, -0.352783203125, -0.3299407958984375, -0.307098388671875, -0.2842559814453125, -0.26141357421875, -0.2385711669921875, -0.215728759765625, -0.1928863525390625, -0.1700439453125, -0.1472015380859375, -0.124359130859375, -0.1015167236328125, -0.07867431640625, -0.0558319091796875, -0.032989501953125, -0.0101470947265625, 0.0126953125, 0.0355377197265625, 0.058380126953125, 0.0812225341796875, 0.10406494140625, 0.1269073486328125, 0.149749755859375, 0.1725921630859375, 0.1954345703125, 0.2182769775390625, 0.241119384765625, 0.2639617919921875, 0.28680419921875, 0.3096466064453125, 0.332489013671875, 0.3553314208984375, 0.378173828125, 0.4010162353515625, 0.423858642578125, 0.4467010498046875, 0.46954345703125, 0.4923858642578125, 0.515228271484375, 0.5380706787109375, 0.5609130859375, 0.5837554931640625, 0.606597900390625, 0.6294403076171875, 0.65228271484375, 0.6751251220703125, 0.697967529296875, 0.7208099365234375, 0.74365234375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 4.0, 11.0, 4.0, 10.0, 11.0, 18.0, 15.0, 25.0, 46.0, 60.0, 79.0, 111.0, 160.0, 216.0, 397.0, 790.0, 1691.0, 4313.0, 14182.0, 79990.0, 3941788.0, 123415.0, 17794.0, 5141.0, 1939.0, 873.0, 449.0, 262.0, 176.0, 87.0, 71.0, 41.0, 27.0, 22.0, 25.0, 14.0, 10.0, 8.0, 1.0, 5.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0], "bins": [-5.50390625, -5.357452392578125, -5.21099853515625, -5.064544677734375, -4.9180908203125, -4.771636962890625, -4.62518310546875, -4.478729248046875, -4.332275390625, -4.185821533203125, -4.03936767578125, -3.892913818359375, -3.7464599609375, -3.600006103515625, -3.45355224609375, -3.307098388671875, -3.16064453125, -3.014190673828125, -2.86773681640625, -2.721282958984375, -2.5748291015625, -2.428375244140625, -2.28192138671875, -2.135467529296875, -1.989013671875, -1.842559814453125, -1.69610595703125, -1.549652099609375, -1.4031982421875, -1.256744384765625, -1.11029052734375, -0.963836669921875, -0.8173828125, -0.670928955078125, -0.52447509765625, -0.378021240234375, -0.2315673828125, -0.085113525390625, 0.06134033203125, 0.207794189453125, 0.354248046875, 0.500701904296875, 0.64715576171875, 0.793609619140625, 0.9400634765625, 1.086517333984375, 1.23297119140625, 1.379425048828125, 1.52587890625, 1.672332763671875, 1.81878662109375, 1.965240478515625, 2.1116943359375, 2.258148193359375, 2.40460205078125, 2.551055908203125, 2.697509765625, 2.843963623046875, 2.99041748046875, 3.136871337890625, 3.2833251953125, 3.429779052734375, 3.57623291015625, 3.722686767578125, 3.869140625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 3.0, 5.0, 4.0, 12.0, 19.0, 33.0, 32.0, 70.0, 148.0, 673.0, 2618.0, 228.0, 94.0, 37.0, 22.0, 24.0, 16.0, 9.0, 7.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-2.314453125, -2.2632522583007812, -2.2120513916015625, -2.1608505249023438, -2.109649658203125, -2.0584487915039062, -2.0072479248046875, -1.9560470581054688, -1.90484619140625, -1.8536453247070312, -1.8024444580078125, -1.7512435913085938, -1.700042724609375, -1.6488418579101562, -1.5976409912109375, -1.5464401245117188, -1.4952392578125, -1.4440383911132812, -1.3928375244140625, -1.3416366577148438, -1.290435791015625, -1.2392349243164062, -1.1880340576171875, -1.1368331909179688, -1.08563232421875, -1.0344314575195312, -0.9832305908203125, -0.9320297241210938, -0.880828857421875, -0.8296279907226562, -0.7784271240234375, -0.7272262573242188, -0.676025390625, -0.6248245239257812, -0.5736236572265625, -0.5224227905273438, -0.471221923828125, -0.42002105712890625, -0.3688201904296875, -0.31761932373046875, -0.26641845703125, -0.21521759033203125, -0.1640167236328125, -0.11281585693359375, -0.061614990234375, -0.01041412353515625, 0.0407867431640625, 0.09198760986328125, 0.1431884765625, 0.19438934326171875, 0.2455902099609375, 0.29679107666015625, 0.347991943359375, 0.39919281005859375, 0.4503936767578125, 0.5015945434570312, 0.55279541015625, 0.6039962768554688, 0.6551971435546875, 0.7063980102539062, 0.757598876953125, 0.8087997436523438, 0.8600006103515625, 0.9112014770507812, 0.96240234375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 9.0, 6.0, 16.0, 22.0, 72.0, 149.0, 237.0, 249.0, 154.0, 52.0, 20.0, 8.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.933156967163086, -7.572983741760254, -7.212810516357422, -6.85263729095459, -6.492464065551758, -6.132290840148926, -5.7721171379089355, -5.4119439125061035, -5.0517706871032715, -4.6915974617004395, -4.331424236297607, -3.9712507724761963, -3.6110775470733643, -3.2509043216705322, -2.890730857849121, -2.530557632446289, -2.170384407043457, -1.810211181640625, -1.4500378370285034, -1.0898644924163818, -0.7296912670135498, -0.3695180416107178, -0.00934457778930664, 0.3508286476135254, 0.7110018730163574, 1.0711750984191895, 1.431348443031311, 1.7915217876434326, 2.1516950130462646, 2.5118682384490967, 2.872041702270508, 3.23221492767334, 3.5923891067504883, 3.9525623321533203, 4.312735557556152, 4.672908782958984, 5.033082008361816, 5.393255233764648, 5.753428936004639, 6.113602161407471, 6.473775386810303, 6.833948612213135, 7.194121837615967, 7.554295539855957, 7.914468765258789, 8.274641990661621, 8.634815216064453, 8.994988441467285, 9.355161666870117, 9.71533489227295, 10.075508117675781, 10.435681343078613, 10.795854568481445, 11.156027793884277, 11.51620101928711, 11.876375198364258, 12.236547470092773, 12.596720695495605, 12.956893920898438, 13.31706714630127, 13.677240371704102, 14.037413597106934, 14.397586822509766, 14.757761001586914, 15.117934226989746]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 0.0, 7.0, 5.0, 4.0, 8.0, 10.0, 12.0, 16.0, 21.0, 20.0, 36.0, 46.0, 38.0, 46.0, 44.0, 67.0, 76.0, 58.0, 63.0, 54.0, 50.0, 64.0, 42.0, 53.0, 25.0, 39.0, 27.0, 21.0, 12.0, 5.0, 9.0, 14.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.75924015045166, -4.625065803527832, -4.490890979766846, -4.356716632843018, -4.222541809082031, -4.088367462158203, -3.954193115234375, -3.8200185298919678, -3.6858439445495605, -3.5516693592071533, -3.417494773864746, -3.283320426940918, -3.1491458415985107, -3.0149712562561035, -2.8807969093322754, -2.746622323989868, -2.612447738647461, -2.4782731533050537, -2.3440985679626465, -2.2099242210388184, -2.075749635696411, -1.941575050354004, -1.8074005842208862, -1.6732261180877686, -1.5390515327453613, -1.404876947402954, -1.2707024812698364, -1.1365280151367188, -1.0023534297943115, -0.8681789040565491, -0.7340043783187866, -0.5998298525810242, -0.4656558036804199, -0.33148127794265747, -0.19730675220489502, -0.06313222646713257, 0.07104229927062988, 0.20521682500839233, 0.3393913507461548, 0.47356587648391724, 0.6077404022216797, 0.7419149279594421, 0.8760894536972046, 1.0102639198303223, 1.1444385051727295, 1.2786130905151367, 1.4127875566482544, 1.546962022781372, 1.6811366081237793, 1.8153111934661865, 1.9494856595993042, 2.083660125732422, 2.217834711074829, 2.3520092964172363, 2.4861836433410645, 2.6203582286834717, 2.754532814025879, 2.888707399368286, 3.0228819847106934, 3.1570563316345215, 3.2912309169769287, 3.425405502319336, 3.559579849243164, 3.6937544345855713, 3.8279290199279785]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 3.0, 4.0, 1.0, 5.0, 11.0, 14.0, 25.0, 34.0, 67.0, 131.0, 275.0, 622.0, 1712.0, 6728.0, 55446.0, 786768.0, 178628.0, 13747.0, 2640.0, 872.0, 357.0, 181.0, 101.0, 58.0, 39.0, 26.0, 20.0, 12.0, 7.0, 8.0, 6.0, 5.0, 3.0, 1.0, 3.0, 3.0], "bins": [-7.87890625, -7.6986083984375, -7.518310546875, -7.3380126953125, -7.15771484375, -6.9774169921875, -6.797119140625, -6.6168212890625, -6.4365234375, -6.2562255859375, -6.075927734375, -5.8956298828125, -5.71533203125, -5.5350341796875, -5.354736328125, -5.1744384765625, -4.994140625, -4.8138427734375, -4.633544921875, -4.4532470703125, -4.27294921875, -4.0926513671875, -3.912353515625, -3.7320556640625, -3.5517578125, -3.3714599609375, -3.191162109375, -3.0108642578125, -2.83056640625, -2.6502685546875, -2.469970703125, -2.2896728515625, -2.109375, -1.9290771484375, -1.748779296875, -1.5684814453125, -1.38818359375, -1.2078857421875, -1.027587890625, -0.8472900390625, -0.6669921875, -0.4866943359375, -0.306396484375, -0.1260986328125, 0.05419921875, 0.2344970703125, 0.414794921875, 0.5950927734375, 0.775390625, 0.9556884765625, 1.135986328125, 1.3162841796875, 1.49658203125, 1.6768798828125, 1.857177734375, 2.0374755859375, 2.2177734375, 2.3980712890625, 2.578369140625, 2.7586669921875, 2.93896484375, 3.1192626953125, 3.299560546875, 3.4798583984375, 3.66015625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 1.0, 12.0, 11.0, 12.0, 18.0, 25.0, 42.0, 51.0, 70.0, 52.0, 52.0, 77.0, 84.0, 70.0, 54.0, 78.0, 58.0, 51.0, 45.0, 39.0, 27.0, 17.0, 17.0, 11.0, 12.0, 4.0, 7.0, 1.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.82470703125, -0.803070068359375, -0.78143310546875, -0.759796142578125, -0.7381591796875, -0.716522216796875, -0.69488525390625, -0.673248291015625, -0.651611328125, -0.629974365234375, -0.60833740234375, -0.586700439453125, -0.5650634765625, -0.543426513671875, -0.52178955078125, -0.500152587890625, -0.478515625, -0.456878662109375, -0.43524169921875, -0.413604736328125, -0.3919677734375, -0.370330810546875, -0.34869384765625, -0.327056884765625, -0.305419921875, -0.283782958984375, -0.26214599609375, -0.240509033203125, -0.2188720703125, -0.197235107421875, -0.17559814453125, -0.153961181640625, -0.13232421875, -0.110687255859375, -0.08905029296875, -0.067413330078125, -0.0457763671875, -0.024139404296875, -0.00250244140625, 0.019134521484375, 0.040771484375, 0.062408447265625, 0.08404541015625, 0.105682373046875, 0.1273193359375, 0.148956298828125, 0.17059326171875, 0.192230224609375, 0.2138671875, 0.235504150390625, 0.25714111328125, 0.278778076171875, 0.3004150390625, 0.322052001953125, 0.34368896484375, 0.365325927734375, 0.386962890625, 0.408599853515625, 0.43023681640625, 0.451873779296875, 0.4735107421875, 0.495147705078125, 0.51678466796875, 0.538421630859375, 0.56005859375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 4.0, 5.0, 4.0, 4.0, 10.0, 14.0, 33.0, 47.0, 75.0, 130.0, 215.0, 459.0, 1170.0, 2820.0, 8862.0, 33819.0, 174037.0, 588972.0, 187460.0, 35961.0, 9160.0, 3041.0, 1152.0, 529.0, 250.0, 128.0, 59.0, 48.0, 31.0, 19.0, 14.0, 7.0, 7.0, 7.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-2.763671875, -2.691925048828125, -2.62017822265625, -2.548431396484375, -2.4766845703125, -2.404937744140625, -2.33319091796875, -2.261444091796875, -2.189697265625, -2.117950439453125, -2.04620361328125, -1.974456787109375, -1.9027099609375, -1.830963134765625, -1.75921630859375, -1.687469482421875, -1.61572265625, -1.543975830078125, -1.47222900390625, -1.400482177734375, -1.3287353515625, -1.256988525390625, -1.18524169921875, -1.113494873046875, -1.041748046875, -0.970001220703125, -0.89825439453125, -0.826507568359375, -0.7547607421875, -0.683013916015625, -0.61126708984375, -0.539520263671875, -0.4677734375, -0.396026611328125, -0.32427978515625, -0.252532958984375, -0.1807861328125, -0.109039306640625, -0.03729248046875, 0.034454345703125, 0.106201171875, 0.177947998046875, 0.24969482421875, 0.321441650390625, 0.3931884765625, 0.464935302734375, 0.53668212890625, 0.608428955078125, 0.68017578125, 0.751922607421875, 0.82366943359375, 0.895416259765625, 0.9671630859375, 1.038909912109375, 1.11065673828125, 1.182403564453125, 1.254150390625, 1.325897216796875, 1.39764404296875, 1.469390869140625, 1.5411376953125, 1.612884521484375, 1.68463134765625, 1.756378173828125, 1.828125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 10.0, 6.0, 8.0, 8.0, 15.0, 10.0, 16.0, 21.0, 16.0, 33.0, 25.0, 32.0, 36.0, 34.0, 46.0, 31.0, 43.0, 45.0, 37.0, 41.0, 45.0, 48.0, 33.0, 43.0, 42.0, 41.0, 32.0, 29.0, 24.0, 29.0, 15.0, 14.0, 15.0, 18.0, 11.0, 17.0, 9.0, 6.0, 4.0, 0.0, 2.0, 2.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.634765625, -1.5825347900390625, -1.530303955078125, -1.4780731201171875, -1.42584228515625, -1.3736114501953125, -1.321380615234375, -1.2691497802734375, -1.2169189453125, -1.1646881103515625, -1.112457275390625, -1.0602264404296875, -1.00799560546875, -0.9557647705078125, -0.903533935546875, -0.8513031005859375, -0.799072265625, -0.7468414306640625, -0.694610595703125, -0.6423797607421875, -0.59014892578125, -0.5379180908203125, -0.485687255859375, -0.4334564208984375, -0.3812255859375, -0.3289947509765625, -0.276763916015625, -0.2245330810546875, -0.17230224609375, -0.1200714111328125, -0.067840576171875, -0.0156097412109375, 0.03662109375, 0.0888519287109375, 0.141082763671875, 0.1933135986328125, 0.24554443359375, 0.2977752685546875, 0.350006103515625, 0.4022369384765625, 0.4544677734375, 0.5066986083984375, 0.558929443359375, 0.6111602783203125, 0.66339111328125, 0.7156219482421875, 0.767852783203125, 0.8200836181640625, 0.872314453125, 0.9245452880859375, 0.976776123046875, 1.0290069580078125, 1.08123779296875, 1.1334686279296875, 1.185699462890625, 1.2379302978515625, 1.2901611328125, 1.3423919677734375, 1.394622802734375, 1.4468536376953125, 1.49908447265625, 1.5513153076171875, 1.603546142578125, 1.6557769775390625, 1.7080078125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 3.0, 1.0, 5.0, 6.0, 6.0, 12.0, 12.0, 25.0, 20.0, 48.0, 52.0, 109.0, 149.0, 263.0, 406.0, 837.0, 1545.0, 3384.0, 7211.0, 19127.0, 59905.0, 244421.0, 476363.0, 166150.0, 42623.0, 14383.0, 5860.0, 2685.0, 1229.0, 683.0, 401.0, 195.0, 137.0, 83.0, 67.0, 38.0, 27.0, 18.0, 21.0, 8.0, 12.0, 7.0, 3.0, 3.0, 4.0, 2.0, 9.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.65771484375, -0.63531494140625, -0.6129150390625, -0.59051513671875, -0.568115234375, -0.54571533203125, -0.5233154296875, -0.50091552734375, -0.478515625, -0.45611572265625, -0.4337158203125, -0.41131591796875, -0.388916015625, -0.36651611328125, -0.3441162109375, -0.32171630859375, -0.29931640625, -0.27691650390625, -0.2545166015625, -0.23211669921875, -0.209716796875, -0.18731689453125, -0.1649169921875, -0.14251708984375, -0.1201171875, -0.09771728515625, -0.0753173828125, -0.05291748046875, -0.030517578125, -0.00811767578125, 0.0142822265625, 0.03668212890625, 0.05908203125, 0.08148193359375, 0.1038818359375, 0.12628173828125, 0.148681640625, 0.17108154296875, 0.1934814453125, 0.21588134765625, 0.23828125, 0.26068115234375, 0.2830810546875, 0.30548095703125, 0.327880859375, 0.35028076171875, 0.3726806640625, 0.39508056640625, 0.41748046875, 0.43988037109375, 0.4622802734375, 0.48468017578125, 0.507080078125, 0.52947998046875, 0.5518798828125, 0.57427978515625, 0.5966796875, 0.61907958984375, 0.6414794921875, 0.66387939453125, 0.686279296875, 0.70867919921875, 0.7310791015625, 0.75347900390625, 0.77587890625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 4.0, 5.0, 9.0, 7.0, 12.0, 12.0, 17.0, 19.0, 24.0, 33.0, 54.0, 87.0, 104.0, 121.0, 143.0, 94.0, 64.0, 58.0, 30.0, 23.0, 18.0, 13.0, 7.0, 13.0, 7.0, 4.0, 7.0, 2.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001533031463623047, -0.000146571546792984, -0.00013983994722366333, -0.00013310834765434265, -0.00012637674808502197, -0.0001196451485157013, -0.00011291354894638062, -0.00010618194937705994, -9.945034980773926e-05, -9.271875023841858e-05, -8.59871506690979e-05, -7.925555109977722e-05, -7.252395153045654e-05, -6.579235196113586e-05, -5.9060752391815186e-05, -5.232915282249451e-05, -4.559755325317383e-05, -3.886595368385315e-05, -3.213435411453247e-05, -2.5402754545211792e-05, -1.8671154975891113e-05, -1.1939555406570435e-05, -5.207955837249756e-06, 1.5236437320709229e-06, 8.255243301391602e-06, 1.498684287071228e-05, 2.171844244003296e-05, 2.8450042009353638e-05, 3.5181641578674316e-05, 4.1913241147994995e-05, 4.8644840717315674e-05, 5.537644028663635e-05, 6.210803985595703e-05, 6.883963942527771e-05, 7.557123899459839e-05, 8.230283856391907e-05, 8.903443813323975e-05, 9.576603770256042e-05, 0.0001024976372718811, 0.00010922923684120178, 0.00011596083641052246, 0.00012269243597984314, 0.00012942403554916382, 0.0001361556351184845, 0.00014288723468780518, 0.00014961883425712585, 0.00015635043382644653, 0.0001630820333957672, 0.0001698136329650879, 0.00017654523253440857, 0.00018327683210372925, 0.00019000843167304993, 0.0001967400312423706, 0.00020347163081169128, 0.00021020323038101196, 0.00021693482995033264, 0.00022366642951965332, 0.000230398029088974, 0.00023712962865829468, 0.00024386122822761536, 0.00025059282779693604, 0.0002573244273662567, 0.0002640560269355774, 0.00027078762650489807, 0.00027751922607421875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 3.0, 5.0, 6.0, 9.0, 12.0, 16.0, 16.0, 29.0, 26.0, 46.0, 73.0, 85.0, 136.0, 197.0, 358.0, 565.0, 994.0, 1918.0, 3676.0, 8534.0, 22773.0, 79670.0, 334834.0, 431064.0, 113249.0, 29979.0, 10642.0, 4603.0, 2109.0, 1131.0, 628.0, 393.0, 242.0, 159.0, 90.0, 83.0, 52.0, 38.0, 25.0, 26.0, 15.0, 21.0, 5.0, 4.0, 3.0, 6.0, 2.0, 2.0, 2.0, 2.0, 5.0, 3.0], "bins": [-0.810546875, -0.7874679565429688, -0.7643890380859375, -0.7413101196289062, -0.718231201171875, -0.6951522827148438, -0.6720733642578125, -0.6489944458007812, -0.62591552734375, -0.6028366088867188, -0.5797576904296875, -0.5566787719726562, -0.533599853515625, -0.5105209350585938, -0.4874420166015625, -0.46436309814453125, -0.4412841796875, -0.41820526123046875, -0.3951263427734375, -0.37204742431640625, -0.348968505859375, -0.32588958740234375, -0.3028106689453125, -0.27973175048828125, -0.25665283203125, -0.23357391357421875, -0.2104949951171875, -0.18741607666015625, -0.164337158203125, -0.14125823974609375, -0.1181793212890625, -0.09510040283203125, -0.072021484375, -0.04894256591796875, -0.0258636474609375, -0.00278472900390625, 0.020294189453125, 0.04337310791015625, 0.0664520263671875, 0.08953094482421875, 0.11260986328125, 0.13568878173828125, 0.1587677001953125, 0.18184661865234375, 0.204925537109375, 0.22800445556640625, 0.2510833740234375, 0.27416229248046875, 0.2972412109375, 0.32032012939453125, 0.3433990478515625, 0.36647796630859375, 0.389556884765625, 0.41263580322265625, 0.4357147216796875, 0.45879364013671875, 0.48187255859375, 0.5049514770507812, 0.5280303955078125, 0.5511093139648438, 0.574188232421875, 0.5972671508789062, 0.6203460693359375, 0.6434249877929688, 0.66650390625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 6.0, 6.0, 9.0, 9.0, 7.0, 17.0, 22.0, 31.0, 42.0, 54.0, 57.0, 75.0, 63.0, 74.0, 77.0, 72.0, 79.0, 63.0, 51.0, 44.0, 41.0, 15.0, 19.0, 13.0, 8.0, 11.0, 13.0, 4.0, 6.0, 5.0, 5.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66943359375, -0.6479644775390625, -0.626495361328125, -0.6050262451171875, -0.58355712890625, -0.5620880126953125, -0.540618896484375, -0.5191497802734375, -0.4976806640625, -0.4762115478515625, -0.454742431640625, -0.4332733154296875, -0.41180419921875, -0.3903350830078125, -0.368865966796875, -0.3473968505859375, -0.325927734375, -0.3044586181640625, -0.282989501953125, -0.2615203857421875, -0.24005126953125, -0.2185821533203125, -0.197113037109375, -0.1756439208984375, -0.1541748046875, -0.1327056884765625, -0.111236572265625, -0.0897674560546875, -0.06829833984375, -0.0468292236328125, -0.025360107421875, -0.0038909912109375, 0.017578125, 0.0390472412109375, 0.060516357421875, 0.0819854736328125, 0.10345458984375, 0.1249237060546875, 0.146392822265625, 0.1678619384765625, 0.1893310546875, 0.2108001708984375, 0.232269287109375, 0.2537384033203125, 0.27520751953125, 0.2966766357421875, 0.318145751953125, 0.3396148681640625, 0.361083984375, 0.3825531005859375, 0.404022216796875, 0.4254913330078125, 0.44696044921875, 0.4684295654296875, 0.489898681640625, 0.5113677978515625, 0.5328369140625, 0.5543060302734375, 0.575775146484375, 0.5972442626953125, 0.61871337890625, 0.6401824951171875, 0.661651611328125, 0.6831207275390625, 0.70458984375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 7.0, 13.0, 30.0, 54.0, 88.0, 135.0, 161.0, 161.0, 131.0, 97.0, 51.0, 29.0, 22.0, 14.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.505455017089844, -17.974851608276367, -17.444246292114258, -16.91364288330078, -16.383037567138672, -15.852433204650879, -15.321828842163086, -14.79122543334961, -14.2606201171875, -13.730015754699707, -13.199411392211914, -12.668807029724121, -12.138202667236328, -11.607598304748535, -11.076993942260742, -10.546390533447266, -10.015786170959473, -9.48518180847168, -8.954577445983887, -8.423973083496094, -7.893368721008301, -7.362764358520508, -6.832160472869873, -6.30155611038208, -5.770951747894287, -5.240347385406494, -4.709743022918701, -4.179139137268066, -3.6485345363616943, -3.1179301738739014, -2.5873260498046875, -2.0567216873168945, -1.5261163711547852, -0.995512068271637, -0.46490776538848877, 0.06569647789001465, 0.5963008403778076, 1.1269052028656006, 1.6575093269348145, 2.1881136894226074, 2.7187180519104004, 3.2493224143981934, 3.7799267768859863, 4.310530662536621, 4.841135025024414, 5.371739387512207, 5.90234375, 6.432948112487793, 6.963552474975586, 7.494156837463379, 8.024761199951172, 8.555365562438965, 9.085969924926758, 9.61657428741455, 10.147178649902344, 10.67778205871582, 11.20838737487793, 11.738991737365723, 12.269596099853516, 12.800200462341309, 13.330804824829102, 13.861409187316895, 14.392013549804688, 14.922616958618164, 15.453221321105957]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 6.0, 14.0, 11.0, 12.0, 12.0, 18.0, 21.0, 16.0, 19.0, 23.0, 19.0, 20.0, 26.0, 35.0, 31.0, 29.0, 40.0, 38.0, 45.0, 49.0, 48.0, 51.0, 39.0, 28.0, 34.0, 27.0, 41.0, 22.0, 40.0, 34.0, 23.0, 22.0, 18.0, 16.0, 12.0, 7.0, 11.0, 9.0, 7.0, 8.0, 3.0, 5.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.645497798919678, -7.397172927856445, -7.148848056793213, -6.9005231857299805, -6.652198791503906, -6.403873920440674, -6.155549049377441, -5.907224178314209, -5.658899307250977, -5.410574436187744, -5.162249565124512, -4.9139251708984375, -4.665600299835205, -4.417275428771973, -4.16895055770874, -3.920625686645508, -3.6723012924194336, -3.423976421356201, -3.175651788711548, -2.9273269176483154, -2.679002285003662, -2.4306774139404297, -2.1823525428771973, -1.9340277910232544, -1.6857030391693115, -1.4373782873153687, -1.1890535354614258, -0.9407286643981934, -0.6924039125442505, -0.4440791606903076, -0.1957542896270752, 0.052570462226867676, 0.30089473724365234, 0.5492194890975952, 0.7975443005561829, 1.0458691120147705, 1.2941938638687134, 1.5425186157226562, 1.7908434867858887, 2.039168357849121, 2.2874929904937744, 2.535817861557007, 2.78414249420166, 3.0324673652648926, 3.280792236328125, 3.5291168689727783, 3.7774417400360107, 4.025766372680664, 4.2740912437438965, 4.522416114807129, 4.770740985870361, 5.019065856933594, 5.267390251159668, 5.5157151222229, 5.764039993286133, 6.012364864349365, 6.260689735412598, 6.50901460647583, 6.7573394775390625, 7.005663871765137, 7.253988742828369, 7.502313613891602, 7.750638484954834, 7.998963356018066, 8.24728775024414]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 1.0, 3.0, 7.0, 5.0, 8.0, 11.0, 14.0, 18.0, 29.0, 27.0, 48.0, 107.0, 162.0, 286.0, 495.0, 1100.0, 2477.0, 7637.0, 34494.0, 3837916.0, 277369.0, 22049.0, 5653.0, 2171.0, 956.0, 473.0, 299.0, 181.0, 89.0, 62.0, 50.0, 33.0, 14.0, 12.0, 9.0, 5.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.57421875, -6.40509033203125, -6.2359619140625, -6.06683349609375, -5.897705078125, -5.72857666015625, -5.5594482421875, -5.39031982421875, -5.22119140625, -5.05206298828125, -4.8829345703125, -4.71380615234375, -4.544677734375, -4.37554931640625, -4.2064208984375, -4.03729248046875, -3.8681640625, -3.69903564453125, -3.5299072265625, -3.36077880859375, -3.191650390625, -3.02252197265625, -2.8533935546875, -2.68426513671875, -2.51513671875, -2.34600830078125, -2.1768798828125, -2.00775146484375, -1.838623046875, -1.66949462890625, -1.5003662109375, -1.33123779296875, -1.162109375, -0.99298095703125, -0.8238525390625, -0.65472412109375, -0.485595703125, -0.31646728515625, -0.1473388671875, 0.02178955078125, 0.19091796875, 0.36004638671875, 0.5291748046875, 0.69830322265625, 0.867431640625, 1.03656005859375, 1.2056884765625, 1.37481689453125, 1.5439453125, 1.71307373046875, 1.8822021484375, 2.05133056640625, 2.220458984375, 2.38958740234375, 2.5587158203125, 2.72784423828125, 2.89697265625, 3.06610107421875, 3.2352294921875, 3.40435791015625, 3.573486328125, 3.74261474609375, 3.9117431640625, 4.08087158203125, 4.25]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 2.0, 6.0, 9.0, 9.0, 24.0, 21.0, 27.0, 29.0, 46.0, 38.0, 56.0, 57.0, 58.0, 67.0, 47.0, 72.0, 62.0, 54.0, 70.0, 50.0, 35.0, 36.0, 32.0, 25.0, 15.0, 12.0, 11.0, 10.0, 5.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.74560546875, -0.7253570556640625, -0.705108642578125, -0.6848602294921875, -0.66461181640625, -0.6443634033203125, -0.624114990234375, -0.6038665771484375, -0.5836181640625, -0.5633697509765625, -0.543121337890625, -0.5228729248046875, -0.50262451171875, -0.4823760986328125, -0.462127685546875, -0.4418792724609375, -0.421630859375, -0.4013824462890625, -0.381134033203125, -0.3608856201171875, -0.34063720703125, -0.3203887939453125, -0.300140380859375, -0.2798919677734375, -0.2596435546875, -0.2393951416015625, -0.219146728515625, -0.1988983154296875, -0.17864990234375, -0.1584014892578125, -0.138153076171875, -0.1179046630859375, -0.09765625, -0.0774078369140625, -0.057159423828125, -0.0369110107421875, -0.01666259765625, 0.0035858154296875, 0.023834228515625, 0.0440826416015625, 0.0643310546875, 0.0845794677734375, 0.104827880859375, 0.1250762939453125, 0.14532470703125, 0.1655731201171875, 0.185821533203125, 0.2060699462890625, 0.226318359375, 0.2465667724609375, 0.266815185546875, 0.2870635986328125, 0.30731201171875, 0.3275604248046875, 0.347808837890625, 0.3680572509765625, 0.3883056640625, 0.4085540771484375, 0.428802490234375, 0.4490509033203125, 0.46929931640625, 0.4895477294921875, 0.509796142578125, 0.5300445556640625, 0.55029296875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 5.0, 4.0, 9.0, 15.0, 14.0, 17.0, 23.0, 24.0, 29.0, 45.0, 75.0, 107.0, 156.0, 217.0, 367.0, 747.0, 1644.0, 4786.0, 19035.0, 157957.0, 3915877.0, 74369.0, 12442.0, 3421.0, 1279.0, 589.0, 356.0, 194.0, 133.0, 96.0, 62.0, 49.0, 33.0, 27.0, 19.0, 17.0, 13.0, 8.0, 13.0, 7.0, 4.0, 1.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.83984375, -4.698974609375, -4.55810546875, -4.417236328125, -4.2763671875, -4.135498046875, -3.99462890625, -3.853759765625, -3.712890625, -3.572021484375, -3.43115234375, -3.290283203125, -3.1494140625, -3.008544921875, -2.86767578125, -2.726806640625, -2.5859375, -2.445068359375, -2.30419921875, -2.163330078125, -2.0224609375, -1.881591796875, -1.74072265625, -1.599853515625, -1.458984375, -1.318115234375, -1.17724609375, -1.036376953125, -0.8955078125, -0.754638671875, -0.61376953125, -0.472900390625, -0.33203125, -0.191162109375, -0.05029296875, 0.090576171875, 0.2314453125, 0.372314453125, 0.51318359375, 0.654052734375, 0.794921875, 0.935791015625, 1.07666015625, 1.217529296875, 1.3583984375, 1.499267578125, 1.64013671875, 1.781005859375, 1.921875, 2.062744140625, 2.20361328125, 2.344482421875, 2.4853515625, 2.626220703125, 2.76708984375, 2.907958984375, 3.048828125, 3.189697265625, 3.33056640625, 3.471435546875, 3.6123046875, 3.753173828125, 3.89404296875, 4.034912109375, 4.17578125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 5.0, 6.0, 9.0, 19.0, 37.0, 78.0, 245.0, 3211.0, 296.0, 85.0, 39.0, 18.0, 13.0, 7.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.93359375, -1.854736328125, -1.77587890625, -1.697021484375, -1.6181640625, -1.539306640625, -1.46044921875, -1.381591796875, -1.302734375, -1.223876953125, -1.14501953125, -1.066162109375, -0.9873046875, -0.908447265625, -0.82958984375, -0.750732421875, -0.671875, -0.593017578125, -0.51416015625, -0.435302734375, -0.3564453125, -0.277587890625, -0.19873046875, -0.119873046875, -0.041015625, 0.037841796875, 0.11669921875, 0.195556640625, 0.2744140625, 0.353271484375, 0.43212890625, 0.510986328125, 0.58984375, 0.668701171875, 0.74755859375, 0.826416015625, 0.9052734375, 0.984130859375, 1.06298828125, 1.141845703125, 1.220703125, 1.299560546875, 1.37841796875, 1.457275390625, 1.5361328125, 1.614990234375, 1.69384765625, 1.772705078125, 1.8515625, 1.930419921875, 2.00927734375, 2.088134765625, 2.1669921875, 2.245849609375, 2.32470703125, 2.403564453125, 2.482421875, 2.561279296875, 2.64013671875, 2.718994140625, 2.7978515625, 2.876708984375, 2.95556640625, 3.034423828125, 3.11328125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 1.0, 4.0, 4.0, 12.0, 25.0, 61.0, 117.0, 256.0, 281.0, 143.0, 49.0, 23.0, 9.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.739609241485596, -5.422520637512207, -5.105432033538818, -4.78834342956543, -4.471254825592041, -4.154166221618652, -3.8370776176452637, -3.519989013671875, -3.2029004096984863, -2.8858118057250977, -2.568723201751709, -2.2516345977783203, -1.9345459938049316, -1.617457389831543, -1.3003687858581543, -0.9832801818847656, -0.666191577911377, -0.3491029739379883, -0.03201436996459961, 0.28507423400878906, 0.6021628379821777, 0.9192514419555664, 1.236340045928955, 1.5534286499023438, 1.8705172538757324, 2.187605857849121, 2.5046944618225098, 2.8217830657958984, 3.138871669769287, 3.455960273742676, 3.7730488777160645, 4.090137481689453, 4.4072265625, 4.724315166473389, 5.041403770446777, 5.358492374420166, 5.675580978393555, 5.992669582366943, 6.309758186340332, 6.626846790313721, 6.943935394287109, 7.261023998260498, 7.578112602233887, 7.895201206207275, 8.212289810180664, 8.529378890991211, 8.846467018127441, 9.163555145263672, 9.480644226074219, 9.797733306884766, 10.114821434020996, 10.431909561157227, 10.748998641967773, 11.06608772277832, 11.38317584991455, 11.700263977050781, 12.017353057861328, 12.334442138671875, 12.651530265808105, 12.968618392944336, 13.285707473754883, 13.60279655456543, 13.91988468170166, 14.23697280883789, 14.554061889648438]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 6.0, 15.0, 18.0, 29.0, 31.0, 40.0, 41.0, 56.0, 52.0, 57.0, 86.0, 83.0, 56.0, 69.0, 74.0, 59.0, 50.0, 33.0, 41.0, 24.0, 27.0, 17.0, 14.0, 4.0, 3.0, 7.0, 3.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.216091632843018, -5.058459758758545, -4.9008283615112305, -4.743196487426758, -4.585564613342285, -4.427933216094971, -4.270301342010498, -4.112669944763184, -3.955038070678711, -3.7974064350128174, -3.639774799346924, -3.482142925262451, -3.3245112895965576, -3.166879653930664, -3.0092477798461914, -2.851616144180298, -2.6939845085144043, -2.5363528728485107, -2.378721237182617, -2.2210893630981445, -2.063457727432251, -1.9058260917663574, -1.7481943368911743, -1.5905625820159912, -1.4329309463500977, -1.275299310684204, -1.117667555809021, -0.9600358605384827, -0.8024041652679443, -0.644772469997406, -0.4871407747268677, -0.32950901985168457, -0.17187786102294922, -0.014246165752410889, 0.14338552951812744, 0.30101722478866577, 0.4586489200592041, 0.6162806153297424, 0.7739123106002808, 0.9315440654754639, 1.0891757011413574, 1.246807336807251, 1.404439091682434, 1.5620708465576172, 1.7197024822235107, 1.8773341178894043, 2.034965991973877, 2.1925976276397705, 2.350229263305664, 2.5078608989715576, 2.665492534637451, 2.823124408721924, 2.9807560443878174, 3.138387680053711, 3.2960195541381836, 3.453651189804077, 3.6112828254699707, 3.7689144611358643, 3.926546096801758, 4.0841779708862305, 4.241809844970703, 4.399441242218018, 4.55707311630249, 4.714704513549805, 4.872336387634277]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 5.0, 6.0, 7.0, 12.0, 19.0, 15.0, 19.0, 44.0, 53.0, 94.0, 163.0, 258.0, 544.0, 1041.0, 2591.0, 7407.0, 29740.0, 166779.0, 615731.0, 179743.0, 31378.0, 7861.0, 2598.0, 1164.0, 555.0, 283.0, 160.0, 98.0, 55.0, 50.0, 27.0, 18.0, 11.0, 7.0, 9.0, 3.0, 1.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.5234375, -3.407989501953125, -3.29254150390625, -3.177093505859375, -3.0616455078125, -2.946197509765625, -2.83074951171875, -2.715301513671875, -2.599853515625, -2.484405517578125, -2.36895751953125, -2.253509521484375, -2.1380615234375, -2.022613525390625, -1.90716552734375, -1.791717529296875, -1.67626953125, -1.560821533203125, -1.44537353515625, -1.329925537109375, -1.2144775390625, -1.099029541015625, -0.98358154296875, -0.868133544921875, -0.752685546875, -0.637237548828125, -0.52178955078125, -0.406341552734375, -0.2908935546875, -0.175445556640625, -0.05999755859375, 0.055450439453125, 0.1708984375, 0.286346435546875, 0.40179443359375, 0.517242431640625, 0.6326904296875, 0.748138427734375, 0.86358642578125, 0.979034423828125, 1.094482421875, 1.209930419921875, 1.32537841796875, 1.440826416015625, 1.5562744140625, 1.671722412109375, 1.78717041015625, 1.902618408203125, 2.01806640625, 2.133514404296875, 2.24896240234375, 2.364410400390625, 2.4798583984375, 2.595306396484375, 2.71075439453125, 2.826202392578125, 2.941650390625, 3.057098388671875, 3.17254638671875, 3.287994384765625, 3.4034423828125, 3.518890380859375, 3.63433837890625, 3.749786376953125, 3.865234375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 7.0, 7.0, 7.0, 7.0, 4.0, 18.0, 23.0, 35.0, 42.0, 33.0, 45.0, 47.0, 62.0, 63.0, 54.0, 66.0, 55.0, 72.0, 56.0, 52.0, 40.0, 45.0, 39.0, 36.0, 24.0, 14.0, 18.0, 8.0, 5.0, 8.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.7763671875, -0.7540130615234375, -0.731658935546875, -0.7093048095703125, -0.68695068359375, -0.6645965576171875, -0.642242431640625, -0.6198883056640625, -0.5975341796875, -0.5751800537109375, -0.552825927734375, -0.5304718017578125, -0.50811767578125, -0.4857635498046875, -0.463409423828125, -0.4410552978515625, -0.418701171875, -0.3963470458984375, -0.373992919921875, -0.3516387939453125, -0.32928466796875, -0.3069305419921875, -0.284576416015625, -0.2622222900390625, -0.2398681640625, -0.2175140380859375, -0.195159912109375, -0.1728057861328125, -0.15045166015625, -0.1280975341796875, -0.105743408203125, -0.0833892822265625, -0.06103515625, -0.0386810302734375, -0.016326904296875, 0.0060272216796875, 0.02838134765625, 0.0507354736328125, 0.073089599609375, 0.0954437255859375, 0.1177978515625, 0.1401519775390625, 0.162506103515625, 0.1848602294921875, 0.20721435546875, 0.2295684814453125, 0.251922607421875, 0.2742767333984375, 0.296630859375, 0.3189849853515625, 0.341339111328125, 0.3636932373046875, 0.38604736328125, 0.4084014892578125, 0.430755615234375, 0.4531097412109375, 0.4754638671875, 0.4978179931640625, 0.520172119140625, 0.5425262451171875, 0.56488037109375, 0.5872344970703125, 0.609588623046875, 0.6319427490234375, 0.654296875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 6.0, 3.0, 16.0, 12.0, 16.0, 19.0, 29.0, 59.0, 72.0, 118.0, 132.0, 270.0, 427.0, 677.0, 1274.0, 2402.0, 4938.0, 10620.0, 25023.0, 63963.0, 180472.0, 380113.0, 235138.0, 85006.0, 31619.0, 13325.0, 6060.0, 2951.0, 1578.0, 864.0, 483.0, 298.0, 183.0, 143.0, 85.0, 61.0, 36.0, 18.0, 18.0, 11.0, 5.0, 3.0, 2.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4794921875, -1.4327239990234375, -1.385955810546875, -1.3391876220703125, -1.29241943359375, -1.2456512451171875, -1.198883056640625, -1.1521148681640625, -1.1053466796875, -1.0585784912109375, -1.011810302734375, -0.9650421142578125, -0.91827392578125, -0.8715057373046875, -0.824737548828125, -0.7779693603515625, -0.731201171875, -0.6844329833984375, -0.637664794921875, -0.5908966064453125, -0.54412841796875, -0.4973602294921875, -0.450592041015625, -0.4038238525390625, -0.3570556640625, -0.3102874755859375, -0.263519287109375, -0.2167510986328125, -0.16998291015625, -0.1232147216796875, -0.076446533203125, -0.0296783447265625, 0.01708984375, 0.0638580322265625, 0.110626220703125, 0.1573944091796875, 0.20416259765625, 0.2509307861328125, 0.297698974609375, 0.3444671630859375, 0.3912353515625, 0.4380035400390625, 0.484771728515625, 0.5315399169921875, 0.57830810546875, 0.6250762939453125, 0.671844482421875, 0.7186126708984375, 0.765380859375, 0.8121490478515625, 0.858917236328125, 0.9056854248046875, 0.95245361328125, 0.9992218017578125, 1.045989990234375, 1.0927581787109375, 1.1395263671875, 1.1862945556640625, 1.233062744140625, 1.2798309326171875, 1.32659912109375, 1.3733673095703125, 1.420135498046875, 1.4669036865234375, 1.513671875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 5.0, 3.0, 2.0, 7.0, 10.0, 13.0, 19.0, 24.0, 28.0, 26.0, 32.0, 22.0, 39.0, 44.0, 54.0, 54.0, 59.0, 61.0, 50.0, 44.0, 56.0, 50.0, 37.0, 33.0, 35.0, 38.0, 31.0, 33.0, 15.0, 16.0, 14.0, 10.0, 9.0, 4.0, 7.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2421875, -2.158538818359375, -2.07489013671875, -1.991241455078125, -1.9075927734375, -1.823944091796875, -1.74029541015625, -1.656646728515625, -1.572998046875, -1.489349365234375, -1.40570068359375, -1.322052001953125, -1.2384033203125, -1.154754638671875, -1.07110595703125, -0.987457275390625, -0.90380859375, -0.820159912109375, -0.73651123046875, -0.652862548828125, -0.5692138671875, -0.485565185546875, -0.40191650390625, -0.318267822265625, -0.234619140625, -0.150970458984375, -0.06732177734375, 0.016326904296875, 0.0999755859375, 0.183624267578125, 0.26727294921875, 0.350921630859375, 0.4345703125, 0.518218994140625, 0.60186767578125, 0.685516357421875, 0.7691650390625, 0.852813720703125, 0.93646240234375, 1.020111083984375, 1.103759765625, 1.187408447265625, 1.27105712890625, 1.354705810546875, 1.4383544921875, 1.522003173828125, 1.60565185546875, 1.689300537109375, 1.77294921875, 1.856597900390625, 1.94024658203125, 2.023895263671875, 2.1075439453125, 2.191192626953125, 2.27484130859375, 2.358489990234375, 2.442138671875, 2.525787353515625, 2.60943603515625, 2.693084716796875, 2.7767333984375, 2.860382080078125, 2.94403076171875, 3.027679443359375, 3.111328125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 2.0, 1.0, 6.0, 4.0, 17.0, 22.0, 36.0, 76.0, 149.0, 312.0, 687.0, 2152.0, 10304.0, 126406.0, 795970.0, 100250.0, 8927.0, 2034.0, 645.0, 265.0, 128.0, 69.0, 28.0, 25.0, 16.0, 9.0, 8.0, 3.0, 1.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2265625, -1.1783905029296875, -1.130218505859375, -1.0820465087890625, -1.03387451171875, -0.9857025146484375, -0.937530517578125, -0.8893585205078125, -0.8411865234375, -0.7930145263671875, -0.744842529296875, -0.6966705322265625, -0.64849853515625, -0.6003265380859375, -0.552154541015625, -0.5039825439453125, -0.455810546875, -0.4076385498046875, -0.359466552734375, -0.3112945556640625, -0.26312255859375, -0.2149505615234375, -0.166778564453125, -0.1186065673828125, -0.0704345703125, -0.0222625732421875, 0.025909423828125, 0.0740814208984375, 0.12225341796875, 0.1704254150390625, 0.218597412109375, 0.2667694091796875, 0.31494140625, 0.3631134033203125, 0.411285400390625, 0.4594573974609375, 0.50762939453125, 0.5558013916015625, 0.603973388671875, 0.6521453857421875, 0.7003173828125, 0.7484893798828125, 0.796661376953125, 0.8448333740234375, 0.89300537109375, 0.9411773681640625, 0.989349365234375, 1.0375213623046875, 1.085693359375, 1.1338653564453125, 1.182037353515625, 1.2302093505859375, 1.27838134765625, 1.3265533447265625, 1.374725341796875, 1.4228973388671875, 1.4710693359375, 1.5192413330078125, 1.567413330078125, 1.6155853271484375, 1.66375732421875, 1.7119293212890625, 1.760101318359375, 1.8082733154296875, 1.8564453125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 8.0, 5.0, 4.0, 9.0, 8.0, 13.0, 25.0, 30.0, 33.0, 51.0, 85.0, 74.0, 87.0, 104.0, 102.0, 106.0, 58.0, 51.0, 37.0, 22.0, 21.0, 19.0, 10.0, 6.0, 10.0, 5.0, 10.0, 1.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018525123596191406, -0.00017956271767616272, -0.00017387419939041138, -0.00016818568110466003, -0.0001624971628189087, -0.00015680864453315735, -0.000151120126247406, -0.00014543160796165466, -0.00013974308967590332, -0.00013405457139015198, -0.00012836605310440063, -0.0001226775348186493, -0.00011698901653289795, -0.0001113004982471466, -0.00010561197996139526, -9.992346167564392e-05, -9.423494338989258e-05, -8.854642510414124e-05, -8.285790681838989e-05, -7.716938853263855e-05, -7.148087024688721e-05, -6.579235196113586e-05, -6.010383367538452e-05, -5.441531538963318e-05, -4.8726797103881836e-05, -4.303827881813049e-05, -3.734976053237915e-05, -3.166124224662781e-05, -2.5972723960876465e-05, -2.0284205675125122e-05, -1.459568738937378e-05, -8.907169103622437e-06, -3.2186508178710938e-06, 2.469867467880249e-06, 8.158385753631592e-06, 1.3846904039382935e-05, 1.9535422325134277e-05, 2.522394061088562e-05, 3.091245889663696e-05, 3.6600977182388306e-05, 4.228949546813965e-05, 4.797801375389099e-05, 5.3666532039642334e-05, 5.935505032539368e-05, 6.504356861114502e-05, 7.073208689689636e-05, 7.64206051826477e-05, 8.210912346839905e-05, 8.779764175415039e-05, 9.348616003990173e-05, 9.917467832565308e-05, 0.00010486319661140442, 0.00011055171489715576, 0.0001162402331829071, 0.00012192875146865845, 0.0001276172697544098, 0.00013330578804016113, 0.00013899430632591248, 0.00014468282461166382, 0.00015037134289741516, 0.0001560598611831665, 0.00016174837946891785, 0.0001674368977546692, 0.00017312541604042053, 0.00017881393432617188]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 2.0, 3.0, 4.0, 5.0, 12.0, 17.0, 21.0, 30.0, 63.0, 123.0, 219.0, 475.0, 1160.0, 3499.0, 16647.0, 158809.0, 706424.0, 140395.0, 15447.0, 3235.0, 1067.0, 420.0, 227.0, 94.0, 59.0, 34.0, 23.0, 15.0, 6.0, 5.0, 4.0, 6.0, 2.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.21484375, -1.17218017578125, -1.1295166015625, -1.08685302734375, -1.044189453125, -1.00152587890625, -0.9588623046875, -0.91619873046875, -0.87353515625, -0.83087158203125, -0.7882080078125, -0.74554443359375, -0.702880859375, -0.66021728515625, -0.6175537109375, -0.57489013671875, -0.5322265625, -0.48956298828125, -0.4468994140625, -0.40423583984375, -0.361572265625, -0.31890869140625, -0.2762451171875, -0.23358154296875, -0.19091796875, -0.14825439453125, -0.1055908203125, -0.06292724609375, -0.020263671875, 0.02239990234375, 0.0650634765625, 0.10772705078125, 0.150390625, 0.19305419921875, 0.2357177734375, 0.27838134765625, 0.321044921875, 0.36370849609375, 0.4063720703125, 0.44903564453125, 0.49169921875, 0.53436279296875, 0.5770263671875, 0.61968994140625, 0.662353515625, 0.70501708984375, 0.7476806640625, 0.79034423828125, 0.8330078125, 0.87567138671875, 0.9183349609375, 0.96099853515625, 1.003662109375, 1.04632568359375, 1.0889892578125, 1.13165283203125, 1.17431640625, 1.21697998046875, 1.2596435546875, 1.30230712890625, 1.344970703125, 1.38763427734375, 1.4302978515625, 1.47296142578125, 1.515625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 11.0, 11.0, 19.0, 26.0, 27.0, 48.0, 70.0, 99.0, 113.0, 135.0, 96.0, 98.0, 73.0, 57.0, 46.0, 23.0, 19.0, 8.0, 3.0, 9.0, 6.0, 3.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2861328125, -1.244140625, -1.2021484375, -1.16015625, -1.1181640625, -1.076171875, -1.0341796875, -0.9921875, -0.9501953125, -0.908203125, -0.8662109375, -0.82421875, -0.7822265625, -0.740234375, -0.6982421875, -0.65625, -0.6142578125, -0.572265625, -0.5302734375, -0.48828125, -0.4462890625, -0.404296875, -0.3623046875, -0.3203125, -0.2783203125, -0.236328125, -0.1943359375, -0.15234375, -0.1103515625, -0.068359375, -0.0263671875, 0.015625, 0.0576171875, 0.099609375, 0.1416015625, 0.18359375, 0.2255859375, 0.267578125, 0.3095703125, 0.3515625, 0.3935546875, 0.435546875, 0.4775390625, 0.51953125, 0.5615234375, 0.603515625, 0.6455078125, 0.6875, 0.7294921875, 0.771484375, 0.8134765625, 0.85546875, 0.8974609375, 0.939453125, 0.9814453125, 1.0234375, 1.0654296875, 1.107421875, 1.1494140625, 1.19140625, 1.2333984375, 1.275390625, 1.3173828125, 1.359375, 1.4013671875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 9.0, 12.0, 39.0, 87.0, 199.0, 254.0, 238.0, 94.0, 44.0, 24.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.49341869354248, -11.415940284729004, -10.338460922241211, -9.260982513427734, -8.183504104614258, -7.106025695800781, -6.0285468101501465, -4.951067924499512, -3.873589515686035, -2.7961108684539795, -1.7186322212219238, -0.6411535739898682, 0.4363250732421875, 1.513803482055664, 2.591282367706299, 3.6687612533569336, 4.74623966217041, 5.823718070983887, 6.9011969566345215, 7.978675842285156, 9.056154251098633, 10.13363265991211, 11.211111068725586, 12.288590431213379, 13.366068840026855, 14.443547248840332, 15.521026611328125, 16.5985050201416, 17.675983428955078, 18.753461837768555, 19.83094024658203, 20.90842056274414, 21.98590087890625, 23.063379287719727, 24.140857696533203, 25.21833610534668, 26.295814514160156, 27.373294830322266, 28.450773239135742, 29.52825164794922, 30.605730056762695, 31.683208465576172, 32.76068878173828, 33.838165283203125, 34.915645599365234, 35.99312210083008, 37.07060241699219, 38.14807891845703, 39.22555923461914, 40.30303955078125, 41.380516052246094, 42.4579963684082, 43.53547286987305, 44.612953186035156, 45.6904296875, 46.76791000366211, 47.84539031982422, 48.92287063598633, 50.00034713745117, 51.07782745361328, 52.155303955078125, 53.232784271240234, 54.31026077270508, 55.38774108886719, 56.46521759033203]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 4.0, 2.0, 6.0, 7.0, 10.0, 12.0, 15.0, 20.0, 14.0, 18.0, 19.0, 25.0, 28.0, 19.0, 25.0, 36.0, 36.0, 48.0, 41.0, 39.0, 37.0, 47.0, 45.0, 54.0, 36.0, 31.0, 27.0, 39.0, 34.0, 30.0, 26.0, 30.0, 32.0, 14.0, 20.0, 16.0, 9.0, 8.0, 6.0, 13.0, 6.0, 7.0, 6.0, 1.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.785120964050293, -11.40289306640625, -11.020666122436523, -10.63843822479248, -10.256210327148438, -9.873982429504395, -9.491754531860352, -9.109527587890625, -8.727299690246582, -8.345071792602539, -7.962844371795654, -7.5806169509887695, -7.198389053344727, -6.816161155700684, -6.433933734893799, -6.051706314086914, -5.669478416442871, -5.287250518798828, -4.905023097991943, -4.522795677185059, -4.140567779541016, -3.7583401203155518, -3.376112461090088, -2.993884801864624, -2.61165714263916, -2.2294294834136963, -1.8472018241882324, -1.4649741649627686, -1.0827465057373047, -0.7005188465118408, -0.31829118728637695, 0.06393647193908691, 0.4461650848388672, 0.828392744064331, 1.210620403289795, 1.5928480625152588, 1.9750757217407227, 2.3573033809661865, 2.7395310401916504, 3.1217586994171143, 3.503986358642578, 3.886214017868042, 4.268441677093506, 4.650669097900391, 5.032896995544434, 5.415124893188477, 5.797352313995361, 6.179579734802246, 6.561807632446289, 6.944035530090332, 7.326262950897217, 7.708490371704102, 8.090718269348145, 8.472946166992188, 8.855173110961914, 9.237401008605957, 9.61962890625, 10.001856803894043, 10.384084701538086, 10.766311645507812, 11.148539543151855, 11.530767440795898, 11.912994384765625, 12.295222282409668, 12.677450180053711]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 5.0, 7.0, 7.0, 6.0, 9.0, 10.0, 25.0, 31.0, 40.0, 69.0, 109.0, 222.0, 461.0, 1037.0, 2720.0, 8324.0, 36604.0, 3815143.0, 295883.0, 23169.0, 6095.0, 2203.0, 979.0, 469.0, 265.0, 159.0, 79.0, 50.0, 37.0, 22.0, 19.0, 8.0, 2.0, 5.0, 2.0, 4.0, 1.0, 3.0, 1.0], "bins": [-7.61328125, -7.435699462890625, -7.25811767578125, -7.080535888671875, -6.9029541015625, -6.725372314453125, -6.54779052734375, -6.370208740234375, -6.192626953125, -6.015045166015625, -5.83746337890625, -5.659881591796875, -5.4822998046875, -5.304718017578125, -5.12713623046875, -4.949554443359375, -4.77197265625, -4.594390869140625, -4.41680908203125, -4.239227294921875, -4.0616455078125, -3.884063720703125, -3.70648193359375, -3.528900146484375, -3.351318359375, -3.173736572265625, -2.99615478515625, -2.818572998046875, -2.6409912109375, -2.463409423828125, -2.28582763671875, -2.108245849609375, -1.9306640625, -1.753082275390625, -1.57550048828125, -1.397918701171875, -1.2203369140625, -1.042755126953125, -0.86517333984375, -0.687591552734375, -0.510009765625, -0.332427978515625, -0.15484619140625, 0.022735595703125, 0.2003173828125, 0.377899169921875, 0.55548095703125, 0.733062744140625, 0.91064453125, 1.088226318359375, 1.26580810546875, 1.443389892578125, 1.6209716796875, 1.798553466796875, 1.97613525390625, 2.153717041015625, 2.331298828125, 2.508880615234375, 2.68646240234375, 2.864044189453125, 3.0416259765625, 3.219207763671875, 3.39678955078125, 3.574371337890625, 3.751953125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 7.0, 4.0, 6.0, 16.0, 13.0, 13.0, 29.0, 22.0, 36.0, 26.0, 43.0, 37.0, 51.0, 46.0, 55.0, 44.0, 52.0, 55.0, 58.0, 51.0, 51.0, 53.0, 40.0, 29.0, 29.0, 24.0, 26.0, 14.0, 13.0, 12.0, 10.0, 7.0, 8.0, 7.0, 7.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.7939453125, -0.771240234375, -0.74853515625, -0.725830078125, -0.703125, -0.680419921875, -0.65771484375, -0.635009765625, -0.6123046875, -0.589599609375, -0.56689453125, -0.544189453125, -0.521484375, -0.498779296875, -0.47607421875, -0.453369140625, -0.4306640625, -0.407958984375, -0.38525390625, -0.362548828125, -0.33984375, -0.317138671875, -0.29443359375, -0.271728515625, -0.2490234375, -0.226318359375, -0.20361328125, -0.180908203125, -0.158203125, -0.135498046875, -0.11279296875, -0.090087890625, -0.0673828125, -0.044677734375, -0.02197265625, 0.000732421875, 0.0234375, 0.046142578125, 0.06884765625, 0.091552734375, 0.1142578125, 0.136962890625, 0.15966796875, 0.182373046875, 0.205078125, 0.227783203125, 0.25048828125, 0.273193359375, 0.2958984375, 0.318603515625, 0.34130859375, 0.364013671875, 0.38671875, 0.409423828125, 0.43212890625, 0.454833984375, 0.4775390625, 0.500244140625, 0.52294921875, 0.545654296875, 0.568359375, 0.591064453125, 0.61376953125, 0.636474609375, 0.6591796875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 12.0, 6.0, 11.0, 16.0, 18.0, 26.0, 26.0, 55.0, 70.0, 92.0, 150.0, 215.0, 395.0, 565.0, 1035.0, 1858.0, 3671.0, 8511.0, 24315.0, 108291.0, 3766328.0, 221551.0, 35382.0, 11582.0, 4810.0, 2276.0, 1139.0, 685.0, 415.0, 260.0, 168.0, 113.0, 70.0, 47.0, 42.0, 20.0, 16.0, 16.0, 14.0, 11.0, 4.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.3203125, -3.2186279296875, -3.116943359375, -3.0152587890625, -2.91357421875, -2.8118896484375, -2.710205078125, -2.6085205078125, -2.5068359375, -2.4051513671875, -2.303466796875, -2.2017822265625, -2.10009765625, -1.9984130859375, -1.896728515625, -1.7950439453125, -1.693359375, -1.5916748046875, -1.489990234375, -1.3883056640625, -1.28662109375, -1.1849365234375, -1.083251953125, -0.9815673828125, -0.8798828125, -0.7781982421875, -0.676513671875, -0.5748291015625, -0.47314453125, -0.3714599609375, -0.269775390625, -0.1680908203125, -0.06640625, 0.0352783203125, 0.136962890625, 0.2386474609375, 0.34033203125, 0.4420166015625, 0.543701171875, 0.6453857421875, 0.7470703125, 0.8487548828125, 0.950439453125, 1.0521240234375, 1.15380859375, 1.2554931640625, 1.357177734375, 1.4588623046875, 1.560546875, 1.6622314453125, 1.763916015625, 1.8656005859375, 1.96728515625, 2.0689697265625, 2.170654296875, 2.2723388671875, 2.3740234375, 2.4757080078125, 2.577392578125, 2.6790771484375, 2.78076171875, 2.8824462890625, 2.984130859375, 3.0858154296875, 3.1875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 10.0, 9.0, 13.0, 24.0, 42.0, 75.0, 261.0, 3123.0, 306.0, 105.0, 34.0, 25.0, 13.0, 9.0, 6.0, 8.0, 6.0, 2.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.05078125, -2.95697021484375, -2.8631591796875, -2.76934814453125, -2.675537109375, -2.58172607421875, -2.4879150390625, -2.39410400390625, -2.30029296875, -2.20648193359375, -2.1126708984375, -2.01885986328125, -1.925048828125, -1.83123779296875, -1.7374267578125, -1.64361572265625, -1.5498046875, -1.45599365234375, -1.3621826171875, -1.26837158203125, -1.174560546875, -1.08074951171875, -0.9869384765625, -0.89312744140625, -0.79931640625, -0.70550537109375, -0.6116943359375, -0.51788330078125, -0.424072265625, -0.33026123046875, -0.2364501953125, -0.14263916015625, -0.048828125, 0.04498291015625, 0.1387939453125, 0.23260498046875, 0.326416015625, 0.42022705078125, 0.5140380859375, 0.60784912109375, 0.70166015625, 0.79547119140625, 0.8892822265625, 0.98309326171875, 1.076904296875, 1.17071533203125, 1.2645263671875, 1.35833740234375, 1.4521484375, 1.54595947265625, 1.6397705078125, 1.73358154296875, 1.827392578125, 1.92120361328125, 2.0150146484375, 2.10882568359375, 2.20263671875, 2.29644775390625, 2.3902587890625, 2.48406982421875, 2.577880859375, 2.67169189453125, 2.7655029296875, 2.85931396484375, 2.953125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 8.0, 22.0, 76.0, 250.0, 376.0, 190.0, 48.0, 11.0, 10.0, 8.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.179655075073242, -25.575977325439453, -24.97229766845703, -24.368619918823242, -23.764942169189453, -23.161264419555664, -22.557586669921875, -21.953907012939453, -21.350229263305664, -20.746551513671875, -20.142871856689453, -19.539194107055664, -18.935516357421875, -18.331838607788086, -17.728160858154297, -17.124481201171875, -16.520803451538086, -15.917125701904297, -15.313446998596191, -14.709768295288086, -14.106090545654297, -13.502412796020508, -12.898734092712402, -12.295055389404297, -11.691377639770508, -11.087699890136719, -10.484021186828613, -9.880342483520508, -9.276664733886719, -8.67298698425293, -8.069308280944824, -7.465630054473877, -6.861952781677246, -6.258274555206299, -5.654596328735352, -5.050918102264404, -4.447239875793457, -3.8435616493225098, -3.2398834228515625, -2.6362051963806152, -2.032526969909668, -1.4288487434387207, -0.8251705169677734, -0.22149229049682617, 0.3821859359741211, 0.9858641624450684, 1.5895423889160156, 2.193220615386963, 2.79689884185791, 3.4005770683288574, 4.004255294799805, 4.607933521270752, 5.211611747741699, 5.8152899742126465, 6.418968200683594, 7.022646427154541, 7.626324653625488, 8.230003356933594, 8.833681106567383, 9.437358856201172, 10.041037559509277, 10.644716262817383, 11.248394012451172, 11.852071762084961, 12.455750465393066]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 8.0, 7.0, 4.0, 13.0, 19.0, 24.0, 19.0, 21.0, 24.0, 25.0, 31.0, 34.0, 39.0, 36.0, 39.0, 49.0, 50.0, 52.0, 55.0, 42.0, 44.0, 43.0, 39.0, 42.0, 36.0, 37.0, 34.0, 26.0, 21.0, 8.0, 19.0, 15.0, 10.0, 9.0, 7.0, 8.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.794589042663574, -4.642538070678711, -4.4904866218566895, -4.338435649871826, -4.186384201049805, -4.034333229064941, -3.882282018661499, -3.7302308082580566, -3.5781795978546143, -3.426128387451172, -3.2740771770477295, -3.122025966644287, -2.969974994659424, -2.8179235458374023, -2.665872573852539, -2.5138213634490967, -2.3617701530456543, -2.209718942642212, -2.0576677322387695, -1.9056166410446167, -1.7535654306411743, -1.601514220237732, -1.449463129043579, -1.2974119186401367, -1.1453607082366943, -0.993309497833252, -0.8412583470344543, -0.6892071962356567, -0.5371559858322144, -0.385104775428772, -0.23305362462997437, -0.08100247383117676, 0.07104873657226562, 0.22309991717338562, 0.3751510977745056, 0.5272022485733032, 0.6792534589767456, 0.831304669380188, 0.9833558201789856, 1.1354069709777832, 1.2874581813812256, 1.439509391784668, 1.5915606021881104, 1.7436116933822632, 1.8956629037857056, 2.0477142333984375, 2.199765205383301, 2.351816415786743, 2.5038676261901855, 2.655918836593628, 2.8079700469970703, 2.9600212574005127, 3.112072467803955, 3.2641234397888184, 3.4161746501922607, 3.568225860595703, 3.7202770709991455, 3.872328281402588, 4.024379253387451, 4.176430702209473, 4.328481674194336, 4.480533123016357, 4.632584095001221, 4.784635543823242, 4.9366865158081055]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 3.0, 4.0, 0.0, 3.0, 7.0, 8.0, 9.0, 18.0, 27.0, 47.0, 74.0, 118.0, 224.0, 520.0, 1353.0, 4186.0, 18082.0, 113906.0, 648528.0, 221375.0, 30410.0, 6388.0, 1853.0, 665.0, 338.0, 149.0, 89.0, 64.0, 35.0, 21.0, 11.0, 12.0, 14.0, 3.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.96484375, -4.81732177734375, -4.6697998046875, -4.52227783203125, -4.374755859375, -4.22723388671875, -4.0797119140625, -3.93218994140625, -3.78466796875, -3.63714599609375, -3.4896240234375, -3.34210205078125, -3.194580078125, -3.04705810546875, -2.8995361328125, -2.75201416015625, -2.6044921875, -2.45697021484375, -2.3094482421875, -2.16192626953125, -2.014404296875, -1.86688232421875, -1.7193603515625, -1.57183837890625, -1.42431640625, -1.27679443359375, -1.1292724609375, -0.98175048828125, -0.834228515625, -0.68670654296875, -0.5391845703125, -0.39166259765625, -0.244140625, -0.09661865234375, 0.0509033203125, 0.19842529296875, 0.345947265625, 0.49346923828125, 0.6409912109375, 0.78851318359375, 0.93603515625, 1.08355712890625, 1.2310791015625, 1.37860107421875, 1.526123046875, 1.67364501953125, 1.8211669921875, 1.96868896484375, 2.1162109375, 2.26373291015625, 2.4112548828125, 2.55877685546875, 2.706298828125, 2.85382080078125, 3.0013427734375, 3.14886474609375, 3.29638671875, 3.44390869140625, 3.5914306640625, 3.73895263671875, 3.886474609375, 4.03399658203125, 4.1815185546875, 4.32904052734375, 4.4765625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 6.0, 5.0, 13.0, 10.0, 10.0, 18.0, 12.0, 32.0, 18.0, 40.0, 30.0, 30.0, 36.0, 43.0, 49.0, 44.0, 52.0, 35.0, 48.0, 49.0, 39.0, 49.0, 38.0, 39.0, 38.0, 30.0, 27.0, 27.0, 27.0, 17.0, 21.0, 8.0, 13.0, 11.0, 8.0, 10.0, 3.0, 2.0, 2.0, 5.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.72314453125, -0.7008132934570312, -0.6784820556640625, -0.6561508178710938, -0.633819580078125, -0.6114883422851562, -0.5891571044921875, -0.5668258666992188, -0.54449462890625, -0.5221633911132812, -0.4998321533203125, -0.47750091552734375, -0.455169677734375, -0.43283843994140625, -0.4105072021484375, -0.38817596435546875, -0.3658447265625, -0.34351348876953125, -0.3211822509765625, -0.29885101318359375, -0.276519775390625, -0.25418853759765625, -0.2318572998046875, -0.20952606201171875, -0.18719482421875, -0.16486358642578125, -0.1425323486328125, -0.12020111083984375, -0.097869873046875, -0.07553863525390625, -0.0532073974609375, -0.03087615966796875, -0.008544921875, 0.01378631591796875, 0.0361175537109375, 0.05844879150390625, 0.080780029296875, 0.10311126708984375, 0.1254425048828125, 0.14777374267578125, 0.17010498046875, 0.19243621826171875, 0.2147674560546875, 0.23709869384765625, 0.259429931640625, 0.28176116943359375, 0.3040924072265625, 0.32642364501953125, 0.3487548828125, 0.37108612060546875, 0.3934173583984375, 0.41574859619140625, 0.438079833984375, 0.46041107177734375, 0.4827423095703125, 0.5050735473632812, 0.52740478515625, 0.5497360229492188, 0.5720672607421875, 0.5943984985351562, 0.616729736328125, 0.6390609741210938, 0.6613922119140625, 0.6837234497070312, 0.7060546875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 5.0, 6.0, 8.0, 12.0, 18.0, 27.0, 43.0, 74.0, 109.0, 236.0, 468.0, 991.0, 2467.0, 6685.0, 21844.0, 99194.0, 547441.0, 297914.0, 50618.0, 12919.0, 4258.0, 1692.0, 727.0, 330.0, 195.0, 110.0, 63.0, 30.0, 19.0, 18.0, 9.0, 8.0, 4.0, 1.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.806640625, -2.70916748046875, -2.6116943359375, -2.51422119140625, -2.416748046875, -2.31927490234375, -2.2218017578125, -2.12432861328125, -2.02685546875, -1.92938232421875, -1.8319091796875, -1.73443603515625, -1.636962890625, -1.53948974609375, -1.4420166015625, -1.34454345703125, -1.2470703125, -1.14959716796875, -1.0521240234375, -0.95465087890625, -0.857177734375, -0.75970458984375, -0.6622314453125, -0.56475830078125, -0.46728515625, -0.36981201171875, -0.2723388671875, -0.17486572265625, -0.077392578125, 0.02008056640625, 0.1175537109375, 0.21502685546875, 0.3125, 0.40997314453125, 0.5074462890625, 0.60491943359375, 0.702392578125, 0.79986572265625, 0.8973388671875, 0.99481201171875, 1.09228515625, 1.18975830078125, 1.2872314453125, 1.38470458984375, 1.482177734375, 1.57965087890625, 1.6771240234375, 1.77459716796875, 1.8720703125, 1.96954345703125, 2.0670166015625, 2.16448974609375, 2.261962890625, 2.35943603515625, 2.4569091796875, 2.55438232421875, 2.65185546875, 2.74932861328125, 2.8468017578125, 2.94427490234375, 3.041748046875, 3.13922119140625, 3.2366943359375, 3.33416748046875, 3.431640625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 2.0, 6.0, 1.0, 6.0, 7.0, 5.0, 7.0, 9.0, 19.0, 17.0, 15.0, 25.0, 29.0, 32.0, 34.0, 35.0, 46.0, 45.0, 44.0, 38.0, 48.0, 62.0, 46.0, 54.0, 52.0, 39.0, 40.0, 33.0, 33.0, 42.0, 21.0, 15.0, 21.0, 12.0, 20.0, 5.0, 7.0, 6.0, 9.0, 6.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.615234375, -3.499420166015625, -3.38360595703125, -3.267791748046875, -3.1519775390625, -3.036163330078125, -2.92034912109375, -2.804534912109375, -2.688720703125, -2.572906494140625, -2.45709228515625, -2.341278076171875, -2.2254638671875, -2.109649658203125, -1.99383544921875, -1.878021240234375, -1.76220703125, -1.646392822265625, -1.53057861328125, -1.414764404296875, -1.2989501953125, -1.183135986328125, -1.06732177734375, -0.951507568359375, -0.835693359375, -0.719879150390625, -0.60406494140625, -0.488250732421875, -0.3724365234375, -0.256622314453125, -0.14080810546875, -0.024993896484375, 0.0908203125, 0.206634521484375, 0.32244873046875, 0.438262939453125, 0.5540771484375, 0.669891357421875, 0.78570556640625, 0.901519775390625, 1.017333984375, 1.133148193359375, 1.24896240234375, 1.364776611328125, 1.4805908203125, 1.596405029296875, 1.71221923828125, 1.828033447265625, 1.94384765625, 2.059661865234375, 2.17547607421875, 2.291290283203125, 2.4071044921875, 2.522918701171875, 2.63873291015625, 2.754547119140625, 2.870361328125, 2.986175537109375, 3.10198974609375, 3.217803955078125, 3.3336181640625, 3.449432373046875, 3.56524658203125, 3.681060791015625, 3.796875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 6.0, 3.0, 8.0, 10.0, 13.0, 20.0, 40.0, 54.0, 88.0, 130.0, 224.0, 376.0, 632.0, 1098.0, 2047.0, 4265.0, 12249.0, 122839.0, 839956.0, 48491.0, 8540.0, 3442.0, 1702.0, 920.0, 513.0, 336.0, 213.0, 101.0, 76.0, 61.0, 33.0, 19.0, 23.0, 8.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6484375, -2.561187744140625, -2.47393798828125, -2.386688232421875, -2.2994384765625, -2.212188720703125, -2.12493896484375, -2.037689208984375, -1.950439453125, -1.863189697265625, -1.77593994140625, -1.688690185546875, -1.6014404296875, -1.514190673828125, -1.42694091796875, -1.339691162109375, -1.25244140625, -1.165191650390625, -1.07794189453125, -0.990692138671875, -0.9034423828125, -0.816192626953125, -0.72894287109375, -0.641693115234375, -0.554443359375, -0.467193603515625, -0.37994384765625, -0.292694091796875, -0.2054443359375, -0.118194580078125, -0.03094482421875, 0.056304931640625, 0.1435546875, 0.230804443359375, 0.31805419921875, 0.405303955078125, 0.4925537109375, 0.579803466796875, 0.66705322265625, 0.754302978515625, 0.841552734375, 0.928802490234375, 1.01605224609375, 1.103302001953125, 1.1905517578125, 1.277801513671875, 1.36505126953125, 1.452301025390625, 1.53955078125, 1.626800537109375, 1.71405029296875, 1.801300048828125, 1.8885498046875, 1.975799560546875, 2.06304931640625, 2.150299072265625, 2.237548828125, 2.324798583984375, 2.41204833984375, 2.499298095703125, 2.5865478515625, 2.673797607421875, 2.76104736328125, 2.848297119140625, 2.935546875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 5.0, 7.0, 7.0, 9.0, 17.0, 40.0, 50.0, 113.0, 193.0, 203.0, 163.0, 86.0, 53.0, 22.0, 9.0, 5.0, 4.0, 3.0, 5.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0005145072937011719, -0.0005006939172744751, -0.0004868805408477783, -0.00047306716442108154, -0.00045925378799438477, -0.000445440411567688, -0.0004316270351409912, -0.00041781365871429443, -0.00040400028228759766, -0.0003901869058609009, -0.0003763735294342041, -0.0003625601530075073, -0.00034874677658081055, -0.00033493340015411377, -0.000321120023727417, -0.0003073066473007202, -0.00029349327087402344, -0.00027967989444732666, -0.0002658665180206299, -0.0002520531415939331, -0.00023823976516723633, -0.00022442638874053955, -0.00021061301231384277, -0.000196799635887146, -0.00018298625946044922, -0.00016917288303375244, -0.00015535950660705566, -0.0001415461301803589, -0.0001277327537536621, -0.00011391937732696533, -0.00010010600090026855, -8.629262447357178e-05, -7.2479248046875e-05, -5.866587162017822e-05, -4.4852495193481445e-05, -3.103911876678467e-05, -1.722574234008789e-05, -3.4123659133911133e-06, 1.0401010513305664e-05, 2.421438694000244e-05, 3.802776336669922e-05, 5.1841139793395996e-05, 6.565451622009277e-05, 7.946789264678955e-05, 9.328126907348633e-05, 0.0001070946455001831, 0.00012090802192687988, 0.00013472139835357666, 0.00014853477478027344, 0.00016234815120697021, 0.000176161527633667, 0.00018997490406036377, 0.00020378828048706055, 0.00021760165691375732, 0.0002314150333404541, 0.0002452284097671509, 0.00025904178619384766, 0.00027285516262054443, 0.0002866685390472412, 0.000300481915473938, 0.00031429529190063477, 0.00032810866832733154, 0.0003419220447540283, 0.0003557354211807251, 0.0003695487976074219]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 0.0, 0.0, 9.0, 10.0, 18.0, 29.0, 61.0, 108.0, 149.0, 381.0, 1251.0, 5835.0, 181920.0, 846407.0, 9564.0, 1828.0, 549.0, 193.0, 92.0, 62.0, 36.0, 20.0, 10.0, 15.0, 7.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0078125, -6.819091796875, -6.63037109375, -6.441650390625, -6.2529296875, -6.064208984375, -5.87548828125, -5.686767578125, -5.498046875, -5.309326171875, -5.12060546875, -4.931884765625, -4.7431640625, -4.554443359375, -4.36572265625, -4.177001953125, -3.98828125, -3.799560546875, -3.61083984375, -3.422119140625, -3.2333984375, -3.044677734375, -2.85595703125, -2.667236328125, -2.478515625, -2.289794921875, -2.10107421875, -1.912353515625, -1.7236328125, -1.534912109375, -1.34619140625, -1.157470703125, -0.96875, -0.780029296875, -0.59130859375, -0.402587890625, -0.2138671875, -0.025146484375, 0.16357421875, 0.352294921875, 0.541015625, 0.729736328125, 0.91845703125, 1.107177734375, 1.2958984375, 1.484619140625, 1.67333984375, 1.862060546875, 2.05078125, 2.239501953125, 2.42822265625, 2.616943359375, 2.8056640625, 2.994384765625, 3.18310546875, 3.371826171875, 3.560546875, 3.749267578125, 3.93798828125, 4.126708984375, 4.3154296875, 4.504150390625, 4.69287109375, 4.881591796875, 5.0703125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 3.0, 8.0, 11.0, 22.0, 62.0, 194.0, 336.0, 219.0, 58.0, 29.0, 16.0, 16.0, 9.0, 2.0, 3.0, 2.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6015625, -6.446563720703125, -6.29156494140625, -6.136566162109375, -5.9815673828125, -5.826568603515625, -5.67156982421875, -5.516571044921875, -5.361572265625, -5.206573486328125, -5.05157470703125, -4.896575927734375, -4.7415771484375, -4.586578369140625, -4.43157958984375, -4.276580810546875, -4.12158203125, -3.966583251953125, -3.81158447265625, -3.656585693359375, -3.5015869140625, -3.346588134765625, -3.19158935546875, -3.036590576171875, -2.881591796875, -2.726593017578125, -2.57159423828125, -2.416595458984375, -2.2615966796875, -2.106597900390625, -1.95159912109375, -1.796600341796875, -1.6416015625, -1.486602783203125, -1.33160400390625, -1.176605224609375, -1.0216064453125, -0.866607666015625, -0.71160888671875, -0.556610107421875, -0.401611328125, -0.246612548828125, -0.09161376953125, 0.063385009765625, 0.2183837890625, 0.373382568359375, 0.52838134765625, 0.683380126953125, 0.83837890625, 0.993377685546875, 1.14837646484375, 1.303375244140625, 1.4583740234375, 1.613372802734375, 1.76837158203125, 1.923370361328125, 2.078369140625, 2.233367919921875, 2.38836669921875, 2.543365478515625, 2.6983642578125, 2.853363037109375, 3.00836181640625, 3.163360595703125, 3.318359375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 2.0, 6.0, 13.0, 30.0, 55.0, 106.0, 141.0, 204.0, 175.0, 120.0, 69.0, 38.0, 28.0, 5.0, 6.0, 4.0, 3.0, 4.0], "bins": [-57.122108459472656, -56.0565185546875, -54.990928649902344, -53.92533874511719, -52.85974884033203, -51.79416275024414, -50.728572845458984, -49.66298294067383, -48.59739303588867, -47.531803131103516, -46.46621322631836, -45.4006233215332, -44.33503723144531, -43.269447326660156, -42.203857421875, -41.138267517089844, -40.07267761230469, -39.00708770751953, -37.941497802734375, -36.87590789794922, -35.81031799316406, -34.74473190307617, -33.679141998291016, -32.61355209350586, -31.547962188720703, -30.482372283935547, -29.41678237915039, -28.351194381713867, -27.28560447692871, -26.220014572143555, -25.15442657470703, -24.088836669921875, -23.02324676513672, -21.957656860351562, -20.892066955566406, -19.826478958129883, -18.760889053344727, -17.69529914855957, -16.629711151123047, -15.56412124633789, -14.498531341552734, -13.432941436767578, -12.367352485656738, -11.301763534545898, -10.236173629760742, -9.170583724975586, -8.104994773864746, -7.039405345916748, -5.97381591796875, -4.908226490020752, -3.842637062072754, -2.777047634124756, -1.7114582061767578, -0.6458687782287598, 0.4197206497192383, 1.4853100776672363, 2.5508995056152344, 3.6164889335632324, 4.6820783615112305, 5.7476677894592285, 6.813257217407227, 7.878846645355225, 8.944436073303223, 10.010025024414062, 11.075614929199219]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 8.0, 6.0, 2.0, 4.0, 7.0, 10.0, 8.0, 9.0, 25.0, 24.0, 19.0, 24.0, 23.0, 29.0, 31.0, 23.0, 34.0, 46.0, 46.0, 38.0, 45.0, 48.0, 45.0, 39.0, 37.0, 40.0, 47.0, 32.0, 31.0, 28.0, 35.0, 26.0, 17.0, 19.0, 18.0, 11.0, 5.0, 11.0, 3.0, 14.0, 13.0, 6.0, 8.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-17.880279541015625, -17.283172607421875, -16.686063766479492, -16.088956832885742, -15.491849899291992, -14.894742012023926, -14.29763412475586, -13.70052719116211, -13.10342025756836, -12.506312370300293, -11.909205436706543, -11.312097549438477, -10.714990615844727, -10.11788272857666, -9.520774841308594, -8.923667907714844, -8.326560020446777, -7.729452610015869, -7.132345199584961, -6.5352373123168945, -5.9381303787231445, -5.341022491455078, -4.74391508102417, -4.146807670593262, -3.5497002601623535, -2.9525928497314453, -2.355485439300537, -1.7583777904510498, -1.1612703800201416, -0.5641629695892334, 0.032944679260253906, 0.6300520896911621, 1.2271595001220703, 1.8242669105529785, 2.4213743209838867, 3.018481969833374, 3.6155893802642822, 4.2126970291137695, 4.809804439544678, 5.406911849975586, 6.004019260406494, 6.601126670837402, 7.1982340812683105, 7.795341491699219, 8.392449378967285, 8.989556312561035, 9.586664199829102, 10.183771133422852, 10.780879020690918, 11.377986907958984, 11.975093841552734, 12.5722017288208, 13.16930866241455, 13.766416549682617, 14.363523483276367, 14.960631370544434, 15.5577392578125, 16.15484619140625, 16.751955032348633, 17.349061965942383, 17.946168899536133, 18.543275833129883, 19.140384674072266, 19.737491607666016, 20.334598541259766]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 5.0, 1.0, 5.0, 4.0, 11.0, 0.0, 14.0, 17.0, 27.0, 30.0, 51.0, 75.0, 112.0, 177.0, 234.0, 409.0, 774.0, 2006.0, 10603.0, 4150250.0, 24286.0, 2933.0, 944.0, 476.0, 295.0, 193.0, 103.0, 89.0, 46.0, 38.0, 28.0, 10.0, 20.0, 10.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3203125, -5.0626220703125, -4.804931640625, -4.5472412109375, -4.28955078125, -4.0318603515625, -3.774169921875, -3.5164794921875, -3.2587890625, -3.0010986328125, -2.743408203125, -2.4857177734375, -2.22802734375, -1.9703369140625, -1.712646484375, -1.4549560546875, -1.197265625, -0.9395751953125, -0.681884765625, -0.4241943359375, -0.16650390625, 0.0911865234375, 0.348876953125, 0.6065673828125, 0.8642578125, 1.1219482421875, 1.379638671875, 1.6373291015625, 1.89501953125, 2.1527099609375, 2.410400390625, 2.6680908203125, 2.92578125, 3.1834716796875, 3.441162109375, 3.6988525390625, 3.95654296875, 4.2142333984375, 4.471923828125, 4.7296142578125, 4.9873046875, 5.2449951171875, 5.502685546875, 5.7603759765625, 6.01806640625, 6.2757568359375, 6.533447265625, 6.7911376953125, 7.048828125, 7.3065185546875, 7.564208984375, 7.8218994140625, 8.07958984375, 8.3372802734375, 8.594970703125, 8.8526611328125, 9.1103515625, 9.3680419921875, 9.625732421875, 9.8834228515625, 10.14111328125, 10.3988037109375, 10.656494140625, 10.9141845703125, 11.171875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 0.0, 4.0, 3.0, 11.0, 7.0, 7.0, 7.0, 12.0, 9.0, 13.0, 13.0, 23.0, 18.0, 21.0, 24.0, 24.0, 36.0, 33.0, 46.0, 42.0, 42.0, 37.0, 49.0, 40.0, 33.0, 41.0, 41.0, 39.0, 35.0, 32.0, 34.0, 26.0, 21.0, 30.0, 24.0, 20.0, 25.0, 10.0, 6.0, 18.0, 5.0, 6.0, 6.0, 7.0, 5.0, 5.0, 4.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.82373046875, -0.7985076904296875, -0.773284912109375, -0.7480621337890625, -0.72283935546875, -0.6976165771484375, -0.672393798828125, -0.6471710205078125, -0.6219482421875, -0.5967254638671875, -0.571502685546875, -0.5462799072265625, -0.52105712890625, -0.4958343505859375, -0.470611572265625, -0.4453887939453125, -0.420166015625, -0.3949432373046875, -0.369720458984375, -0.3444976806640625, -0.31927490234375, -0.2940521240234375, -0.268829345703125, -0.2436065673828125, -0.2183837890625, -0.1931610107421875, -0.167938232421875, -0.1427154541015625, -0.11749267578125, -0.0922698974609375, -0.067047119140625, -0.0418243408203125, -0.0166015625, 0.0086212158203125, 0.033843994140625, 0.0590667724609375, 0.08428955078125, 0.1095123291015625, 0.134735107421875, 0.1599578857421875, 0.1851806640625, 0.2104034423828125, 0.235626220703125, 0.2608489990234375, 0.28607177734375, 0.3112945556640625, 0.336517333984375, 0.3617401123046875, 0.386962890625, 0.4121856689453125, 0.437408447265625, 0.4626312255859375, 0.48785400390625, 0.5130767822265625, 0.538299560546875, 0.5635223388671875, 0.5887451171875, 0.6139678955078125, 0.639190673828125, 0.6644134521484375, 0.68963623046875, 0.7148590087890625, 0.740081787109375, 0.7653045654296875, 0.79052734375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 2.0, 8.0, 7.0, 10.0, 18.0, 19.0, 23.0, 40.0, 56.0, 78.0, 112.0, 131.0, 158.0, 240.0, 316.0, 448.0, 676.0, 1136.0, 1914.0, 3489.0, 7645.0, 31114.0, 4090180.0, 39090.0, 8248.0, 3605.0, 2014.0, 1175.0, 713.0, 455.0, 328.0, 218.0, 148.0, 128.0, 86.0, 66.0, 51.0, 39.0, 19.0, 18.0, 15.0, 14.0, 11.0, 4.0, 6.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3515625, -4.2091064453125, -4.066650390625, -3.9241943359375, -3.78173828125, -3.6392822265625, -3.496826171875, -3.3543701171875, -3.2119140625, -3.0694580078125, -2.927001953125, -2.7845458984375, -2.64208984375, -2.4996337890625, -2.357177734375, -2.2147216796875, -2.072265625, -1.9298095703125, -1.787353515625, -1.6448974609375, -1.50244140625, -1.3599853515625, -1.217529296875, -1.0750732421875, -0.9326171875, -0.7901611328125, -0.647705078125, -0.5052490234375, -0.36279296875, -0.2203369140625, -0.077880859375, 0.0645751953125, 0.20703125, 0.3494873046875, 0.491943359375, 0.6343994140625, 0.77685546875, 0.9193115234375, 1.061767578125, 1.2042236328125, 1.3466796875, 1.4891357421875, 1.631591796875, 1.7740478515625, 1.91650390625, 2.0589599609375, 2.201416015625, 2.3438720703125, 2.486328125, 2.6287841796875, 2.771240234375, 2.9136962890625, 3.05615234375, 3.1986083984375, 3.341064453125, 3.4835205078125, 3.6259765625, 3.7684326171875, 3.910888671875, 4.0533447265625, 4.19580078125, 4.3382568359375, 4.480712890625, 4.6231689453125, 4.765625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 6.0, 2.0, 4.0, 6.0, 26.0, 95.0, 3836.0, 60.0, 18.0, 9.0, 3.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.51171875, -1.45440673828125, -1.3970947265625, -1.33978271484375, -1.282470703125, -1.22515869140625, -1.1678466796875, -1.11053466796875, -1.05322265625, -0.99591064453125, -0.9385986328125, -0.88128662109375, -0.823974609375, -0.76666259765625, -0.7093505859375, -0.65203857421875, -0.5947265625, -0.53741455078125, -0.4801025390625, -0.42279052734375, -0.365478515625, -0.30816650390625, -0.2508544921875, -0.19354248046875, -0.13623046875, -0.07891845703125, -0.0216064453125, 0.03570556640625, 0.093017578125, 0.15032958984375, 0.2076416015625, 0.26495361328125, 0.322265625, 0.37957763671875, 0.4368896484375, 0.49420166015625, 0.551513671875, 0.60882568359375, 0.6661376953125, 0.72344970703125, 0.78076171875, 0.83807373046875, 0.8953857421875, 0.95269775390625, 1.010009765625, 1.06732177734375, 1.1246337890625, 1.18194580078125, 1.2392578125, 1.29656982421875, 1.3538818359375, 1.41119384765625, 1.468505859375, 1.52581787109375, 1.5831298828125, 1.64044189453125, 1.69775390625, 1.75506591796875, 1.8123779296875, 1.86968994140625, 1.927001953125, 1.98431396484375, 2.0416259765625, 2.09893798828125, 2.15625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 4.0, 12.0, 40.0, 103.0, 231.0, 348.0, 192.0, 58.0, 13.0, 4.0, 1.0, 3.0], "bins": [-16.615558624267578, -16.32680320739746, -16.038047790527344, -15.74929141998291, -15.460536003112793, -15.171780586242676, -14.883025169372559, -14.594268798828125, -14.305513381958008, -14.01675796508789, -13.728002548217773, -13.43924617767334, -13.150490760803223, -12.861735343933105, -12.572979927062988, -12.284223556518555, -11.995468139648438, -11.70671272277832, -11.417957305908203, -11.12920093536377, -10.840445518493652, -10.551690101623535, -10.262934684753418, -9.974178314208984, -9.685423851013184, -9.396668434143066, -9.10791301727295, -8.819156646728516, -8.530401229858398, -8.241645812988281, -7.952890396118164, -7.664134502410889, -7.37537956237793, -7.0866241455078125, -6.797868251800537, -6.50911283493042, -6.2203569412231445, -5.931601524353027, -5.64284610748291, -5.354090213775635, -5.065334320068359, -4.776578903198242, -4.487823009490967, -4.19906759262085, -3.910311698913574, -3.621556282043457, -3.3328006267547607, -3.0440449714660645, -2.755289316177368, -2.466533660888672, -2.1777780055999756, -1.8890224695205688, -1.6002668142318726, -1.3115111589431763, -1.0227556228637695, -0.7339999675750732, -0.44524431228637695, -0.15648868680000305, 0.13226693868637085, 0.42102253437042236, 0.7097781896591187, 0.9985338449478149, 1.2872893810272217, 1.576045036315918, 1.8648006916046143]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 5.0, 2.0, 6.0, 6.0, 15.0, 10.0, 10.0, 15.0, 18.0, 19.0, 19.0, 29.0, 21.0, 35.0, 34.0, 38.0, 33.0, 39.0, 36.0, 33.0, 37.0, 40.0, 32.0, 30.0, 52.0, 42.0, 52.0, 34.0, 31.0, 30.0, 32.0, 22.0, 25.0, 20.0, 16.0, 19.0, 9.0, 9.0, 9.0, 11.0, 5.0, 4.0, 5.0, 10.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.194610595703125, -2.116312026977539, -2.0380136966705322, -1.9597152471542358, -1.8814167976379395, -1.803118348121643, -1.7248198986053467, -1.6465214490890503, -1.568222999572754, -1.4899245500564575, -1.4116261005401611, -1.3333276510238647, -1.2550292015075684, -1.176730751991272, -1.0984323024749756, -1.0201338529586792, -0.9418354034423828, -0.8635369539260864, -0.78523850440979, -0.7069400548934937, -0.6286416053771973, -0.5503431558609009, -0.4720447063446045, -0.3937462568283081, -0.3154478073120117, -0.23714935779571533, -0.15885090827941895, -0.08055245876312256, -0.002254009246826172, 0.07604444026947021, 0.1543428897857666, 0.232641339302063, 0.3109397888183594, 0.38923823833465576, 0.46753668785095215, 0.5458351373672485, 0.6241335868835449, 0.7024320363998413, 0.7807304859161377, 0.8590289354324341, 0.9373273849487305, 1.0156258344650269, 1.0939242839813232, 1.1722227334976196, 1.250521183013916, 1.3288196325302124, 1.4071180820465088, 1.4854165315628052, 1.5637149810791016, 1.642013430595398, 1.7203118801116943, 1.7986103296279907, 1.876908779144287, 1.9552072286605835, 2.03350567817688, 2.1118040084838867, 2.1901025772094727, 2.2684011459350586, 2.3466994762420654, 2.4249978065490723, 2.503296375274658, 2.581594944000244, 2.659893274307251, 2.738191604614258, 2.8164901733398438]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 8.0, 6.0, 10.0, 20.0, 33.0, 32.0, 55.0, 89.0, 107.0, 235.0, 444.0, 982.0, 2068.0, 4959.0, 12038.0, 31065.0, 83969.0, 227832.0, 369462.0, 197494.0, 72383.0, 26841.0, 10366.0, 4378.0, 1886.0, 829.0, 396.0, 218.0, 127.0, 82.0, 55.0, 23.0, 24.0, 8.0, 8.0, 6.0, 6.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.7734375, -2.69287109375, -2.6123046875, -2.53173828125, -2.451171875, -2.37060546875, -2.2900390625, -2.20947265625, -2.12890625, -2.04833984375, -1.9677734375, -1.88720703125, -1.806640625, -1.72607421875, -1.6455078125, -1.56494140625, -1.484375, -1.40380859375, -1.3232421875, -1.24267578125, -1.162109375, -1.08154296875, -1.0009765625, -0.92041015625, -0.83984375, -0.75927734375, -0.6787109375, -0.59814453125, -0.517578125, -0.43701171875, -0.3564453125, -0.27587890625, -0.1953125, -0.11474609375, -0.0341796875, 0.04638671875, 0.126953125, 0.20751953125, 0.2880859375, 0.36865234375, 0.44921875, 0.52978515625, 0.6103515625, 0.69091796875, 0.771484375, 0.85205078125, 0.9326171875, 1.01318359375, 1.09375, 1.17431640625, 1.2548828125, 1.33544921875, 1.416015625, 1.49658203125, 1.5771484375, 1.65771484375, 1.73828125, 1.81884765625, 1.8994140625, 1.97998046875, 2.060546875, 2.14111328125, 2.2216796875, 2.30224609375, 2.3828125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 5.0, 11.0, 7.0, 9.0, 12.0, 14.0, 16.0, 12.0, 18.0, 22.0, 24.0, 16.0, 19.0, 35.0, 43.0, 36.0, 31.0, 41.0, 54.0, 54.0, 51.0, 37.0, 40.0, 42.0, 36.0, 43.0, 30.0, 30.0, 28.0, 36.0, 16.0, 22.0, 15.0, 21.0, 9.0, 18.0, 10.0, 8.0, 5.0, 9.0, 3.0, 3.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.99560546875, -0.9639053344726562, -0.9322052001953125, -0.9005050659179688, -0.868804931640625, -0.8371047973632812, -0.8054046630859375, -0.7737045288085938, -0.74200439453125, -0.7103042602539062, -0.6786041259765625, -0.6469039916992188, -0.615203857421875, -0.5835037231445312, -0.5518035888671875, -0.5201034545898438, -0.4884033203125, -0.45670318603515625, -0.4250030517578125, -0.39330291748046875, -0.361602783203125, -0.32990264892578125, -0.2982025146484375, -0.26650238037109375, -0.23480224609375, -0.20310211181640625, -0.1714019775390625, -0.13970184326171875, -0.108001708984375, -0.07630157470703125, -0.0446014404296875, -0.01290130615234375, 0.018798828125, 0.05049896240234375, 0.0821990966796875, 0.11389923095703125, 0.145599365234375, 0.17729949951171875, 0.2089996337890625, 0.24069976806640625, 0.27239990234375, 0.30410003662109375, 0.3358001708984375, 0.36750030517578125, 0.399200439453125, 0.43090057373046875, 0.4626007080078125, 0.49430084228515625, 0.5260009765625, 0.5577011108398438, 0.5894012451171875, 0.6211013793945312, 0.652801513671875, 0.6845016479492188, 0.7162017822265625, 0.7479019165039062, 0.77960205078125, 0.8113021850585938, 0.8430023193359375, 0.8747024536132812, 0.906402587890625, 0.9381027221679688, 0.9698028564453125, 1.0015029907226562, 1.033203125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 6.0, 3.0, 6.0, 4.0, 8.0, 9.0, 8.0, 21.0, 15.0, 30.0, 42.0, 67.0, 94.0, 151.0, 258.0, 469.0, 874.0, 1927.0, 4843.0, 13540.0, 44701.0, 182473.0, 529989.0, 196999.0, 48457.0, 14579.0, 4857.0, 2046.0, 911.0, 437.0, 241.0, 154.0, 96.0, 63.0, 61.0, 27.0, 25.0, 20.0, 7.0, 16.0, 3.0, 5.0, 6.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0], "bins": [-3.4375, -3.331817626953125, -3.22613525390625, -3.120452880859375, -3.0147705078125, -2.909088134765625, -2.80340576171875, -2.697723388671875, -2.592041015625, -2.486358642578125, -2.38067626953125, -2.274993896484375, -2.1693115234375, -2.063629150390625, -1.95794677734375, -1.852264404296875, -1.74658203125, -1.640899658203125, -1.53521728515625, -1.429534912109375, -1.3238525390625, -1.218170166015625, -1.11248779296875, -1.006805419921875, -0.901123046875, -0.795440673828125, -0.68975830078125, -0.584075927734375, -0.4783935546875, -0.372711181640625, -0.26702880859375, -0.161346435546875, -0.0556640625, 0.050018310546875, 0.15570068359375, 0.261383056640625, 0.3670654296875, 0.472747802734375, 0.57843017578125, 0.684112548828125, 0.789794921875, 0.895477294921875, 1.00115966796875, 1.106842041015625, 1.2125244140625, 1.318206787109375, 1.42388916015625, 1.529571533203125, 1.63525390625, 1.740936279296875, 1.84661865234375, 1.952301025390625, 2.0579833984375, 2.163665771484375, 2.26934814453125, 2.375030517578125, 2.480712890625, 2.586395263671875, 2.69207763671875, 2.797760009765625, 2.9034423828125, 3.009124755859375, 3.11480712890625, 3.220489501953125, 3.326171875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 10.0, 9.0, 8.0, 13.0, 15.0, 25.0, 26.0, 32.0, 23.0, 37.0, 39.0, 37.0, 54.0, 54.0, 44.0, 71.0, 64.0, 44.0, 50.0, 34.0, 37.0, 47.0, 38.0, 30.0, 25.0, 26.0, 24.0, 16.0, 14.0, 9.0, 9.0, 8.0, 8.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.0390625, -6.8272705078125, -6.615478515625, -6.4036865234375, -6.19189453125, -5.9801025390625, -5.768310546875, -5.5565185546875, -5.3447265625, -5.1329345703125, -4.921142578125, -4.7093505859375, -4.49755859375, -4.2857666015625, -4.073974609375, -3.8621826171875, -3.650390625, -3.4385986328125, -3.226806640625, -3.0150146484375, -2.80322265625, -2.5914306640625, -2.379638671875, -2.1678466796875, -1.9560546875, -1.7442626953125, -1.532470703125, -1.3206787109375, -1.10888671875, -0.8970947265625, -0.685302734375, -0.4735107421875, -0.26171875, -0.0499267578125, 0.161865234375, 0.3736572265625, 0.58544921875, 0.7972412109375, 1.009033203125, 1.2208251953125, 1.4326171875, 1.6444091796875, 1.856201171875, 2.0679931640625, 2.27978515625, 2.4915771484375, 2.703369140625, 2.9151611328125, 3.126953125, 3.3387451171875, 3.550537109375, 3.7623291015625, 3.97412109375, 4.1859130859375, 4.397705078125, 4.6094970703125, 4.8212890625, 5.0330810546875, 5.244873046875, 5.4566650390625, 5.66845703125, 5.8802490234375, 6.092041015625, 6.3038330078125, 6.515625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 4.0, 4.0, 9.0, 16.0, 14.0, 27.0, 68.0, 91.0, 172.0, 406.0, 1068.0, 3959.0, 26790.0, 735141.0, 263455.0, 13383.0, 2514.0, 781.0, 310.0, 140.0, 75.0, 44.0, 25.0, 19.0, 17.0, 7.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.796875, -3.6846923828125, -3.572509765625, -3.4603271484375, -3.34814453125, -3.2359619140625, -3.123779296875, -3.0115966796875, -2.8994140625, -2.7872314453125, -2.675048828125, -2.5628662109375, -2.45068359375, -2.3385009765625, -2.226318359375, -2.1141357421875, -2.001953125, -1.8897705078125, -1.777587890625, -1.6654052734375, -1.55322265625, -1.4410400390625, -1.328857421875, -1.2166748046875, -1.1044921875, -0.9923095703125, -0.880126953125, -0.7679443359375, -0.65576171875, -0.5435791015625, -0.431396484375, -0.3192138671875, -0.20703125, -0.0948486328125, 0.017333984375, 0.1295166015625, 0.24169921875, 0.3538818359375, 0.466064453125, 0.5782470703125, 0.6904296875, 0.8026123046875, 0.914794921875, 1.0269775390625, 1.13916015625, 1.2513427734375, 1.363525390625, 1.4757080078125, 1.587890625, 1.7000732421875, 1.812255859375, 1.9244384765625, 2.03662109375, 2.1488037109375, 2.260986328125, 2.3731689453125, 2.4853515625, 2.5975341796875, 2.709716796875, 2.8218994140625, 2.93408203125, 3.0462646484375, 3.158447265625, 3.2706298828125, 3.3828125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 3.0, 7.0, 9.0, 13.0, 16.0, 11.0, 21.0, 30.0, 23.0, 37.0, 61.0, 69.0, 88.0, 91.0, 98.0, 82.0, 69.0, 51.0, 49.0, 52.0, 31.0, 23.0, 13.0, 12.0, 8.0, 11.0, 5.0, 7.0, 4.0, 2.0, 4.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0002646446228027344, -0.0002568960189819336, -0.0002491474151611328, -0.00024139881134033203, -0.00023365020751953125, -0.00022590160369873047, -0.0002181529998779297, -0.0002104043960571289, -0.00020265579223632812, -0.00019490718841552734, -0.00018715858459472656, -0.00017940998077392578, -0.000171661376953125, -0.00016391277313232422, -0.00015616416931152344, -0.00014841556549072266, -0.00014066696166992188, -0.0001329183578491211, -0.0001251697540283203, -0.00011742115020751953, -0.00010967254638671875, -0.00010192394256591797, -9.417533874511719e-05, -8.64267349243164e-05, -7.867813110351562e-05, -7.092952728271484e-05, -6.318092346191406e-05, -5.543231964111328e-05, -4.76837158203125e-05, -3.993511199951172e-05, -3.218650817871094e-05, -2.4437904357910156e-05, -1.6689300537109375e-05, -8.940696716308594e-06, -1.1920928955078125e-06, 6.556510925292969e-06, 1.430511474609375e-05, 2.205371856689453e-05, 2.9802322387695312e-05, 3.7550926208496094e-05, 4.5299530029296875e-05, 5.3048133850097656e-05, 6.079673767089844e-05, 6.854534149169922e-05, 7.62939453125e-05, 8.404254913330078e-05, 9.179115295410156e-05, 9.953975677490234e-05, 0.00010728836059570312, 0.0001150369644165039, 0.0001227855682373047, 0.00013053417205810547, 0.00013828277587890625, 0.00014603137969970703, 0.0001537799835205078, 0.0001615285873413086, 0.00016927719116210938, 0.00017702579498291016, 0.00018477439880371094, 0.00019252300262451172, 0.0002002716064453125, 0.00020802021026611328, 0.00021576881408691406, 0.00022351741790771484, 0.00023126602172851562]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 6.0, 5.0, 9.0, 23.0, 55.0, 87.0, 189.0, 367.0, 1010.0, 3472.0, 23480.0, 530712.0, 462925.0, 21204.0, 3325.0, 967.0, 362.0, 169.0, 80.0, 44.0, 26.0, 15.0, 10.0, 6.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.93359375, -2.838897705078125, -2.74420166015625, -2.649505615234375, -2.5548095703125, -2.460113525390625, -2.36541748046875, -2.270721435546875, -2.176025390625, -2.081329345703125, -1.98663330078125, -1.891937255859375, -1.7972412109375, -1.702545166015625, -1.60784912109375, -1.513153076171875, -1.41845703125, -1.323760986328125, -1.22906494140625, -1.134368896484375, -1.0396728515625, -0.944976806640625, -0.85028076171875, -0.755584716796875, -0.660888671875, -0.566192626953125, -0.47149658203125, -0.376800537109375, -0.2821044921875, -0.187408447265625, -0.09271240234375, 0.001983642578125, 0.0966796875, 0.191375732421875, 0.28607177734375, 0.380767822265625, 0.4754638671875, 0.570159912109375, 0.66485595703125, 0.759552001953125, 0.854248046875, 0.948944091796875, 1.04364013671875, 1.138336181640625, 1.2330322265625, 1.327728271484375, 1.42242431640625, 1.517120361328125, 1.61181640625, 1.706512451171875, 1.80120849609375, 1.895904541015625, 1.9906005859375, 2.085296630859375, 2.17999267578125, 2.274688720703125, 2.369384765625, 2.464080810546875, 2.55877685546875, 2.653472900390625, 2.7481689453125, 2.842864990234375, 2.93756103515625, 3.032257080078125, 3.126953125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 4.0, 7.0, 7.0, 14.0, 18.0, 36.0, 51.0, 116.0, 157.0, 188.0, 159.0, 99.0, 67.0, 24.0, 18.0, 20.0, 9.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.58984375, -4.4674072265625, -4.344970703125, -4.2225341796875, -4.10009765625, -3.9776611328125, -3.855224609375, -3.7327880859375, -3.6103515625, -3.4879150390625, -3.365478515625, -3.2430419921875, -3.12060546875, -2.9981689453125, -2.875732421875, -2.7532958984375, -2.630859375, -2.5084228515625, -2.385986328125, -2.2635498046875, -2.14111328125, -2.0186767578125, -1.896240234375, -1.7738037109375, -1.6513671875, -1.5289306640625, -1.406494140625, -1.2840576171875, -1.16162109375, -1.0391845703125, -0.916748046875, -0.7943115234375, -0.671875, -0.5494384765625, -0.427001953125, -0.3045654296875, -0.18212890625, -0.0596923828125, 0.062744140625, 0.1851806640625, 0.3076171875, 0.4300537109375, 0.552490234375, 0.6749267578125, 0.79736328125, 0.9197998046875, 1.042236328125, 1.1646728515625, 1.287109375, 1.4095458984375, 1.531982421875, 1.6544189453125, 1.77685546875, 1.8992919921875, 2.021728515625, 2.1441650390625, 2.2666015625, 2.3890380859375, 2.511474609375, 2.6339111328125, 2.75634765625, 2.8787841796875, 3.001220703125, 3.1236572265625, 3.24609375]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 9.0, 2.0, 20.0, 33.0, 91.0, 144.0, 225.0, 234.0, 131.0, 82.0, 22.0, 15.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-80.31433868408203, -78.60225677490234, -76.89017486572266, -75.17808532714844, -73.46600341796875, -71.75392150878906, -70.04183959960938, -68.32975769042969, -66.61767578125, -64.90559387207031, -63.19350814819336, -61.48142623901367, -59.769344329833984, -58.05725860595703, -56.345176696777344, -54.633094787597656, -52.92100524902344, -51.20892333984375, -49.4968376159668, -47.78475570678711, -46.07267379760742, -44.36058807373047, -42.64850616455078, -40.936424255371094, -39.224342346191406, -37.51226043701172, -35.800174713134766, -34.08809280395508, -32.37601089477539, -30.663925170898438, -28.95184326171875, -27.23975944519043, -25.527677536010742, -23.815593719482422, -22.103511810302734, -20.391427993774414, -18.679344177246094, -16.967262268066406, -15.255178451538086, -13.543094635009766, -11.831011772155762, -10.118928909301758, -8.406845092773438, -6.694762229919434, -4.9826788902282715, -3.2705955505371094, -1.5585126876831055, 0.15357112884521484, 1.8656539916992188, 3.577737331390381, 5.289820671081543, 7.001903533935547, 8.713987350463867, 10.426070213317871, 12.138153076171875, 13.850236892700195, 15.5623197555542, 17.274402618408203, 18.986486434936523, 20.698570251464844, 22.41065216064453, 24.12273597717285, 25.834819793701172, 27.54690170288086, 29.25898551940918]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 2.0, 6.0, 2.0, 8.0, 5.0, 8.0, 13.0, 8.0, 12.0, 12.0, 25.0, 17.0, 19.0, 34.0, 27.0, 30.0, 42.0, 43.0, 41.0, 69.0, 67.0, 41.0, 52.0, 45.0, 43.0, 49.0, 47.0, 29.0, 41.0, 29.0, 28.0, 22.0, 16.0, 16.0, 11.0, 18.0, 6.0, 6.0, 3.0, 4.0, 5.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-39.04851531982422, -37.98085403442383, -36.91319274902344, -35.84553146362305, -34.777870178222656, -33.710208892822266, -32.642547607421875, -31.574888229370117, -30.507226943969727, -29.439565658569336, -28.371904373168945, -27.304243087768555, -26.236583709716797, -25.168922424316406, -24.101261138916016, -23.033599853515625, -21.965938568115234, -20.898277282714844, -19.830615997314453, -18.762954711914062, -17.695293426513672, -16.62763214111328, -15.559972763061523, -14.492311477661133, -13.424650192260742, -12.356988906860352, -11.289327621459961, -10.221667289733887, -9.154006004333496, -8.086344718933105, -7.018683910369873, -5.951023101806641, -4.883363723754883, -3.8157026767730713, -2.7480416297912598, -1.6803805828094482, -0.6127195358276367, 0.4549417495727539, 1.5226025581359863, 2.5902633666992188, 3.6579246520996094, 4.7255859375, 5.793246746063232, 6.860907554626465, 7.9285688400268555, 8.996230125427246, 10.06389045715332, 11.131551742553711, 12.199213027954102, 13.266874313354492, 14.334535598754883, 15.402195930480957, 16.46985626220703, 17.537517547607422, 18.605178833007812, 19.672840118408203, 20.740501403808594, 21.808162689208984, 22.875823974609375, 23.943485260009766, 25.011146545410156, 26.078807830810547, 27.146467208862305, 28.214128494262695, 29.281789779663086]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 4.0, 7.0, 9.0, 8.0, 15.0, 18.0, 28.0, 42.0, 70.0, 99.0, 148.0, 269.0, 526.0, 956.0, 2252.0, 10622.0, 4123142.0, 48473.0, 4623.0, 1405.0, 679.0, 351.0, 200.0, 129.0, 67.0, 40.0, 25.0, 27.0, 13.0, 14.0, 8.0, 6.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.70703125, -5.46685791015625, -5.2266845703125, -4.98651123046875, -4.746337890625, -4.50616455078125, -4.2659912109375, -4.02581787109375, -3.78564453125, -3.54547119140625, -3.3052978515625, -3.06512451171875, -2.824951171875, -2.58477783203125, -2.3446044921875, -2.10443115234375, -1.8642578125, -1.62408447265625, -1.3839111328125, -1.14373779296875, -0.903564453125, -0.66339111328125, -0.4232177734375, -0.18304443359375, 0.05712890625, 0.29730224609375, 0.5374755859375, 0.77764892578125, 1.017822265625, 1.25799560546875, 1.4981689453125, 1.73834228515625, 1.978515625, 2.21868896484375, 2.4588623046875, 2.69903564453125, 2.939208984375, 3.17938232421875, 3.4195556640625, 3.65972900390625, 3.89990234375, 4.14007568359375, 4.3802490234375, 4.62042236328125, 4.860595703125, 5.10076904296875, 5.3409423828125, 5.58111572265625, 5.8212890625, 6.06146240234375, 6.3016357421875, 6.54180908203125, 6.781982421875, 7.02215576171875, 7.2623291015625, 7.50250244140625, 7.74267578125, 7.98284912109375, 8.2230224609375, 8.46319580078125, 8.703369140625, 8.94354248046875, 9.1837158203125, 9.42388916015625, 9.6640625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 4.0, 3.0, 9.0, 11.0, 16.0, 6.0, 12.0, 27.0, 22.0, 24.0, 35.0, 34.0, 43.0, 46.0, 39.0, 76.0, 81.0, 75.0, 58.0, 56.0, 32.0, 46.0, 51.0, 45.0, 31.0, 22.0, 17.0, 16.0, 18.0, 15.0, 5.0, 3.0, 8.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.7607421875, -1.7092132568359375, -1.657684326171875, -1.6061553955078125, -1.55462646484375, -1.5030975341796875, -1.451568603515625, -1.4000396728515625, -1.3485107421875, -1.2969818115234375, -1.245452880859375, -1.1939239501953125, -1.14239501953125, -1.0908660888671875, -1.039337158203125, -0.9878082275390625, -0.936279296875, -0.8847503662109375, -0.833221435546875, -0.7816925048828125, -0.73016357421875, -0.6786346435546875, -0.627105712890625, -0.5755767822265625, -0.5240478515625, -0.4725189208984375, -0.420989990234375, -0.3694610595703125, -0.31793212890625, -0.2664031982421875, -0.214874267578125, -0.1633453369140625, -0.11181640625, -0.0602874755859375, -0.008758544921875, 0.0427703857421875, 0.09429931640625, 0.1458282470703125, 0.197357177734375, 0.2488861083984375, 0.3004150390625, 0.3519439697265625, 0.403472900390625, 0.4550018310546875, 0.50653076171875, 0.5580596923828125, 0.609588623046875, 0.6611175537109375, 0.712646484375, 0.7641754150390625, 0.815704345703125, 0.8672332763671875, 0.91876220703125, 0.9702911376953125, 1.021820068359375, 1.0733489990234375, 1.1248779296875, 1.1764068603515625, 1.227935791015625, 1.2794647216796875, 1.33099365234375, 1.3825225830078125, 1.434051513671875, 1.4855804443359375, 1.537109375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 8.0, 3.0, 9.0, 14.0, 24.0, 25.0, 34.0, 51.0, 52.0, 73.0, 98.0, 134.0, 179.0, 240.0, 370.0, 596.0, 974.0, 1643.0, 3435.0, 8875.0, 33904.0, 3998485.0, 117762.0, 15947.0, 5392.0, 2411.0, 1241.0, 717.0, 418.0, 300.0, 202.0, 166.0, 121.0, 84.0, 70.0, 56.0, 42.0, 41.0, 21.0, 15.0, 14.0, 13.0, 7.0, 9.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.52734375, -4.384765625, -4.2421875, -4.099609375, -3.95703125, -3.814453125, -3.671875, -3.529296875, -3.38671875, -3.244140625, -3.1015625, -2.958984375, -2.81640625, -2.673828125, -2.53125, -2.388671875, -2.24609375, -2.103515625, -1.9609375, -1.818359375, -1.67578125, -1.533203125, -1.390625, -1.248046875, -1.10546875, -0.962890625, -0.8203125, -0.677734375, -0.53515625, -0.392578125, -0.25, -0.107421875, 0.03515625, 0.177734375, 0.3203125, 0.462890625, 0.60546875, 0.748046875, 0.890625, 1.033203125, 1.17578125, 1.318359375, 1.4609375, 1.603515625, 1.74609375, 1.888671875, 2.03125, 2.173828125, 2.31640625, 2.458984375, 2.6015625, 2.744140625, 2.88671875, 3.029296875, 3.171875, 3.314453125, 3.45703125, 3.599609375, 3.7421875, 3.884765625, 4.02734375, 4.169921875, 4.3125, 4.455078125, 4.59765625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 6.0, 6.0, 15.0, 18.0, 45.0, 184.0, 3606.0, 95.0, 38.0, 19.0, 15.0, 9.0, 3.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6181640625, -1.5695953369140625, -1.521026611328125, -1.4724578857421875, -1.42388916015625, -1.3753204345703125, -1.326751708984375, -1.2781829833984375, -1.2296142578125, -1.1810455322265625, -1.132476806640625, -1.0839080810546875, -1.03533935546875, -0.9867706298828125, -0.938201904296875, -0.8896331787109375, -0.841064453125, -0.7924957275390625, -0.743927001953125, -0.6953582763671875, -0.64678955078125, -0.5982208251953125, -0.549652099609375, -0.5010833740234375, -0.4525146484375, -0.4039459228515625, -0.355377197265625, -0.3068084716796875, -0.25823974609375, -0.2096710205078125, -0.161102294921875, -0.1125335693359375, -0.06396484375, -0.0153961181640625, 0.033172607421875, 0.0817413330078125, 0.13031005859375, 0.1788787841796875, 0.227447509765625, 0.2760162353515625, 0.3245849609375, 0.3731536865234375, 0.421722412109375, 0.4702911376953125, 0.51885986328125, 0.5674285888671875, 0.615997314453125, 0.6645660400390625, 0.713134765625, 0.7617034912109375, 0.810272216796875, 0.8588409423828125, 0.90740966796875, 0.9559783935546875, 1.004547119140625, 1.0531158447265625, 1.1016845703125, 1.1502532958984375, 1.198822021484375, 1.2473907470703125, 1.29595947265625, 1.3445281982421875, 1.393096923828125, 1.4416656494140625, 1.490234375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 14.0, 20.0, 29.0, 35.0, 59.0, 85.0, 81.0, 113.0, 124.0, 121.0, 87.0, 84.0, 59.0, 38.0, 9.0, 12.0, 8.0, 12.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.60648775100708, -3.470785617828369, -3.335083246231079, -3.199381113052368, -3.063678741455078, -2.927976608276367, -2.7922744750976562, -2.6565723419189453, -2.5208699703216553, -2.3851678371429443, -2.2494654655456543, -2.1137633323669434, -1.9780610799789429, -1.8423588275909424, -1.7066566944122314, -1.570954442024231, -1.4352521896362305, -1.29954993724823, -1.1638476848602295, -1.0281455516815186, -0.8924432992935181, -0.7567410469055176, -0.6210388541221619, -0.48533666133880615, -0.34963440895080566, -0.21393218636512756, -0.07822996377944946, 0.05747225880622864, 0.19317448139190674, 0.3288767337799072, 0.46457892656326294, 0.6002811193466187, 0.7359828948974609, 0.8716851472854614, 1.007387399673462, 1.1430895328521729, 1.2787917852401733, 1.4144940376281738, 1.5501961708068848, 1.6858984231948853, 1.8216006755828857, 1.9573029279708862, 2.0930051803588867, 2.2287073135375977, 2.3644094467163086, 2.5001118183135986, 2.6358139514923096, 2.7715163230895996, 2.9072184562683105, 3.0429205894470215, 3.1786229610443115, 3.3143250942230225, 3.4500274658203125, 3.5857295989990234, 3.7214317321777344, 3.8571338653564453, 3.9928362369537354, 4.128538608551025, 4.264240741729736, 4.399942874908447, 4.535645008087158, 4.671347618103027, 4.807049751281738, 4.942751884460449, 5.07845401763916]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 8.0, 5.0, 7.0, 8.0, 14.0, 13.0, 21.0, 12.0, 21.0, 27.0, 36.0, 36.0, 31.0, 33.0, 40.0, 37.0, 53.0, 45.0, 46.0, 31.0, 44.0, 48.0, 52.0, 39.0, 44.0, 28.0, 38.0, 29.0, 30.0, 21.0, 19.0, 19.0, 11.0, 13.0, 7.0, 6.0, 8.0, 6.0, 7.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.2738101482391357, -2.1979146003723145, -2.122018814086914, -2.0461232662200928, -1.970227599143982, -1.894331932067871, -1.8184363842010498, -1.742540717124939, -1.6666450500488281, -1.5907493829727173, -1.5148537158966064, -1.4389581680297852, -1.3630625009536743, -1.2871668338775635, -1.2112712860107422, -1.1353756189346313, -1.0594799518585205, -0.9835842847824097, -0.9076886773109436, -0.8317930698394775, -0.7558974027633667, -0.6800017356872559, -0.6041061282157898, -0.5282105207443237, -0.4523148536682129, -0.37641921639442444, -0.300523579120636, -0.22462794184684753, -0.14873230457305908, -0.07283666729927063, 0.0030589699745178223, 0.07895457744598389, 0.15485000610351562, 0.23074564337730408, 0.30664128065109253, 0.382536917924881, 0.45843255519866943, 0.5343282222747803, 0.6102238297462463, 0.6861194372177124, 0.7620151042938232, 0.8379107713699341, 0.9138063788414001, 0.9897019863128662, 1.065597653388977, 1.141493320465088, 1.2173888683319092, 1.29328453540802, 1.3691802024841309, 1.4450758695602417, 1.5209715366363525, 1.5968670845031738, 1.6727627515792847, 1.7486584186553955, 1.8245539665222168, 1.9004496335983276, 1.9763453006744385, 2.0522408485412598, 2.12813663482666, 2.2040321826934814, 2.2799277305603027, 2.355823516845703, 2.4317190647125244, 2.5076146125793457, 2.583510398864746]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 8.0, 8.0, 5.0, 17.0, 19.0, 27.0, 45.0, 58.0, 102.0, 138.0, 231.0, 402.0, 711.0, 1342.0, 2648.0, 5514.0, 13042.0, 33548.0, 101592.0, 327699.0, 372979.0, 121688.0, 39508.0, 14698.0, 6292.0, 2846.0, 1433.0, 792.0, 449.0, 238.0, 145.0, 107.0, 60.0, 54.0, 42.0, 13.0, 14.0, 10.0, 13.0, 7.0, 4.0, 5.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.67578125, -2.580474853515625, -2.48516845703125, -2.389862060546875, -2.2945556640625, -2.199249267578125, -2.10394287109375, -2.008636474609375, -1.913330078125, -1.818023681640625, -1.72271728515625, -1.627410888671875, -1.5321044921875, -1.436798095703125, -1.34149169921875, -1.246185302734375, -1.15087890625, -1.055572509765625, -0.96026611328125, -0.864959716796875, -0.7696533203125, -0.674346923828125, -0.57904052734375, -0.483734130859375, -0.388427734375, -0.293121337890625, -0.19781494140625, -0.102508544921875, -0.0072021484375, 0.088104248046875, 0.18341064453125, 0.278717041015625, 0.3740234375, 0.469329833984375, 0.56463623046875, 0.659942626953125, 0.7552490234375, 0.850555419921875, 0.94586181640625, 1.041168212890625, 1.136474609375, 1.231781005859375, 1.32708740234375, 1.422393798828125, 1.5177001953125, 1.613006591796875, 1.70831298828125, 1.803619384765625, 1.89892578125, 1.994232177734375, 2.08953857421875, 2.184844970703125, 2.2801513671875, 2.375457763671875, 2.47076416015625, 2.566070556640625, 2.661376953125, 2.756683349609375, 2.85198974609375, 2.947296142578125, 3.0426025390625, 3.137908935546875, 3.23321533203125, 3.328521728515625, 3.423828125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 6.0, 2.0, 6.0, 13.0, 13.0, 9.0, 13.0, 13.0, 34.0, 30.0, 36.0, 38.0, 51.0, 57.0, 53.0, 68.0, 89.0, 68.0, 74.0, 48.0, 51.0, 44.0, 45.0, 31.0, 32.0, 15.0, 16.0, 12.0, 10.0, 9.0, 7.0, 3.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.00390625, -1.94598388671875, -1.8880615234375, -1.83013916015625, -1.772216796875, -1.71429443359375, -1.6563720703125, -1.59844970703125, -1.54052734375, -1.48260498046875, -1.4246826171875, -1.36676025390625, -1.308837890625, -1.25091552734375, -1.1929931640625, -1.13507080078125, -1.0771484375, -1.01922607421875, -0.9613037109375, -0.90338134765625, -0.845458984375, -0.78753662109375, -0.7296142578125, -0.67169189453125, -0.61376953125, -0.55584716796875, -0.4979248046875, -0.44000244140625, -0.382080078125, -0.32415771484375, -0.2662353515625, -0.20831298828125, -0.150390625, -0.09246826171875, -0.0345458984375, 0.02337646484375, 0.081298828125, 0.13922119140625, 0.1971435546875, 0.25506591796875, 0.31298828125, 0.37091064453125, 0.4288330078125, 0.48675537109375, 0.544677734375, 0.60260009765625, 0.6605224609375, 0.71844482421875, 0.7763671875, 0.83428955078125, 0.8922119140625, 0.95013427734375, 1.008056640625, 1.06597900390625, 1.1239013671875, 1.18182373046875, 1.23974609375, 1.29766845703125, 1.3555908203125, 1.41351318359375, 1.471435546875, 1.52935791015625, 1.5872802734375, 1.64520263671875, 1.703125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 0.0, 7.0, 7.0, 14.0, 19.0, 24.0, 33.0, 48.0, 84.0, 146.0, 277.0, 494.0, 1155.0, 3108.0, 13031.0, 129243.0, 807384.0, 79185.0, 9684.0, 2530.0, 982.0, 460.0, 262.0, 134.0, 89.0, 58.0, 41.0, 20.0, 15.0, 9.0, 2.0, 2.0, 6.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.796875, -8.5552978515625, -8.313720703125, -8.0721435546875, -7.83056640625, -7.5889892578125, -7.347412109375, -7.1058349609375, -6.8642578125, -6.6226806640625, -6.381103515625, -6.1395263671875, -5.89794921875, -5.6563720703125, -5.414794921875, -5.1732177734375, -4.931640625, -4.6900634765625, -4.448486328125, -4.2069091796875, -3.96533203125, -3.7237548828125, -3.482177734375, -3.2406005859375, -2.9990234375, -2.7574462890625, -2.515869140625, -2.2742919921875, -2.03271484375, -1.7911376953125, -1.549560546875, -1.3079833984375, -1.06640625, -0.8248291015625, -0.583251953125, -0.3416748046875, -0.10009765625, 0.1414794921875, 0.383056640625, 0.6246337890625, 0.8662109375, 1.1077880859375, 1.349365234375, 1.5909423828125, 1.83251953125, 2.0740966796875, 2.315673828125, 2.5572509765625, 2.798828125, 3.0404052734375, 3.281982421875, 3.5235595703125, 3.76513671875, 4.0067138671875, 4.248291015625, 4.4898681640625, 4.7314453125, 4.9730224609375, 5.214599609375, 5.4561767578125, 5.69775390625, 5.9393310546875, 6.180908203125, 6.4224853515625, 6.6640625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 2.0, 4.0, 5.0, 8.0, 7.0, 19.0, 23.0, 51.0, 58.0, 58.0, 71.0, 84.0, 101.0, 86.0, 85.0, 78.0, 58.0, 56.0, 51.0, 31.0, 20.0, 9.0, 15.0, 7.0, 10.0, 4.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.8984375, -13.500244140625, -13.10205078125, -12.703857421875, -12.3056640625, -11.907470703125, -11.50927734375, -11.111083984375, -10.712890625, -10.314697265625, -9.91650390625, -9.518310546875, -9.1201171875, -8.721923828125, -8.32373046875, -7.925537109375, -7.52734375, -7.129150390625, -6.73095703125, -6.332763671875, -5.9345703125, -5.536376953125, -5.13818359375, -4.739990234375, -4.341796875, -3.943603515625, -3.54541015625, -3.147216796875, -2.7490234375, -2.350830078125, -1.95263671875, -1.554443359375, -1.15625, -0.758056640625, -0.35986328125, 0.038330078125, 0.4365234375, 0.834716796875, 1.23291015625, 1.631103515625, 2.029296875, 2.427490234375, 2.82568359375, 3.223876953125, 3.6220703125, 4.020263671875, 4.41845703125, 4.816650390625, 5.21484375, 5.613037109375, 6.01123046875, 6.409423828125, 6.8076171875, 7.205810546875, 7.60400390625, 8.002197265625, 8.400390625, 8.798583984375, 9.19677734375, 9.594970703125, 9.9931640625, 10.391357421875, 10.78955078125, 11.187744140625, 11.5859375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 4.0, 12.0, 14.0, 23.0, 30.0, 75.0, 133.0, 257.0, 825.0, 3154.0, 19630.0, 777060.0, 233908.0, 10289.0, 2078.0, 591.0, 229.0, 108.0, 52.0, 33.0, 12.0, 11.0, 7.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.23828125, -6.0855712890625, -5.932861328125, -5.7801513671875, -5.62744140625, -5.4747314453125, -5.322021484375, -5.1693115234375, -5.0166015625, -4.8638916015625, -4.711181640625, -4.5584716796875, -4.40576171875, -4.2530517578125, -4.100341796875, -3.9476318359375, -3.794921875, -3.6422119140625, -3.489501953125, -3.3367919921875, -3.18408203125, -3.0313720703125, -2.878662109375, -2.7259521484375, -2.5732421875, -2.4205322265625, -2.267822265625, -2.1151123046875, -1.96240234375, -1.8096923828125, -1.656982421875, -1.5042724609375, -1.3515625, -1.1988525390625, -1.046142578125, -0.8934326171875, -0.74072265625, -0.5880126953125, -0.435302734375, -0.2825927734375, -0.1298828125, 0.0228271484375, 0.175537109375, 0.3282470703125, 0.48095703125, 0.6336669921875, 0.786376953125, 0.9390869140625, 1.091796875, 1.2445068359375, 1.397216796875, 1.5499267578125, 1.70263671875, 1.8553466796875, 2.008056640625, 2.1607666015625, 2.3134765625, 2.4661865234375, 2.618896484375, 2.7716064453125, 2.92431640625, 3.0770263671875, 3.229736328125, 3.3824462890625, 3.53515625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 3.0, 4.0, 5.0, 4.0, 7.0, 9.0, 6.0, 25.0, 35.0, 73.0, 121.0, 167.0, 174.0, 151.0, 84.0, 55.0, 29.0, 15.0, 11.0, 9.0, 10.0, 4.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00033664703369140625, -0.00031998753547668457, -0.0003033280372619629, -0.0002866685390472412, -0.00027000904083251953, -0.00025334954261779785, -0.00023669004440307617, -0.0002200305461883545, -0.0002033710479736328, -0.00018671154975891113, -0.00017005205154418945, -0.00015339255332946777, -0.0001367330551147461, -0.00012007355690002441, -0.00010341405868530273, -8.675456047058105e-05, -7.009506225585938e-05, -5.3435564041137695e-05, -3.6776065826416016e-05, -2.0116567611694336e-05, -3.4570693969726562e-06, 1.3202428817749023e-05, 2.9861927032470703e-05, 4.652142524719238e-05, 6.318092346191406e-05, 7.984042167663574e-05, 9.649991989135742e-05, 0.0001131594181060791, 0.00012981891632080078, 0.00014647841453552246, 0.00016313791275024414, 0.00017979741096496582, 0.0001964569091796875, 0.00021311640739440918, 0.00022977590560913086, 0.00024643540382385254, 0.0002630949020385742, 0.0002797544002532959, 0.0002964138984680176, 0.00031307339668273926, 0.00032973289489746094, 0.0003463923931121826, 0.0003630518913269043, 0.000379711389541626, 0.00039637088775634766, 0.00041303038597106934, 0.000429689884185791, 0.0004463493824005127, 0.0004630088806152344, 0.00047966837882995605, 0.0004963278770446777, 0.0005129873752593994, 0.0005296468734741211, 0.0005463063716888428, 0.0005629658699035645, 0.0005796253681182861, 0.0005962848663330078, 0.0006129443645477295, 0.0006296038627624512, 0.0006462633609771729, 0.0006629228591918945, 0.0006795823574066162, 0.0006962418556213379, 0.0007129013538360596, 0.0007295608520507812]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 8.0, 18.0, 25.0, 49.0, 80.0, 171.0, 495.0, 1828.0, 14623.0, 817296.0, 205501.0, 6691.0, 1182.0, 304.0, 152.0, 54.0, 38.0, 18.0, 13.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.44140625, -5.2705078125, -5.099609375, -4.9287109375, -4.7578125, -4.5869140625, -4.416015625, -4.2451171875, -4.07421875, -3.9033203125, -3.732421875, -3.5615234375, -3.390625, -3.2197265625, -3.048828125, -2.8779296875, -2.70703125, -2.5361328125, -2.365234375, -2.1943359375, -2.0234375, -1.8525390625, -1.681640625, -1.5107421875, -1.33984375, -1.1689453125, -0.998046875, -0.8271484375, -0.65625, -0.4853515625, -0.314453125, -0.1435546875, 0.02734375, 0.1982421875, 0.369140625, 0.5400390625, 0.7109375, 0.8818359375, 1.052734375, 1.2236328125, 1.39453125, 1.5654296875, 1.736328125, 1.9072265625, 2.078125, 2.2490234375, 2.419921875, 2.5908203125, 2.76171875, 2.9326171875, 3.103515625, 3.2744140625, 3.4453125, 3.6162109375, 3.787109375, 3.9580078125, 4.12890625, 4.2998046875, 4.470703125, 4.6416015625, 4.8125, 4.9833984375, 5.154296875, 5.3251953125, 5.49609375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 1.0, 9.0, 15.0, 25.0, 88.0, 171.0, 291.0, 214.0, 108.0, 54.0, 10.0, 9.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.529296875, -3.318878173828125, -3.10845947265625, -2.898040771484375, -2.6876220703125, -2.477203369140625, -2.26678466796875, -2.056365966796875, -1.845947265625, -1.635528564453125, -1.42510986328125, -1.214691162109375, -1.0042724609375, -0.793853759765625, -0.58343505859375, -0.373016357421875, -0.16259765625, 0.047821044921875, 0.25823974609375, 0.468658447265625, 0.6790771484375, 0.889495849609375, 1.09991455078125, 1.310333251953125, 1.520751953125, 1.731170654296875, 1.94158935546875, 2.152008056640625, 2.3624267578125, 2.572845458984375, 2.78326416015625, 2.993682861328125, 3.2041015625, 3.414520263671875, 3.62493896484375, 3.835357666015625, 4.0457763671875, 4.256195068359375, 4.46661376953125, 4.677032470703125, 4.887451171875, 5.097869873046875, 5.30828857421875, 5.518707275390625, 5.7291259765625, 5.939544677734375, 6.14996337890625, 6.360382080078125, 6.57080078125, 6.781219482421875, 6.99163818359375, 7.202056884765625, 7.4124755859375, 7.622894287109375, 7.83331298828125, 8.043731689453125, 8.254150390625, 8.464569091796875, 8.67498779296875, 8.885406494140625, 9.0958251953125, 9.306243896484375, 9.51666259765625, 9.727081298828125, 9.9375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 9.0, 30.0, 48.0, 121.0, 262.0, 243.0, 143.0, 73.0, 37.0, 16.0, 5.0, 9.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.92731475830078, -57.61813735961914, -55.3089599609375, -52.99978256225586, -50.69060516357422, -48.38142776489258, -46.07225036621094, -43.76306915283203, -41.453895568847656, -39.144718170166016, -36.835540771484375, -34.526363372802734, -32.217185974121094, -29.908008575439453, -27.59882926940918, -25.28965187072754, -22.980472564697266, -20.671295166015625, -18.362117767333984, -16.052940368652344, -13.743762016296387, -11.434584617614746, -9.125406265258789, -6.816228866577148, -4.507051467895508, -2.197873830795288, 0.11130380630493164, 2.4204816818237305, 4.729659080505371, 7.038836479187012, 9.348014831542969, 11.65719223022461, 13.96636962890625, 16.27554702758789, 18.58472442626953, 20.893901824951172, 23.203079223632812, 25.512256622314453, 27.821435928344727, 30.130613327026367, 32.439788818359375, 34.748966217041016, 37.058143615722656, 39.3673210144043, 41.67649841308594, 43.98567581176758, 46.29485321044922, 48.604034423828125, 50.913211822509766, 53.222389221191406, 55.53156661987305, 57.84074401855469, 60.14992141723633, 62.45909881591797, 64.76828002929688, 67.07745361328125, 69.38663482666016, 71.69581604003906, 74.00498962402344, 76.31417083740234, 78.62334442138672, 80.93252563476562, 83.24169921875, 85.5508804321289, 87.86005401611328]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 7.0, 8.0, 12.0, 5.0, 8.0, 15.0, 13.0, 12.0, 23.0, 33.0, 39.0, 38.0, 55.0, 59.0, 51.0, 61.0, 61.0, 57.0, 48.0, 50.0, 45.0, 39.0, 45.0, 33.0, 37.0, 25.0, 23.0, 19.0, 13.0, 16.0, 12.0, 7.0, 6.0, 11.0, 3.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.09374237060547, -35.908870697021484, -34.724002838134766, -33.53913116455078, -32.35426330566406, -31.169391632080078, -29.984519958496094, -28.799650192260742, -27.61478042602539, -26.42991065979004, -25.245040893554688, -24.060169219970703, -22.87529945373535, -21.6904296875, -20.505558013916016, -19.320688247680664, -18.135818481445312, -16.95094871520996, -15.766077995300293, -14.581207275390625, -13.396337509155273, -12.211467742919922, -11.026597023010254, -9.841726303100586, -8.656856536865234, -7.471986293792725, -6.287116050720215, -5.102245807647705, -3.9173755645751953, -2.7325053215026855, -1.5476350784301758, -0.3627643585205078, 0.8221015930175781, 2.006971836090088, 3.1918420791625977, 4.376712322235107, 5.561582565307617, 6.746452808380127, 7.931323051452637, 9.116193771362305, 10.301063537597656, 11.485933303833008, 12.670804023742676, 13.855674743652344, 15.040544509887695, 16.225414276123047, 17.41028594970703, 18.595155715942383, 19.780025482177734, 20.964895248413086, 22.149765014648438, 23.334636688232422, 24.519506454467773, 25.704376220703125, 26.88924789428711, 28.07411766052246, 29.258987426757812, 30.443857192993164, 31.628726959228516, 32.8135986328125, 33.99846649169922, 35.1833381652832, 36.36820983886719, 37.553077697753906, 38.73794937133789]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 9.0, 8.0, 8.0, 19.0, 36.0, 48.0, 79.0, 116.0, 231.0, 401.0, 777.0, 2027.0, 7693.0, 4135063.0, 40592.0, 4545.0, 1285.0, 603.0, 294.0, 163.0, 97.0, 67.0, 33.0, 29.0, 20.0, 21.0, 7.0, 4.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.1484375, -9.88702392578125, -9.6256103515625, -9.36419677734375, -9.102783203125, -8.84136962890625, -8.5799560546875, -8.31854248046875, -8.05712890625, -7.79571533203125, -7.5343017578125, -7.27288818359375, -7.011474609375, -6.75006103515625, -6.4886474609375, -6.22723388671875, -5.9658203125, -5.70440673828125, -5.4429931640625, -5.18157958984375, -4.920166015625, -4.65875244140625, -4.3973388671875, -4.13592529296875, -3.87451171875, -3.61309814453125, -3.3516845703125, -3.09027099609375, -2.828857421875, -2.56744384765625, -2.3060302734375, -2.04461669921875, -1.783203125, -1.52178955078125, -1.2603759765625, -0.99896240234375, -0.737548828125, -0.47613525390625, -0.2147216796875, 0.04669189453125, 0.30810546875, 0.56951904296875, 0.8309326171875, 1.09234619140625, 1.353759765625, 1.61517333984375, 1.8765869140625, 2.13800048828125, 2.3994140625, 2.66082763671875, 2.9222412109375, 3.18365478515625, 3.445068359375, 3.70648193359375, 3.9678955078125, 4.22930908203125, 4.49072265625, 4.75213623046875, 5.0135498046875, 5.27496337890625, 5.536376953125, 5.79779052734375, 6.0592041015625, 6.32061767578125, 6.58203125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 2.0, 7.0, 7.0, 4.0, 8.0, 10.0, 13.0, 15.0, 10.0, 18.0, 24.0, 36.0, 30.0, 43.0, 43.0, 56.0, 56.0, 64.0, 78.0, 59.0, 55.0, 52.0, 42.0, 45.0, 42.0, 33.0, 30.0, 24.0, 17.0, 19.0, 12.0, 10.0, 10.0, 3.0, 5.0, 4.0, 7.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.8837890625, -1.824462890625, -1.76513671875, -1.705810546875, -1.646484375, -1.587158203125, -1.52783203125, -1.468505859375, -1.4091796875, -1.349853515625, -1.29052734375, -1.231201171875, -1.171875, -1.112548828125, -1.05322265625, -0.993896484375, -0.9345703125, -0.875244140625, -0.81591796875, -0.756591796875, -0.697265625, -0.637939453125, -0.57861328125, -0.519287109375, -0.4599609375, -0.400634765625, -0.34130859375, -0.281982421875, -0.22265625, -0.163330078125, -0.10400390625, -0.044677734375, 0.0146484375, 0.073974609375, 0.13330078125, 0.192626953125, 0.251953125, 0.311279296875, 0.37060546875, 0.429931640625, 0.4892578125, 0.548583984375, 0.60791015625, 0.667236328125, 0.7265625, 0.785888671875, 0.84521484375, 0.904541015625, 0.9638671875, 1.023193359375, 1.08251953125, 1.141845703125, 1.201171875, 1.260498046875, 1.31982421875, 1.379150390625, 1.4384765625, 1.497802734375, 1.55712890625, 1.616455078125, 1.67578125, 1.735107421875, 1.79443359375, 1.853759765625, 1.9130859375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 8.0, 3.0, 14.0, 13.0, 8.0, 21.0, 27.0, 32.0, 44.0, 90.0, 125.0, 193.0, 288.0, 483.0, 890.0, 1682.0, 3685.0, 10807.0, 98770.0, 4052740.0, 15302.0, 4515.0, 1998.0, 1006.0, 571.0, 337.0, 190.0, 142.0, 98.0, 60.0, 46.0, 30.0, 20.0, 18.0, 8.0, 5.0, 6.0, 3.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9140625, -4.75616455078125, -4.5982666015625, -4.44036865234375, -4.282470703125, -4.12457275390625, -3.9666748046875, -3.80877685546875, -3.65087890625, -3.49298095703125, -3.3350830078125, -3.17718505859375, -3.019287109375, -2.86138916015625, -2.7034912109375, -2.54559326171875, -2.3876953125, -2.22979736328125, -2.0718994140625, -1.91400146484375, -1.756103515625, -1.59820556640625, -1.4403076171875, -1.28240966796875, -1.12451171875, -0.96661376953125, -0.8087158203125, -0.65081787109375, -0.492919921875, -0.33502197265625, -0.1771240234375, -0.01922607421875, 0.138671875, 0.29656982421875, 0.4544677734375, 0.61236572265625, 0.770263671875, 0.92816162109375, 1.0860595703125, 1.24395751953125, 1.40185546875, 1.55975341796875, 1.7176513671875, 1.87554931640625, 2.033447265625, 2.19134521484375, 2.3492431640625, 2.50714111328125, 2.6650390625, 2.82293701171875, 2.9808349609375, 3.13873291015625, 3.296630859375, 3.45452880859375, 3.6124267578125, 3.77032470703125, 3.92822265625, 4.08612060546875, 4.2440185546875, 4.40191650390625, 4.559814453125, 4.71771240234375, 4.8756103515625, 5.03350830078125, 5.19140625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 5.0, 7.0, 7.0, 9.0, 22.0, 38.0, 3539.0, 394.0, 27.0, 17.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.369140625, -2.3197708129882812, -2.2704010009765625, -2.2210311889648438, -2.171661376953125, -2.1222915649414062, -2.0729217529296875, -2.0235519409179688, -1.97418212890625, -1.9248123168945312, -1.8754425048828125, -1.8260726928710938, -1.776702880859375, -1.7273330688476562, -1.6779632568359375, -1.6285934448242188, -1.5792236328125, -1.5298538208007812, -1.4804840087890625, -1.4311141967773438, -1.381744384765625, -1.3323745727539062, -1.2830047607421875, -1.2336349487304688, -1.18426513671875, -1.1348953247070312, -1.0855255126953125, -1.0361557006835938, -0.986785888671875, -0.9374160766601562, -0.8880462646484375, -0.8386764526367188, -0.789306640625, -0.7399368286132812, -0.6905670166015625, -0.6411972045898438, -0.591827392578125, -0.5424575805664062, -0.4930877685546875, -0.44371795654296875, -0.39434814453125, -0.34497833251953125, -0.2956085205078125, -0.24623870849609375, -0.196868896484375, -0.14749908447265625, -0.0981292724609375, -0.04875946044921875, 0.0006103515625, 0.04998016357421875, 0.0993499755859375, 0.14871978759765625, 0.198089599609375, 0.24745941162109375, 0.2968292236328125, 0.34619903564453125, 0.39556884765625, 0.44493865966796875, 0.4943084716796875, 0.5436782836914062, 0.593048095703125, 0.6424179077148438, 0.6917877197265625, 0.7411575317382812, 0.79052734375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 18.0, 71.0, 302.0, 483.0, 120.0, 8.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.93079948425293, -15.468399047851562, -15.005998611450195, -14.543598175048828, -14.081197738647461, -13.618797302246094, -13.156396865844727, -12.69399642944336, -12.231595993041992, -11.769195556640625, -11.306795120239258, -10.84439468383789, -10.381994247436523, -9.919593811035156, -9.457193374633789, -8.994792938232422, -8.532392501831055, -8.069992065429688, -7.60759162902832, -7.145191192626953, -6.682790756225586, -6.220390319824219, -5.757989883422852, -5.295589447021484, -4.833189964294434, -4.370789527893066, -3.908389091491699, -3.445988655090332, -2.983588218688965, -2.5211880207061768, -2.0587875843048096, -1.5963871479034424, -1.133986473083496, -0.6715860366821289, -0.2091856598854065, 0.2532147169113159, 0.7156151533126831, 1.1780154705047607, 1.640415906906128, 2.102816343307495, 2.5652167797088623, 3.0276172161102295, 3.4900176525115967, 3.9524178504943848, 4.414818286895752, 4.877218723297119, 5.339619159698486, 5.8020195960998535, 6.264420032501221, 6.726820468902588, 7.189220905303955, 7.651621341705322, 8.114021301269531, 8.576421737670898, 9.038822174072266, 9.501222610473633, 9.963623046875, 10.426023483276367, 10.888423919677734, 11.350824356079102, 11.813224792480469, 12.275625228881836, 12.738025665283203, 13.20042610168457, 13.662826538085938]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 9.0, 13.0, 13.0, 19.0, 14.0, 21.0, 23.0, 27.0, 20.0, 32.0, 41.0, 36.0, 43.0, 55.0, 44.0, 60.0, 50.0, 47.0, 51.0, 39.0, 47.0, 54.0, 32.0, 34.0, 32.0, 22.0, 31.0, 18.0, 14.0, 18.0, 10.0, 14.0, 2.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-3.122488498687744, -3.0384509563446045, -2.9544131755828857, -2.870375633239746, -2.7863378524780273, -2.7023003101348877, -2.618262529373169, -2.5342249870300293, -2.4501872062683105, -2.366149663925171, -2.282111883163452, -2.1980743408203125, -2.1140365600585938, -2.029999017715454, -1.9459612369537354, -1.8619236946105957, -1.7778860330581665, -1.6938483715057373, -1.609810709953308, -1.525773048400879, -1.4417353868484497, -1.3576977252960205, -1.2736601829528809, -1.189622402191162, -1.1055848598480225, -1.0215471982955933, -0.9375095367431641, -0.8534718751907349, -0.7694342136383057, -0.6853965520858765, -0.601358950138092, -0.5173212885856628, -0.43328356742858887, -0.34924590587615967, -0.26520824432373047, -0.18117061257362366, -0.09713295102119446, -0.013095289468765259, 0.07094234228134155, 0.15498000383377075, 0.23901766538619995, 0.32305532693862915, 0.40709298849105835, 0.49113062024116516, 0.575168251991272, 0.6592059135437012, 0.7432435750961304, 0.8272812366485596, 0.9113188982009888, 0.995356559753418, 1.0793942213058472, 1.1634318828582764, 1.2474695444107056, 1.3315072059631348, 1.4155447483062744, 1.4995825290679932, 1.5836200714111328, 1.667657732963562, 1.7516953945159912, 1.8357330560684204, 1.9197707176208496, 2.0038082599639893, 2.087846040725708, 2.1718835830688477, 2.2559213638305664]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 6.0, 8.0, 9.0, 20.0, 26.0, 38.0, 46.0, 65.0, 75.0, 144.0, 161.0, 275.0, 421.0, 638.0, 1009.0, 1709.0, 2993.0, 5601.0, 11098.0, 23538.0, 56806.0, 157733.0, 387155.0, 248034.0, 85312.0, 33674.0, 14974.0, 7409.0, 3908.0, 2129.0, 1230.0, 752.0, 473.0, 324.0, 237.0, 163.0, 104.0, 65.0, 53.0, 40.0, 29.0, 17.0, 17.0, 9.0, 10.0, 9.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.08984375, -2.992401123046875, -2.89495849609375, -2.797515869140625, -2.7000732421875, -2.602630615234375, -2.50518798828125, -2.407745361328125, -2.310302734375, -2.212860107421875, -2.11541748046875, -2.017974853515625, -1.9205322265625, -1.823089599609375, -1.72564697265625, -1.628204345703125, -1.53076171875, -1.433319091796875, -1.33587646484375, -1.238433837890625, -1.1409912109375, -1.043548583984375, -0.94610595703125, -0.848663330078125, -0.751220703125, -0.653778076171875, -0.55633544921875, -0.458892822265625, -0.3614501953125, -0.264007568359375, -0.16656494140625, -0.069122314453125, 0.0283203125, 0.125762939453125, 0.22320556640625, 0.320648193359375, 0.4180908203125, 0.515533447265625, 0.61297607421875, 0.710418701171875, 0.807861328125, 0.905303955078125, 1.00274658203125, 1.100189208984375, 1.1976318359375, 1.295074462890625, 1.39251708984375, 1.489959716796875, 1.58740234375, 1.684844970703125, 1.78228759765625, 1.879730224609375, 1.9771728515625, 2.074615478515625, 2.17205810546875, 2.269500732421875, 2.366943359375, 2.464385986328125, 2.56182861328125, 2.659271240234375, 2.7567138671875, 2.854156494140625, 2.95159912109375, 3.049041748046875, 3.146484375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 1.0, 9.0, 7.0, 7.0, 7.0, 16.0, 6.0, 11.0, 12.0, 20.0, 25.0, 37.0, 28.0, 42.0, 48.0, 53.0, 62.0, 54.0, 66.0, 70.0, 62.0, 60.0, 55.0, 38.0, 25.0, 27.0, 31.0, 32.0, 16.0, 15.0, 11.0, 9.0, 8.0, 6.0, 5.0, 6.0, 4.0, 6.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8408203125, -1.7787017822265625, -1.716583251953125, -1.6544647216796875, -1.59234619140625, -1.5302276611328125, -1.468109130859375, -1.4059906005859375, -1.3438720703125, -1.2817535400390625, -1.219635009765625, -1.1575164794921875, -1.09539794921875, -1.0332794189453125, -0.971160888671875, -0.9090423583984375, -0.846923828125, -0.7848052978515625, -0.722686767578125, -0.6605682373046875, -0.59844970703125, -0.5363311767578125, -0.474212646484375, -0.4120941162109375, -0.3499755859375, -0.2878570556640625, -0.225738525390625, -0.1636199951171875, -0.10150146484375, -0.0393829345703125, 0.022735595703125, 0.0848541259765625, 0.14697265625, 0.2090911865234375, 0.271209716796875, 0.3333282470703125, 0.39544677734375, 0.4575653076171875, 0.519683837890625, 0.5818023681640625, 0.6439208984375, 0.7060394287109375, 0.768157958984375, 0.8302764892578125, 0.89239501953125, 0.9545135498046875, 1.016632080078125, 1.0787506103515625, 1.140869140625, 1.2029876708984375, 1.265106201171875, 1.3272247314453125, 1.38934326171875, 1.4514617919921875, 1.513580322265625, 1.5756988525390625, 1.6378173828125, 1.6999359130859375, 1.762054443359375, 1.8241729736328125, 1.88629150390625, 1.9484100341796875, 2.010528564453125, 2.0726470947265625, 2.134765625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 5.0, 5.0, 23.0, 25.0, 52.0, 105.0, 197.0, 413.0, 1036.0, 3088.0, 16361.0, 374411.0, 624234.0, 22786.0, 3774.0, 1137.0, 450.0, 213.0, 107.0, 46.0, 32.0, 22.0, 10.0, 9.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.15625, -9.858154296875, -9.56005859375, -9.261962890625, -8.9638671875, -8.665771484375, -8.36767578125, -8.069580078125, -7.771484375, -7.473388671875, -7.17529296875, -6.877197265625, -6.5791015625, -6.281005859375, -5.98291015625, -5.684814453125, -5.38671875, -5.088623046875, -4.79052734375, -4.492431640625, -4.1943359375, -3.896240234375, -3.59814453125, -3.300048828125, -3.001953125, -2.703857421875, -2.40576171875, -2.107666015625, -1.8095703125, -1.511474609375, -1.21337890625, -0.915283203125, -0.6171875, -0.319091796875, -0.02099609375, 0.277099609375, 0.5751953125, 0.873291015625, 1.17138671875, 1.469482421875, 1.767578125, 2.065673828125, 2.36376953125, 2.661865234375, 2.9599609375, 3.258056640625, 3.55615234375, 3.854248046875, 4.15234375, 4.450439453125, 4.74853515625, 5.046630859375, 5.3447265625, 5.642822265625, 5.94091796875, 6.239013671875, 6.537109375, 6.835205078125, 7.13330078125, 7.431396484375, 7.7294921875, 8.027587890625, 8.32568359375, 8.623779296875, 8.921875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 9.0, 5.0, 7.0, 10.0, 16.0, 16.0, 17.0, 12.0, 32.0, 32.0, 40.0, 58.0, 48.0, 62.0, 65.0, 58.0, 67.0, 61.0, 66.0, 46.0, 35.0, 41.0, 32.0, 44.0, 21.0, 26.0, 26.0, 11.0, 13.0, 7.0, 5.0, 4.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-12.7890625, -12.46453857421875, -12.1400146484375, -11.81549072265625, -11.490966796875, -11.16644287109375, -10.8419189453125, -10.51739501953125, -10.19287109375, -9.86834716796875, -9.5438232421875, -9.21929931640625, -8.894775390625, -8.57025146484375, -8.2457275390625, -7.92120361328125, -7.5966796875, -7.27215576171875, -6.9476318359375, -6.62310791015625, -6.298583984375, -5.97406005859375, -5.6495361328125, -5.32501220703125, -5.00048828125, -4.67596435546875, -4.3514404296875, -4.02691650390625, -3.702392578125, -3.37786865234375, -3.0533447265625, -2.72882080078125, -2.404296875, -2.07977294921875, -1.7552490234375, -1.43072509765625, -1.106201171875, -0.78167724609375, -0.4571533203125, -0.13262939453125, 0.19189453125, 0.51641845703125, 0.8409423828125, 1.16546630859375, 1.489990234375, 1.81451416015625, 2.1390380859375, 2.46356201171875, 2.7880859375, 3.11260986328125, 3.4371337890625, 3.76165771484375, 4.086181640625, 4.41070556640625, 4.7352294921875, 5.05975341796875, 5.38427734375, 5.70880126953125, 6.0333251953125, 6.35784912109375, 6.682373046875, 7.00689697265625, 7.3314208984375, 7.65594482421875, 7.98046875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 7.0, 6.0, 11.0, 21.0, 40.0, 72.0, 259.0, 748.0, 3602.0, 109699.0, 926168.0, 6268.0, 1137.0, 312.0, 101.0, 52.0, 18.0, 13.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.88671875, -7.51361083984375, -7.1405029296875, -6.76739501953125, -6.394287109375, -6.02117919921875, -5.6480712890625, -5.27496337890625, -4.90185546875, -4.52874755859375, -4.1556396484375, -3.78253173828125, -3.409423828125, -3.03631591796875, -2.6632080078125, -2.29010009765625, -1.9169921875, -1.54388427734375, -1.1707763671875, -0.79766845703125, -0.424560546875, -0.05145263671875, 0.3216552734375, 0.69476318359375, 1.06787109375, 1.44097900390625, 1.8140869140625, 2.18719482421875, 2.560302734375, 2.93341064453125, 3.3065185546875, 3.67962646484375, 4.052734375, 4.42584228515625, 4.7989501953125, 5.17205810546875, 5.545166015625, 5.91827392578125, 6.2913818359375, 6.66448974609375, 7.03759765625, 7.41070556640625, 7.7838134765625, 8.15692138671875, 8.530029296875, 8.90313720703125, 9.2762451171875, 9.64935302734375, 10.0224609375, 10.39556884765625, 10.7686767578125, 11.14178466796875, 11.514892578125, 11.88800048828125, 12.2611083984375, 12.63421630859375, 13.00732421875, 13.38043212890625, 13.7535400390625, 14.12664794921875, 14.499755859375, 14.87286376953125, 15.2459716796875, 15.61907958984375, 15.9921875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 7.0, 10.0, 17.0, 23.0, 36.0, 88.0, 171.0, 228.0, 188.0, 101.0, 60.0, 29.0, 10.0, 6.0, 8.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0008711814880371094, -0.0008473619818687439, -0.0008235424757003784, -0.0007997229695320129, -0.0007759034633636475, -0.000752083957195282, -0.0007282644510269165, -0.000704444944858551, -0.0006806254386901855, -0.0006568059325218201, -0.0006329864263534546, -0.0006091669201850891, -0.0005853474140167236, -0.0005615279078483582, -0.0005377084016799927, -0.0005138888955116272, -0.0004900693893432617, -0.00046624988317489624, -0.00044243037700653076, -0.0004186108708381653, -0.0003947913646697998, -0.0003709718585014343, -0.00034715235233306885, -0.00032333284616470337, -0.0002995133399963379, -0.0002756938338279724, -0.00025187432765960693, -0.00022805482149124146, -0.00020423531532287598, -0.0001804158091545105, -0.00015659630298614502, -0.00013277679681777954, -0.00010895729064941406, -8.513778448104858e-05, -6.13182783126831e-05, -3.749877214431763e-05, -1.3679265975952148e-05, 1.014024019241333e-05, 3.395974636077881e-05, 5.777925252914429e-05, 8.159875869750977e-05, 0.00010541826486587524, 0.00012923777103424072, 0.0001530572772026062, 0.00017687678337097168, 0.00020069628953933716, 0.00022451579570770264, 0.0002483353018760681, 0.0002721548080444336, 0.00029597431421279907, 0.00031979382038116455, 0.00034361332654953003, 0.0003674328327178955, 0.000391252338886261, 0.00041507184505462646, 0.00043889135122299194, 0.0004627108573913574, 0.0004865303635597229, 0.0005103498697280884, 0.0005341693758964539, 0.0005579888820648193, 0.0005818083882331848, 0.0006056278944015503, 0.0006294474005699158, 0.0006532669067382812]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 3.0, 8.0, 13.0, 18.0, 20.0, 32.0, 58.0, 100.0, 188.0, 361.0, 696.0, 1853.0, 6694.0, 90886.0, 924728.0, 17216.0, 3358.0, 1235.0, 537.0, 233.0, 118.0, 76.0, 37.0, 31.0, 17.0, 15.0, 5.0, 6.0, 2.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.81640625, -6.59112548828125, -6.3658447265625, -6.14056396484375, -5.915283203125, -5.69000244140625, -5.4647216796875, -5.23944091796875, -5.01416015625, -4.78887939453125, -4.5635986328125, -4.33831787109375, -4.113037109375, -3.88775634765625, -3.6624755859375, -3.43719482421875, -3.2119140625, -2.98663330078125, -2.7613525390625, -2.53607177734375, -2.310791015625, -2.08551025390625, -1.8602294921875, -1.63494873046875, -1.40966796875, -1.18438720703125, -0.9591064453125, -0.73382568359375, -0.508544921875, -0.28326416015625, -0.0579833984375, 0.16729736328125, 0.392578125, 0.61785888671875, 0.8431396484375, 1.06842041015625, 1.293701171875, 1.51898193359375, 1.7442626953125, 1.96954345703125, 2.19482421875, 2.42010498046875, 2.6453857421875, 2.87066650390625, 3.095947265625, 3.32122802734375, 3.5465087890625, 3.77178955078125, 3.9970703125, 4.22235107421875, 4.4476318359375, 4.67291259765625, 4.898193359375, 5.12347412109375, 5.3487548828125, 5.57403564453125, 5.79931640625, 6.02459716796875, 6.2498779296875, 6.47515869140625, 6.700439453125, 6.92572021484375, 7.1510009765625, 7.37628173828125, 7.6015625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 5.0, 2.0, 2.0, 2.0, 7.0, 9.0, 12.0, 38.0, 115.0, 346.0, 297.0, 89.0, 26.0, 13.0, 6.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 4.0, 1.0], "bins": [-17.5, -17.1265869140625, -16.753173828125, -16.3797607421875, -16.00634765625, -15.6329345703125, -15.259521484375, -14.8861083984375, -14.5126953125, -14.1392822265625, -13.765869140625, -13.3924560546875, -13.01904296875, -12.6456298828125, -12.272216796875, -11.8988037109375, -11.525390625, -11.1519775390625, -10.778564453125, -10.4051513671875, -10.03173828125, -9.6583251953125, -9.284912109375, -8.9114990234375, -8.5380859375, -8.1646728515625, -7.791259765625, -7.4178466796875, -7.04443359375, -6.6710205078125, -6.297607421875, -5.9241943359375, -5.55078125, -5.1773681640625, -4.803955078125, -4.4305419921875, -4.05712890625, -3.6837158203125, -3.310302734375, -2.9368896484375, -2.5634765625, -2.1900634765625, -1.816650390625, -1.4432373046875, -1.06982421875, -0.6964111328125, -0.322998046875, 0.0504150390625, 0.423828125, 0.7972412109375, 1.170654296875, 1.5440673828125, 1.91748046875, 2.2908935546875, 2.664306640625, 3.0377197265625, 3.4111328125, 3.7845458984375, 4.157958984375, 4.5313720703125, 4.90478515625, 5.2781982421875, 5.651611328125, 6.0250244140625, 6.3984375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 7.0, 15.0, 32.0, 72.0, 192.0, 303.0, 241.0, 101.0, 34.0, 8.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-132.70132446289062, -129.462158203125, -126.22298431396484, -122.98381805419922, -119.74464416503906, -116.50547790527344, -113.26631164550781, -110.02714538574219, -106.78797149658203, -103.5488052368164, -100.30963134765625, -97.07046508789062, -93.831298828125, -90.59212493896484, -87.35295867919922, -84.11378479003906, -80.87461853027344, -77.63545227050781, -74.39627838134766, -71.15711212158203, -67.91793823242188, -64.67877197265625, -61.439605712890625, -58.200435638427734, -54.961265563964844, -51.72209548950195, -48.48292541503906, -45.24375915527344, -42.00458908081055, -38.765419006347656, -35.52625274658203, -32.28708267211914, -29.04790496826172, -25.808734893798828, -22.56956672668457, -19.330398559570312, -16.091228485107422, -12.852058410644531, -9.612890243530273, -6.373722076416016, -3.134552001953125, 0.10461711883544922, 3.3437862396240234, 6.582955360412598, 9.822124481201172, 13.061294555664062, 16.30046272277832, 19.539630889892578, 22.77880096435547, 26.01797103881836, 29.257139205932617, 32.496307373046875, 35.735477447509766, 38.974647521972656, 42.21381378173828, 45.45298385620117, 48.69215393066406, 51.93132400512695, 55.170494079589844, 58.40966033935547, 61.64883041381836, 64.88800048828125, 68.12716674804688, 71.3663330078125, 74.60550689697266]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 7.0, 5.0, 6.0, 6.0, 11.0, 15.0, 21.0, 25.0, 31.0, 27.0, 24.0, 37.0, 37.0, 25.0, 28.0, 38.0, 44.0, 54.0, 54.0, 45.0, 51.0, 46.0, 34.0, 43.0, 34.0, 36.0, 28.0, 32.0, 32.0, 25.0, 18.0, 17.0, 13.0, 5.0, 12.0, 6.0, 8.0, 7.0, 3.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0], "bins": [-52.13043212890625, -50.757164001464844, -49.38389587402344, -48.01062774658203, -46.637359619140625, -45.26408767700195, -43.89081954956055, -42.51755142211914, -41.144283294677734, -39.77101516723633, -38.39774703979492, -37.024478912353516, -35.651206970214844, -34.27793884277344, -32.90467071533203, -31.531402587890625, -30.15813446044922, -28.784866333007812, -27.411598205566406, -26.038328170776367, -24.66506004333496, -23.291791915893555, -21.918521881103516, -20.54525375366211, -19.171985626220703, -17.798717498779297, -16.42544937133789, -15.052179336547852, -13.678911209106445, -12.305643081665039, -10.932374000549316, -9.559104919433594, -8.185836791992188, -6.812568187713623, -5.439299583435059, -4.066030979156494, -2.6927623748779297, -1.3194937705993652, 0.05377483367919922, 1.4270439147949219, 2.800312042236328, 4.173580646514893, 5.546849250793457, 6.9201178550720215, 8.293386459350586, 9.666654586791992, 11.039923667907715, 12.413192749023438, 13.786460876464844, 15.15972900390625, 16.532997131347656, 17.906267166137695, 19.2795352935791, 20.652803421020508, 22.026073455810547, 23.399341583251953, 24.77260971069336, 26.145877838134766, 27.519145965576172, 28.89241600036621, 30.265684127807617, 31.638952255249023, 33.01222229003906, 34.38549041748047, 35.758758544921875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 8.0, 5.0, 6.0, 8.0, 15.0, 18.0, 15.0, 27.0, 32.0, 58.0, 78.0, 125.0, 198.0, 387.0, 811.0, 1876.0, 6661.0, 88012.0, 4077930.0, 13086.0, 2796.0, 1035.0, 474.0, 238.0, 113.0, 83.0, 57.0, 34.0, 23.0, 12.0, 18.0, 11.0, 4.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-8.7421875, -8.442626953125, -8.14306640625, -7.843505859375, -7.5439453125, -7.244384765625, -6.94482421875, -6.645263671875, -6.345703125, -6.046142578125, -5.74658203125, -5.447021484375, -5.1474609375, -4.847900390625, -4.54833984375, -4.248779296875, -3.94921875, -3.649658203125, -3.35009765625, -3.050537109375, -2.7509765625, -2.451416015625, -2.15185546875, -1.852294921875, -1.552734375, -1.253173828125, -0.95361328125, -0.654052734375, -0.3544921875, -0.054931640625, 0.24462890625, 0.544189453125, 0.84375, 1.143310546875, 1.44287109375, 1.742431640625, 2.0419921875, 2.341552734375, 2.64111328125, 2.940673828125, 3.240234375, 3.539794921875, 3.83935546875, 4.138916015625, 4.4384765625, 4.738037109375, 5.03759765625, 5.337158203125, 5.63671875, 5.936279296875, 6.23583984375, 6.535400390625, 6.8349609375, 7.134521484375, 7.43408203125, 7.733642578125, 8.033203125, 8.332763671875, 8.63232421875, 8.931884765625, 9.2314453125, 9.531005859375, 9.83056640625, 10.130126953125, 10.4296875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 4.0, 1.0, 6.0, 6.0, 10.0, 17.0, 16.0, 20.0, 35.0, 47.0, 47.0, 60.0, 76.0, 89.0, 84.0, 91.0, 78.0, 77.0, 60.0, 55.0, 30.0, 30.0, 17.0, 14.0, 8.0, 8.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4921875, -3.39892578125, -3.3056640625, -3.21240234375, -3.119140625, -3.02587890625, -2.9326171875, -2.83935546875, -2.74609375, -2.65283203125, -2.5595703125, -2.46630859375, -2.373046875, -2.27978515625, -2.1865234375, -2.09326171875, -2.0, -1.90673828125, -1.8134765625, -1.72021484375, -1.626953125, -1.53369140625, -1.4404296875, -1.34716796875, -1.25390625, -1.16064453125, -1.0673828125, -0.97412109375, -0.880859375, -0.78759765625, -0.6943359375, -0.60107421875, -0.5078125, -0.41455078125, -0.3212890625, -0.22802734375, -0.134765625, -0.04150390625, 0.0517578125, 0.14501953125, 0.23828125, 0.33154296875, 0.4248046875, 0.51806640625, 0.611328125, 0.70458984375, 0.7978515625, 0.89111328125, 0.984375, 1.07763671875, 1.1708984375, 1.26416015625, 1.357421875, 1.45068359375, 1.5439453125, 1.63720703125, 1.73046875, 1.82373046875, 1.9169921875, 2.01025390625, 2.103515625, 2.19677734375, 2.2900390625, 2.38330078125, 2.4765625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 4.0, 5.0, 4.0, 17.0, 15.0, 14.0, 24.0, 32.0, 38.0, 36.0, 47.0, 69.0, 91.0, 110.0, 129.0, 179.0, 247.0, 287.0, 426.0, 936.0, 12164.0, 4167871.0, 9008.0, 782.0, 367.0, 297.0, 245.0, 178.0, 140.0, 124.0, 73.0, 69.0, 59.0, 35.0, 37.0, 24.0, 31.0, 10.0, 18.0, 12.0, 5.0, 12.0, 5.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-26.015625, -25.16162109375, -24.3076171875, -23.45361328125, -22.599609375, -21.74560546875, -20.8916015625, -20.03759765625, -19.18359375, -18.32958984375, -17.4755859375, -16.62158203125, -15.767578125, -14.91357421875, -14.0595703125, -13.20556640625, -12.3515625, -11.49755859375, -10.6435546875, -9.78955078125, -8.935546875, -8.08154296875, -7.2275390625, -6.37353515625, -5.51953125, -4.66552734375, -3.8115234375, -2.95751953125, -2.103515625, -1.24951171875, -0.3955078125, 0.45849609375, 1.3125, 2.16650390625, 3.0205078125, 3.87451171875, 4.728515625, 5.58251953125, 6.4365234375, 7.29052734375, 8.14453125, 8.99853515625, 9.8525390625, 10.70654296875, 11.560546875, 12.41455078125, 13.2685546875, 14.12255859375, 14.9765625, 15.83056640625, 16.6845703125, 17.53857421875, 18.392578125, 19.24658203125, 20.1005859375, 20.95458984375, 21.80859375, 22.66259765625, 23.5166015625, 24.37060546875, 25.224609375, 26.07861328125, 26.9326171875, 27.78662109375, 28.640625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 8.0, 65.0, 3902.0, 94.0, 13.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3515625, -7.7801513671875, -7.208740234375, -6.6373291015625, -6.06591796875, -5.4945068359375, -4.923095703125, -4.3516845703125, -3.7802734375, -3.2088623046875, -2.637451171875, -2.0660400390625, -1.49462890625, -0.9232177734375, -0.351806640625, 0.2196044921875, 0.791015625, 1.3624267578125, 1.933837890625, 2.5052490234375, 3.07666015625, 3.6480712890625, 4.219482421875, 4.7908935546875, 5.3623046875, 5.9337158203125, 6.505126953125, 7.0765380859375, 7.64794921875, 8.2193603515625, 8.790771484375, 9.3621826171875, 9.93359375, 10.5050048828125, 11.076416015625, 11.6478271484375, 12.21923828125, 12.7906494140625, 13.362060546875, 13.9334716796875, 14.5048828125, 15.0762939453125, 15.647705078125, 16.2191162109375, 16.79052734375, 17.3619384765625, 17.933349609375, 18.5047607421875, 19.076171875, 19.6475830078125, 20.218994140625, 20.7904052734375, 21.36181640625, 21.9332275390625, 22.504638671875, 23.0760498046875, 23.6474609375, 24.2188720703125, 24.790283203125, 25.3616943359375, 25.93310546875, 26.5045166015625, 27.075927734375, 27.6473388671875, 28.21875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 0.0, 3.0, 9.0, 26.0, 54.0, 128.0, 301.0, 275.0, 129.0, 52.0, 20.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.75062084197998, -13.301531791687012, -11.85244369506836, -10.40335464477539, -8.954265594482422, -7.5051774978637695, -6.056088447570801, -4.607000350952148, -3.1579113006591797, -1.7088226079940796, -0.2597339153289795, 1.1893548965454102, 2.6384434700012207, 4.087532043457031, 5.53662109375, 6.985709190368652, 8.434798240661621, 9.88388729095459, 11.332975387573242, 12.782064437866211, 14.23115348815918, 15.680241584777832, 17.129329681396484, 18.578418731689453, 20.027507781982422, 21.47659683227539, 22.92568588256836, 24.374774932861328, 25.823862075805664, 27.272951126098633, 28.7220401763916, 30.171127319335938, 31.620220184326172, 33.06930923461914, 34.51839828491211, 35.96748733520508, 37.41657638549805, 38.86566162109375, 40.31475067138672, 41.76383972167969, 43.212928771972656, 44.662017822265625, 46.111106872558594, 47.56019592285156, 49.00928497314453, 50.4583740234375, 51.90746307373047, 53.35654830932617, 54.805641174316406, 56.254730224609375, 57.703819274902344, 59.15290832519531, 60.60199737548828, 62.05108642578125, 63.50017547607422, 64.94926452636719, 66.39834594726562, 67.8474349975586, 69.29652404785156, 70.74561309814453, 72.1947021484375, 73.64379119873047, 75.09288024902344, 76.5419692993164, 77.99105834960938]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 2.0, 8.0, 14.0, 22.0, 26.0, 39.0, 50.0, 85.0, 94.0, 118.0, 130.0, 120.0, 95.0, 61.0, 48.0, 29.0, 18.0, 20.0, 7.0, 6.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.21601867675781, -45.784751892089844, -44.353485107421875, -42.922218322753906, -41.49095153808594, -40.059688568115234, -38.628421783447266, -37.1971549987793, -35.76588821411133, -34.33462142944336, -32.90335464477539, -31.472089767456055, -30.040822982788086, -28.609556198120117, -27.17829132080078, -25.747024536132812, -24.315757751464844, -22.884490966796875, -21.453224182128906, -20.02195930480957, -18.5906925201416, -17.159425735473633, -15.72815990447998, -14.296894073486328, -12.86562728881836, -11.43436050415039, -10.003094673156738, -8.571828842163086, -7.140562057495117, -5.709295749664307, -4.278029441833496, -2.8467636108398438, -1.415496826171875, 0.015769481658935547, 1.447035789489746, 2.8783020973205566, 4.309568405151367, 5.740834712982178, 7.172101020812988, 8.60336685180664, 10.03463363647461, 11.465900421142578, 12.89716625213623, 14.328432083129883, 15.759698867797852, 17.19096565246582, 18.622230529785156, 20.053497314453125, 21.484764099121094, 22.916030883789062, 24.34729766845703, 25.778562545776367, 27.209829330444336, 28.641096115112305, 30.07236099243164, 31.50362777709961, 32.93489456176758, 34.36616134643555, 35.797428131103516, 37.228694915771484, 38.65995788574219, 40.091224670410156, 41.522491455078125, 42.953758239746094, 44.38502502441406]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 6.0, 2.0, 6.0, 5.0, 7.0, 18.0, 18.0, 35.0, 44.0, 66.0, 81.0, 162.0, 299.0, 513.0, 1033.0, 2141.0, 5540.0, 16192.0, 61003.0, 322169.0, 499952.0, 101564.0, 24340.0, 7686.0, 2891.0, 1278.0, 595.0, 345.0, 191.0, 146.0, 83.0, 54.0, 29.0, 21.0, 18.0, 6.0, 10.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.7734375, -5.59393310546875, -5.4144287109375, -5.23492431640625, -5.055419921875, -4.87591552734375, -4.6964111328125, -4.51690673828125, -4.33740234375, -4.15789794921875, -3.9783935546875, -3.79888916015625, -3.619384765625, -3.43988037109375, -3.2603759765625, -3.08087158203125, -2.9013671875, -2.72186279296875, -2.5423583984375, -2.36285400390625, -2.183349609375, -2.00384521484375, -1.8243408203125, -1.64483642578125, -1.46533203125, -1.28582763671875, -1.1063232421875, -0.92681884765625, -0.747314453125, -0.56781005859375, -0.3883056640625, -0.20880126953125, -0.029296875, 0.15020751953125, 0.3297119140625, 0.50921630859375, 0.688720703125, 0.86822509765625, 1.0477294921875, 1.22723388671875, 1.40673828125, 1.58624267578125, 1.7657470703125, 1.94525146484375, 2.124755859375, 2.30426025390625, 2.4837646484375, 2.66326904296875, 2.8427734375, 3.02227783203125, 3.2017822265625, 3.38128662109375, 3.560791015625, 3.74029541015625, 3.9197998046875, 4.09930419921875, 4.27880859375, 4.45831298828125, 4.6378173828125, 4.81732177734375, 4.996826171875, 5.17633056640625, 5.3558349609375, 5.53533935546875, 5.71484375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 6.0, 6.0, 7.0, 11.0, 13.0, 24.0, 24.0, 51.0, 62.0, 85.0, 88.0, 94.0, 84.0, 95.0, 94.0, 66.0, 46.0, 42.0, 25.0, 26.0, 22.0, 15.0, 6.0, 5.0, 4.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.33984375, -4.2012939453125, -4.062744140625, -3.9241943359375, -3.78564453125, -3.6470947265625, -3.508544921875, -3.3699951171875, -3.2314453125, -3.0928955078125, -2.954345703125, -2.8157958984375, -2.67724609375, -2.5386962890625, -2.400146484375, -2.2615966796875, -2.123046875, -1.9844970703125, -1.845947265625, -1.7073974609375, -1.56884765625, -1.4302978515625, -1.291748046875, -1.1531982421875, -1.0146484375, -0.8760986328125, -0.737548828125, -0.5989990234375, -0.46044921875, -0.3218994140625, -0.183349609375, -0.0447998046875, 0.09375, 0.2322998046875, 0.370849609375, 0.5093994140625, 0.64794921875, 0.7864990234375, 0.925048828125, 1.0635986328125, 1.2021484375, 1.3406982421875, 1.479248046875, 1.6177978515625, 1.75634765625, 1.8948974609375, 2.033447265625, 2.1719970703125, 2.310546875, 2.4490966796875, 2.587646484375, 2.7261962890625, 2.86474609375, 3.0032958984375, 3.141845703125, 3.2803955078125, 3.4189453125, 3.5574951171875, 3.696044921875, 3.8345947265625, 3.97314453125, 4.1116943359375, 4.250244140625, 4.3887939453125, 4.52734375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 8.0, 7.0, 14.0, 28.0, 37.0, 70.0, 150.0, 345.0, 965.0, 9069.0, 1021038.0, 14905.0, 1159.0, 390.0, 161.0, 85.0, 47.0, 23.0, 17.0, 5.0, 7.0, 4.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-33.59375, -32.529296875, -31.46484375, -30.400390625, -29.3359375, -28.271484375, -27.20703125, -26.142578125, -25.078125, -24.013671875, -22.94921875, -21.884765625, -20.8203125, -19.755859375, -18.69140625, -17.626953125, -16.5625, -15.498046875, -14.43359375, -13.369140625, -12.3046875, -11.240234375, -10.17578125, -9.111328125, -8.046875, -6.982421875, -5.91796875, -4.853515625, -3.7890625, -2.724609375, -1.66015625, -0.595703125, 0.46875, 1.533203125, 2.59765625, 3.662109375, 4.7265625, 5.791015625, 6.85546875, 7.919921875, 8.984375, 10.048828125, 11.11328125, 12.177734375, 13.2421875, 14.306640625, 15.37109375, 16.435546875, 17.5, 18.564453125, 19.62890625, 20.693359375, 21.7578125, 22.822265625, 23.88671875, 24.951171875, 26.015625, 27.080078125, 28.14453125, 29.208984375, 30.2734375, 31.337890625, 32.40234375, 33.466796875, 34.53125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 10.0, 27.0, 60.0, 114.0, 122.0, 176.0, 192.0, 125.0, 88.0, 59.0, 16.0, 12.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.59375, -24.41943359375, -23.2451171875, -22.07080078125, -20.896484375, -19.72216796875, -18.5478515625, -17.37353515625, -16.19921875, -15.02490234375, -13.8505859375, -12.67626953125, -11.501953125, -10.32763671875, -9.1533203125, -7.97900390625, -6.8046875, -5.63037109375, -4.4560546875, -3.28173828125, -2.107421875, -0.93310546875, 0.2412109375, 1.41552734375, 2.58984375, 3.76416015625, 4.9384765625, 6.11279296875, 7.287109375, 8.46142578125, 9.6357421875, 10.81005859375, 11.984375, 13.15869140625, 14.3330078125, 15.50732421875, 16.681640625, 17.85595703125, 19.0302734375, 20.20458984375, 21.37890625, 22.55322265625, 23.7275390625, 24.90185546875, 26.076171875, 27.25048828125, 28.4248046875, 29.59912109375, 30.7734375, 31.94775390625, 33.1220703125, 34.29638671875, 35.470703125, 36.64501953125, 37.8193359375, 38.99365234375, 40.16796875, 41.34228515625, 42.5166015625, 43.69091796875, 44.865234375, 46.03955078125, 47.2138671875, 48.38818359375, 49.5625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 7.0, 7.0, 14.0, 32.0, 49.0, 74.0, 172.0, 413.0, 1478.0, 14116.0, 954592.0, 73274.0, 3111.0, 713.0, 242.0, 113.0, 48.0, 29.0, 22.0, 8.0, 7.0, 6.0, 2.0, 9.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.59765625, -5.3880615234375, -5.178466796875, -4.9688720703125, -4.75927734375, -4.5496826171875, -4.340087890625, -4.1304931640625, -3.9208984375, -3.7113037109375, -3.501708984375, -3.2921142578125, -3.08251953125, -2.8729248046875, -2.663330078125, -2.4537353515625, -2.244140625, -2.0345458984375, -1.824951171875, -1.6153564453125, -1.40576171875, -1.1961669921875, -0.986572265625, -0.7769775390625, -0.5673828125, -0.3577880859375, -0.148193359375, 0.0614013671875, 0.27099609375, 0.4805908203125, 0.690185546875, 0.8997802734375, 1.109375, 1.3189697265625, 1.528564453125, 1.7381591796875, 1.94775390625, 2.1573486328125, 2.366943359375, 2.5765380859375, 2.7861328125, 2.9957275390625, 3.205322265625, 3.4149169921875, 3.62451171875, 3.8341064453125, 4.043701171875, 4.2532958984375, 4.462890625, 4.6724853515625, 4.882080078125, 5.0916748046875, 5.30126953125, 5.5108642578125, 5.720458984375, 5.9300537109375, 6.1396484375, 6.3492431640625, 6.558837890625, 6.7684326171875, 6.97802734375, 7.1876220703125, 7.397216796875, 7.6068115234375, 7.81640625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 3.0, 10.0, 7.0, 10.0, 15.0, 36.0, 42.0, 79.0, 99.0, 143.0, 169.0, 131.0, 93.0, 49.0, 35.0, 21.0, 17.0, 16.0, 8.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0004391670227050781, -0.0004211738705635071, -0.00040318071842193604, -0.000385187566280365, -0.00036719441413879395, -0.0003492012619972229, -0.00033120810985565186, -0.0003132149577140808, -0.00029522180557250977, -0.0002772286534309387, -0.0002592355012893677, -0.00024124234914779663, -0.00022324919700622559, -0.00020525604486465454, -0.0001872628927230835, -0.00016926974058151245, -0.0001512765884399414, -0.00013328343629837036, -0.00011529028415679932, -9.729713201522827e-05, -7.930397987365723e-05, -6.131082773208618e-05, -4.331767559051514e-05, -2.5324523448944092e-05, -7.331371307373047e-06, 1.0661780834197998e-05, 2.8654932975769043e-05, 4.664808511734009e-05, 6.464123725891113e-05, 8.263438940048218e-05, 0.00010062754154205322, 0.00011862069368362427, 0.0001366138458251953, 0.00015460699796676636, 0.0001726001501083374, 0.00019059330224990845, 0.0002085864543914795, 0.00022657960653305054, 0.0002445727586746216, 0.0002625659108161926, 0.00028055906295776367, 0.0002985522150993347, 0.00031654536724090576, 0.0003345385193824768, 0.00035253167152404785, 0.0003705248236656189, 0.00038851797580718994, 0.000406511127948761, 0.00042450428009033203, 0.0004424974322319031, 0.0004604905843734741, 0.00047848373651504517, 0.0004964768886566162, 0.0005144700407981873, 0.0005324631929397583, 0.0005504563450813293, 0.0005684494972229004, 0.0005864426493644714, 0.0006044358015060425, 0.0006224289536476135, 0.0006404221057891846, 0.0006584152579307556, 0.0006764084100723267, 0.0006944015622138977, 0.0007123947143554688]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 8.0, 15.0, 39.0, 106.0, 274.0, 1195.0, 15404.0, 1006491.0, 23151.0, 1386.0, 329.0, 76.0, 30.0, 20.0, 18.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.5625, -11.2969970703125, -11.031494140625, -10.7659912109375, -10.50048828125, -10.2349853515625, -9.969482421875, -9.7039794921875, -9.4384765625, -9.1729736328125, -8.907470703125, -8.6419677734375, -8.37646484375, -8.1109619140625, -7.845458984375, -7.5799560546875, -7.314453125, -7.0489501953125, -6.783447265625, -6.5179443359375, -6.25244140625, -5.9869384765625, -5.721435546875, -5.4559326171875, -5.1904296875, -4.9249267578125, -4.659423828125, -4.3939208984375, -4.12841796875, -3.8629150390625, -3.597412109375, -3.3319091796875, -3.06640625, -2.8009033203125, -2.535400390625, -2.2698974609375, -2.00439453125, -1.7388916015625, -1.473388671875, -1.2078857421875, -0.9423828125, -0.6768798828125, -0.411376953125, -0.1458740234375, 0.11962890625, 0.3851318359375, 0.650634765625, 0.9161376953125, 1.181640625, 1.4471435546875, 1.712646484375, 1.9781494140625, 2.24365234375, 2.5091552734375, 2.774658203125, 3.0401611328125, 3.3056640625, 3.5711669921875, 3.836669921875, 4.1021728515625, 4.36767578125, 4.6331787109375, 4.898681640625, 5.1641845703125, 5.4296875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 7.0, 0.0, 6.0, 12.0, 7.0, 13.0, 22.0, 28.0, 21.0, 40.0, 48.0, 89.0, 85.0, 104.0, 125.0, 97.0, 66.0, 57.0, 48.0, 25.0, 25.0, 18.0, 12.0, 14.0, 4.0, 5.0, 5.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.599609375, -3.502777099609375, -3.40594482421875, -3.309112548828125, -3.2122802734375, -3.115447998046875, -3.01861572265625, -2.921783447265625, -2.824951171875, -2.728118896484375, -2.63128662109375, -2.534454345703125, -2.4376220703125, -2.340789794921875, -2.24395751953125, -2.147125244140625, -2.05029296875, -1.953460693359375, -1.85662841796875, -1.759796142578125, -1.6629638671875, -1.566131591796875, -1.46929931640625, -1.372467041015625, -1.275634765625, -1.178802490234375, -1.08197021484375, -0.985137939453125, -0.8883056640625, -0.791473388671875, -0.69464111328125, -0.597808837890625, -0.5009765625, -0.404144287109375, -0.30731201171875, -0.210479736328125, -0.1136474609375, -0.016815185546875, 0.08001708984375, 0.176849365234375, 0.273681640625, 0.370513916015625, 0.46734619140625, 0.564178466796875, 0.6610107421875, 0.757843017578125, 0.85467529296875, 0.951507568359375, 1.04833984375, 1.145172119140625, 1.24200439453125, 1.338836669921875, 1.4356689453125, 1.532501220703125, 1.62933349609375, 1.726165771484375, 1.822998046875, 1.919830322265625, 2.01666259765625, 2.113494873046875, 2.2103271484375, 2.307159423828125, 2.40399169921875, 2.500823974609375, 2.59765625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 9.0, 21.0, 105.0, 435.0, 328.0, 84.0, 19.0, 9.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-341.6352233886719, -334.0104675292969, -326.3857116699219, -318.7609558105469, -311.1361999511719, -303.511474609375, -295.88671875, -288.261962890625, -280.63720703125, -273.012451171875, -265.3876953125, -257.762939453125, -250.13819885253906, -242.51344299316406, -234.88868713378906, -227.26393127441406, -219.63917541503906, -212.01441955566406, -204.38966369628906, -196.76492309570312, -189.14016723632812, -181.51541137695312, -173.89065551757812, -166.26589965820312, -158.64114379882812, -151.01638793945312, -143.39163208007812, -135.76687622070312, -128.1421356201172, -120.51737976074219, -112.89262390136719, -105.26786804199219, -97.64312744140625, -90.01837158203125, -82.39362335205078, -74.76886749267578, -67.14411926269531, -59.51936340332031, -51.89460754394531, -44.26985549926758, -36.645103454589844, -29.02035140991211, -21.395597457885742, -13.770843505859375, -6.146091461181641, 1.4786605834960938, 9.103416442871094, 16.728168487548828, 24.352920532226562, 31.977672576904297, 39.60242462158203, 47.22718048095703, 54.851932525634766, 62.4766845703125, 70.1014404296875, 77.7261962890625, 85.35094451904297, 92.97570037841797, 100.60044860839844, 108.22520446777344, 115.84996032714844, 123.4747085571289, 131.09945678710938, 138.72421264648438, 146.34896850585938]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 4.0, 0.0, 4.0, 4.0, 3.0, 9.0, 7.0, 10.0, 14.0, 11.0, 21.0, 24.0, 26.0, 25.0, 26.0, 27.0, 33.0, 29.0, 44.0, 51.0, 62.0, 53.0, 52.0, 48.0, 45.0, 50.0, 43.0, 44.0, 42.0, 38.0, 23.0, 22.0, 17.0, 19.0, 14.0, 9.0, 10.0, 17.0, 7.0, 6.0, 10.0, 2.0, 4.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-55.12194061279297, -53.03818893432617, -50.95444107055664, -48.870689392089844, -46.78694152832031, -44.703189849853516, -42.61943817138672, -40.53569030761719, -38.45193862915039, -36.368186950683594, -34.28443908691406, -32.200687408447266, -30.1169376373291, -28.033187866210938, -25.94943618774414, -23.865686416625977, -21.781936645507812, -19.69818687438965, -17.614437103271484, -15.530685424804688, -13.446935653686523, -11.36318588256836, -9.279435157775879, -7.195684432983398, -5.111934661865234, -3.028184413909912, -0.9444341659545898, 1.1393160820007324, 3.2230663299560547, 5.306816101074219, 7.390566825866699, 9.47431755065918, 11.558074951171875, 13.641824722290039, 15.72557544708252, 17.809326171875, 19.893075942993164, 21.976825714111328, 24.060577392578125, 26.14432716369629, 28.228076934814453, 30.311826705932617, 32.39557647705078, 34.47932815551758, 36.563079833984375, 38.646827697753906, 40.7305793762207, 42.8143310546875, 44.89807891845703, 46.98183059692383, 49.06557846069336, 51.149330139160156, 53.23307800292969, 55.316829681396484, 57.40058135986328, 59.48432922363281, 61.56808090209961, 63.651832580566406, 65.73558044433594, 67.81932830810547, 69.90308380126953, 71.98683166503906, 74.0705795288086, 76.15433502197266, 78.23808288574219]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 5.0, 2.0, 3.0, 3.0, 5.0, 8.0, 8.0, 7.0, 25.0, 21.0, 45.0, 65.0, 110.0, 182.0, 307.0, 583.0, 1108.0, 2541.0, 6299.0, 19261.0, 100632.0, 3499742.0, 506107.0, 39752.0, 10725.0, 3760.0, 1543.0, 669.0, 367.0, 193.0, 91.0, 50.0, 31.0, 19.0, 4.0, 3.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4609375, -5.29412841796875, -5.1273193359375, -4.96051025390625, -4.793701171875, -4.62689208984375, -4.4600830078125, -4.29327392578125, -4.12646484375, -3.95965576171875, -3.7928466796875, -3.62603759765625, -3.459228515625, -3.29241943359375, -3.1256103515625, -2.95880126953125, -2.7919921875, -2.62518310546875, -2.4583740234375, -2.29156494140625, -2.124755859375, -1.95794677734375, -1.7911376953125, -1.62432861328125, -1.45751953125, -1.29071044921875, -1.1239013671875, -0.95709228515625, -0.790283203125, -0.62347412109375, -0.4566650390625, -0.28985595703125, -0.123046875, 0.04376220703125, 0.2105712890625, 0.37738037109375, 0.544189453125, 0.71099853515625, 0.8778076171875, 1.04461669921875, 1.21142578125, 1.37823486328125, 1.5450439453125, 1.71185302734375, 1.878662109375, 2.04547119140625, 2.2122802734375, 2.37908935546875, 2.5458984375, 2.71270751953125, 2.8795166015625, 3.04632568359375, 3.213134765625, 3.37994384765625, 3.5467529296875, 3.71356201171875, 3.88037109375, 4.04718017578125, 4.2139892578125, 4.38079833984375, 4.547607421875, 4.71441650390625, 4.8812255859375, 5.04803466796875, 5.21484375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 8.0, 5.0, 10.0, 9.0, 16.0, 16.0, 22.0, 18.0, 31.0, 48.0, 43.0, 46.0, 41.0, 69.0, 75.0, 83.0, 75.0, 68.0, 60.0, 61.0, 38.0, 43.0, 23.0, 23.0, 19.0, 18.0, 8.0, 9.0, 7.0, 4.0, 3.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.87890625, -2.786712646484375, -2.69451904296875, -2.602325439453125, -2.5101318359375, -2.417938232421875, -2.32574462890625, -2.233551025390625, -2.141357421875, -2.049163818359375, -1.95697021484375, -1.864776611328125, -1.7725830078125, -1.680389404296875, -1.58819580078125, -1.496002197265625, -1.40380859375, -1.311614990234375, -1.21942138671875, -1.127227783203125, -1.0350341796875, -0.942840576171875, -0.85064697265625, -0.758453369140625, -0.666259765625, -0.574066162109375, -0.48187255859375, -0.389678955078125, -0.2974853515625, -0.205291748046875, -0.11309814453125, -0.020904541015625, 0.0712890625, 0.163482666015625, 0.25567626953125, 0.347869873046875, 0.4400634765625, 0.532257080078125, 0.62445068359375, 0.716644287109375, 0.808837890625, 0.901031494140625, 0.99322509765625, 1.085418701171875, 1.1776123046875, 1.269805908203125, 1.36199951171875, 1.454193115234375, 1.54638671875, 1.638580322265625, 1.73077392578125, 1.822967529296875, 1.9151611328125, 2.007354736328125, 2.09954833984375, 2.191741943359375, 2.283935546875, 2.376129150390625, 2.46832275390625, 2.560516357421875, 2.6527099609375, 2.744903564453125, 2.83709716796875, 2.929290771484375, 3.021484375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 7.0, 1.0, 6.0, 8.0, 11.0, 23.0, 66.0, 153.0, 296.0, 809.0, 3936.0, 74441.0, 4063712.0, 46894.0, 2844.0, 631.0, 220.0, 114.0, 50.0, 32.0, 15.0, 5.0, 4.0, 3.0, 5.0, 0.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.890625, -11.44091796875, -10.9912109375, -10.54150390625, -10.091796875, -9.64208984375, -9.1923828125, -8.74267578125, -8.29296875, -7.84326171875, -7.3935546875, -6.94384765625, -6.494140625, -6.04443359375, -5.5947265625, -5.14501953125, -4.6953125, -4.24560546875, -3.7958984375, -3.34619140625, -2.896484375, -2.44677734375, -1.9970703125, -1.54736328125, -1.09765625, -0.64794921875, -0.1982421875, 0.25146484375, 0.701171875, 1.15087890625, 1.6005859375, 2.05029296875, 2.5, 2.94970703125, 3.3994140625, 3.84912109375, 4.298828125, 4.74853515625, 5.1982421875, 5.64794921875, 6.09765625, 6.54736328125, 6.9970703125, 7.44677734375, 7.896484375, 8.34619140625, 8.7958984375, 9.24560546875, 9.6953125, 10.14501953125, 10.5947265625, 11.04443359375, 11.494140625, 11.94384765625, 12.3935546875, 12.84326171875, 13.29296875, 13.74267578125, 14.1923828125, 14.64208984375, 15.091796875, 15.54150390625, 15.9912109375, 16.44091796875, 16.890625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 5.0, 9.0, 9.0, 17.0, 19.0, 35.0, 47.0, 48.0, 113.0, 293.0, 1345.0, 1452.0, 371.0, 115.0, 53.0, 42.0, 29.0, 20.0, 16.0, 11.0, 11.0, 6.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-12.3671875, -12.0927734375, -11.818359375, -11.5439453125, -11.26953125, -10.9951171875, -10.720703125, -10.4462890625, -10.171875, -9.8974609375, -9.623046875, -9.3486328125, -9.07421875, -8.7998046875, -8.525390625, -8.2509765625, -7.9765625, -7.7021484375, -7.427734375, -7.1533203125, -6.87890625, -6.6044921875, -6.330078125, -6.0556640625, -5.78125, -5.5068359375, -5.232421875, -4.9580078125, -4.68359375, -4.4091796875, -4.134765625, -3.8603515625, -3.5859375, -3.3115234375, -3.037109375, -2.7626953125, -2.48828125, -2.2138671875, -1.939453125, -1.6650390625, -1.390625, -1.1162109375, -0.841796875, -0.5673828125, -0.29296875, -0.0185546875, 0.255859375, 0.5302734375, 0.8046875, 1.0791015625, 1.353515625, 1.6279296875, 1.90234375, 2.1767578125, 2.451171875, 2.7255859375, 3.0, 3.2744140625, 3.548828125, 3.8232421875, 4.09765625, 4.3720703125, 4.646484375, 4.9208984375, 5.1953125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 6.0, 2.0, 8.0, 18.0, 36.0, 104.0, 209.0, 348.0, 179.0, 57.0, 17.0, 8.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.36531066894531, -66.52143859863281, -63.67756271362305, -60.83368682861328, -57.989810943603516, -55.14593505859375, -52.30206298828125, -49.458187103271484, -46.61431121826172, -43.77043533325195, -40.92656326293945, -38.08268737792969, -35.23881149291992, -32.394935607910156, -29.551063537597656, -26.70718765258789, -23.86331558227539, -21.019441604614258, -18.175565719604492, -15.33169174194336, -12.48781681060791, -9.643941879272461, -6.800067901611328, -3.9561920166015625, -1.1123180389404297, 1.7315566539764404, 4.5754313468933105, 7.419305801391602, 10.26318073272705, 13.1070556640625, 15.950929641723633, 18.7948055267334, 21.63867950439453, 24.482553482055664, 27.32642936706543, 30.170303344726562, 33.01417922973633, 35.858055114746094, 38.701927185058594, 41.54580307006836, 44.389678955078125, 47.23355484008789, 50.07742691040039, 52.921302795410156, 55.76517868041992, 58.60905456542969, 61.45292663574219, 64.29679870605469, 67.14067077636719, 69.98454284667969, 72.82842254638672, 75.67229461669922, 78.51616668701172, 81.36004638671875, 84.20391845703125, 87.04779052734375, 89.89167022705078, 92.73554229736328, 95.57942199707031, 98.42329406738281, 101.26716613769531, 104.11104583740234, 106.95491790771484, 109.79879760742188, 112.64266967773438]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 8.0, 7.0, 18.0, 29.0, 32.0, 32.0, 54.0, 46.0, 69.0, 81.0, 91.0, 89.0, 81.0, 82.0, 66.0, 51.0, 38.0, 36.0, 22.0, 16.0, 12.0, 15.0, 10.0, 5.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-60.63743209838867, -58.96272659301758, -57.28802490234375, -55.613319396972656, -53.93861389160156, -52.26390838623047, -50.58920669555664, -48.91450119018555, -47.23979568481445, -45.56509017944336, -43.89038848876953, -42.21568298339844, -40.540977478027344, -38.86627197265625, -37.19157028198242, -35.51686477661133, -33.8421630859375, -32.167457580566406, -30.492753982543945, -28.818050384521484, -27.14334487915039, -25.46864128112793, -23.79393768310547, -22.119232177734375, -20.44452667236328, -18.76982307434082, -17.095117568969727, -15.420413970947266, -13.745708465576172, -12.071004867553711, -10.396300315856934, -8.721595764160156, -7.0468902587890625, -5.372185707092285, -3.697481393814087, -2.0227770805358887, -0.34807252883911133, 1.3266315460205078, 3.001336097717285, 4.6760406494140625, 6.35074520111084, 8.025449752807617, 9.700154304504395, 11.374858856201172, 13.049562454223633, 14.72426700592041, 16.398971557617188, 18.07367706298828, 19.748380661010742, 21.423084259033203, 23.097789764404297, 24.772493362426758, 26.44719886779785, 28.121902465820312, 29.796607971191406, 31.471311569213867, 33.14601516723633, 34.82072067260742, 36.49542236328125, 38.170127868652344, 39.84483337402344, 41.51953887939453, 43.19424057006836, 44.86894607543945, 46.54365158081055]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 7.0, 4.0, 16.0, 18.0, 25.0, 44.0, 58.0, 102.0, 152.0, 320.0, 598.0, 1217.0, 2652.0, 6498.0, 19466.0, 68058.0, 271237.0, 475106.0, 145198.0, 38116.0, 11826.0, 4218.0, 1797.0, 821.0, 418.0, 228.0, 134.0, 79.0, 48.0, 30.0, 20.0, 9.0, 14.0, 5.0, 5.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.5546875, -4.4090576171875, -4.263427734375, -4.1177978515625, -3.97216796875, -3.8265380859375, -3.680908203125, -3.5352783203125, -3.3896484375, -3.2440185546875, -3.098388671875, -2.9527587890625, -2.80712890625, -2.6614990234375, -2.515869140625, -2.3702392578125, -2.224609375, -2.0789794921875, -1.933349609375, -1.7877197265625, -1.64208984375, -1.4964599609375, -1.350830078125, -1.2052001953125, -1.0595703125, -0.9139404296875, -0.768310546875, -0.6226806640625, -0.47705078125, -0.3314208984375, -0.185791015625, -0.0401611328125, 0.10546875, 0.2510986328125, 0.396728515625, 0.5423583984375, 0.68798828125, 0.8336181640625, 0.979248046875, 1.1248779296875, 1.2705078125, 1.4161376953125, 1.561767578125, 1.7073974609375, 1.85302734375, 1.9986572265625, 2.144287109375, 2.2899169921875, 2.435546875, 2.5811767578125, 2.726806640625, 2.8724365234375, 3.01806640625, 3.1636962890625, 3.309326171875, 3.4549560546875, 3.6005859375, 3.7462158203125, 3.891845703125, 4.0374755859375, 4.18310546875, 4.3287353515625, 4.474365234375, 4.6199951171875, 4.765625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 5.0, 8.0, 12.0, 12.0, 20.0, 18.0, 24.0, 35.0, 43.0, 42.0, 56.0, 61.0, 52.0, 56.0, 55.0, 61.0, 64.0, 53.0, 58.0, 46.0, 43.0, 34.0, 17.0, 25.0, 31.0, 15.0, 8.0, 7.0, 10.0, 10.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.671875, -2.594970703125, -2.51806640625, -2.441162109375, -2.3642578125, -2.287353515625, -2.21044921875, -2.133544921875, -2.056640625, -1.979736328125, -1.90283203125, -1.825927734375, -1.7490234375, -1.672119140625, -1.59521484375, -1.518310546875, -1.44140625, -1.364501953125, -1.28759765625, -1.210693359375, -1.1337890625, -1.056884765625, -0.97998046875, -0.903076171875, -0.826171875, -0.749267578125, -0.67236328125, -0.595458984375, -0.5185546875, -0.441650390625, -0.36474609375, -0.287841796875, -0.2109375, -0.134033203125, -0.05712890625, 0.019775390625, 0.0966796875, 0.173583984375, 0.25048828125, 0.327392578125, 0.404296875, 0.481201171875, 0.55810546875, 0.635009765625, 0.7119140625, 0.788818359375, 0.86572265625, 0.942626953125, 1.01953125, 1.096435546875, 1.17333984375, 1.250244140625, 1.3271484375, 1.404052734375, 1.48095703125, 1.557861328125, 1.634765625, 1.711669921875, 1.78857421875, 1.865478515625, 1.9423828125, 2.019287109375, 2.09619140625, 2.173095703125, 2.25]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 5.0, 3.0, 8.0, 14.0, 11.0, 39.0, 55.0, 62.0, 138.0, 259.0, 551.0, 1231.0, 4115.0, 33568.0, 852192.0, 144722.0, 8116.0, 1969.0, 730.0, 356.0, 179.0, 98.0, 70.0, 32.0, 16.0, 6.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-16.515625, -16.11962890625, -15.7236328125, -15.32763671875, -14.931640625, -14.53564453125, -14.1396484375, -13.74365234375, -13.34765625, -12.95166015625, -12.5556640625, -12.15966796875, -11.763671875, -11.36767578125, -10.9716796875, -10.57568359375, -10.1796875, -9.78369140625, -9.3876953125, -8.99169921875, -8.595703125, -8.19970703125, -7.8037109375, -7.40771484375, -7.01171875, -6.61572265625, -6.2197265625, -5.82373046875, -5.427734375, -5.03173828125, -4.6357421875, -4.23974609375, -3.84375, -3.44775390625, -3.0517578125, -2.65576171875, -2.259765625, -1.86376953125, -1.4677734375, -1.07177734375, -0.67578125, -0.27978515625, 0.1162109375, 0.51220703125, 0.908203125, 1.30419921875, 1.7001953125, 2.09619140625, 2.4921875, 2.88818359375, 3.2841796875, 3.68017578125, 4.076171875, 4.47216796875, 4.8681640625, 5.26416015625, 5.66015625, 6.05615234375, 6.4521484375, 6.84814453125, 7.244140625, 7.64013671875, 8.0361328125, 8.43212890625, 8.828125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 3.0, 10.0, 8.0, 20.0, 15.0, 27.0, 33.0, 43.0, 50.0, 46.0, 65.0, 63.0, 73.0, 73.0, 82.0, 73.0, 57.0, 53.0, 44.0, 41.0, 23.0, 25.0, 26.0, 13.0, 11.0, 8.0, 5.0, 4.0, 5.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.171875, -18.6983642578125, -18.224853515625, -17.7513427734375, -17.27783203125, -16.8043212890625, -16.330810546875, -15.8572998046875, -15.3837890625, -14.9102783203125, -14.436767578125, -13.9632568359375, -13.48974609375, -13.0162353515625, -12.542724609375, -12.0692138671875, -11.595703125, -11.1221923828125, -10.648681640625, -10.1751708984375, -9.70166015625, -9.2281494140625, -8.754638671875, -8.2811279296875, -7.8076171875, -7.3341064453125, -6.860595703125, -6.3870849609375, -5.91357421875, -5.4400634765625, -4.966552734375, -4.4930419921875, -4.01953125, -3.5460205078125, -3.072509765625, -2.5989990234375, -2.12548828125, -1.6519775390625, -1.178466796875, -0.7049560546875, -0.2314453125, 0.2420654296875, 0.715576171875, 1.1890869140625, 1.66259765625, 2.1361083984375, 2.609619140625, 3.0831298828125, 3.556640625, 4.0301513671875, 4.503662109375, 4.9771728515625, 5.45068359375, 5.9241943359375, 6.397705078125, 6.8712158203125, 7.3447265625, 7.8182373046875, 8.291748046875, 8.7652587890625, 9.23876953125, 9.7122802734375, 10.185791015625, 10.6593017578125, 11.1328125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 7.0, 2.0, 13.0, 15.0, 16.0, 15.0, 30.0, 50.0, 92.0, 131.0, 315.0, 737.0, 2140.0, 9409.0, 100068.0, 863947.0, 61443.0, 7178.0, 1752.0, 620.0, 254.0, 129.0, 64.0, 41.0, 26.0, 24.0, 13.0, 9.0, 2.0, 4.0, 4.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.47265625, -2.36236572265625, -2.2520751953125, -2.14178466796875, -2.031494140625, -1.92120361328125, -1.8109130859375, -1.70062255859375, -1.59033203125, -1.48004150390625, -1.3697509765625, -1.25946044921875, -1.149169921875, -1.03887939453125, -0.9285888671875, -0.81829833984375, -0.7080078125, -0.59771728515625, -0.4874267578125, -0.37713623046875, -0.266845703125, -0.15655517578125, -0.0462646484375, 0.06402587890625, 0.17431640625, 0.28460693359375, 0.3948974609375, 0.50518798828125, 0.615478515625, 0.72576904296875, 0.8360595703125, 0.94635009765625, 1.056640625, 1.16693115234375, 1.2772216796875, 1.38751220703125, 1.497802734375, 1.60809326171875, 1.7183837890625, 1.82867431640625, 1.93896484375, 2.04925537109375, 2.1595458984375, 2.26983642578125, 2.380126953125, 2.49041748046875, 2.6007080078125, 2.71099853515625, 2.8212890625, 2.93157958984375, 3.0418701171875, 3.15216064453125, 3.262451171875, 3.37274169921875, 3.4830322265625, 3.59332275390625, 3.70361328125, 3.81390380859375, 3.9241943359375, 4.03448486328125, 4.144775390625, 4.25506591796875, 4.3653564453125, 4.47564697265625, 4.5859375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 16.0, 15.0, 28.0, 25.0, 46.0, 62.0, 105.0, 107.0, 155.0, 130.0, 95.0, 51.0, 46.0, 32.0, 23.0, 20.0, 11.0, 9.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006422996520996094, -0.0006246790289878845, -0.0006070584058761597, -0.0005894377827644348, -0.00057181715965271, -0.0005541965365409851, -0.0005365759134292603, -0.0005189552903175354, -0.0005013346672058105, -0.0004837140440940857, -0.00046609342098236084, -0.000448472797870636, -0.00043085217475891113, -0.0004132315516471863, -0.0003956109285354614, -0.00037799030542373657, -0.0003603696823120117, -0.00034274905920028687, -0.000325128436088562, -0.00030750781297683716, -0.0002898871898651123, -0.00027226656675338745, -0.0002546459436416626, -0.00023702532052993774, -0.0002194046974182129, -0.00020178407430648804, -0.00018416345119476318, -0.00016654282808303833, -0.00014892220497131348, -0.00013130158185958862, -0.00011368095874786377, -9.606033563613892e-05, -7.843971252441406e-05, -6.081908941268921e-05, -4.3198466300964355e-05, -2.5577843189239502e-05, -7.957220077514648e-06, 9.663403034210205e-06, 2.728402614593506e-05, 4.490464925765991e-05, 6.252527236938477e-05, 8.014589548110962e-05, 9.776651859283447e-05, 0.00011538714170455933, 0.00013300776481628418, 0.00015062838792800903, 0.0001682490110397339, 0.00018586963415145874, 0.0002034902572631836, 0.00022111088037490845, 0.0002387315034866333, 0.00025635212659835815, 0.000273972749710083, 0.00029159337282180786, 0.0003092139959335327, 0.00032683461904525757, 0.0003444552421569824, 0.0003620758652687073, 0.00037969648838043213, 0.000397317111492157, 0.00041493773460388184, 0.0004325583577156067, 0.00045017898082733154, 0.0004677996039390564, 0.00048542022705078125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 5.0, 4.0, 5.0, 7.0, 9.0, 11.0, 13.0, 18.0, 31.0, 51.0, 63.0, 92.0, 143.0, 266.0, 476.0, 882.0, 1858.0, 4878.0, 18759.0, 146596.0, 735548.0, 114552.0, 16084.0, 4366.0, 1741.0, 858.0, 498.0, 257.0, 150.0, 102.0, 58.0, 48.0, 42.0, 16.0, 12.0, 10.0, 13.0, 8.0, 11.0, 6.0, 3.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.298828125, -2.2301025390625, -2.161376953125, -2.0926513671875, -2.02392578125, -1.9552001953125, -1.886474609375, -1.8177490234375, -1.7490234375, -1.6802978515625, -1.611572265625, -1.5428466796875, -1.47412109375, -1.4053955078125, -1.336669921875, -1.2679443359375, -1.19921875, -1.1304931640625, -1.061767578125, -0.9930419921875, -0.92431640625, -0.8555908203125, -0.786865234375, -0.7181396484375, -0.6494140625, -0.5806884765625, -0.511962890625, -0.4432373046875, -0.37451171875, -0.3057861328125, -0.237060546875, -0.1683349609375, -0.099609375, -0.0308837890625, 0.037841796875, 0.1065673828125, 0.17529296875, 0.2440185546875, 0.312744140625, 0.3814697265625, 0.4501953125, 0.5189208984375, 0.587646484375, 0.6563720703125, 0.72509765625, 0.7938232421875, 0.862548828125, 0.9312744140625, 1.0, 1.0687255859375, 1.137451171875, 1.2061767578125, 1.27490234375, 1.3436279296875, 1.412353515625, 1.4810791015625, 1.5498046875, 1.6185302734375, 1.687255859375, 1.7559814453125, 1.82470703125, 1.8934326171875, 1.962158203125, 2.0308837890625, 2.099609375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 5.0, 7.0, 14.0, 13.0, 16.0, 25.0, 23.0, 43.0, 41.0, 74.0, 63.0, 69.0, 78.0, 85.0, 85.0, 59.0, 57.0, 50.0, 39.0, 35.0, 33.0, 27.0, 12.0, 15.0, 7.0, 5.0, 5.0, 4.0, 1.0, 2.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.890625, -2.8125, -2.734375, -2.65625, -2.578125, -2.5, -2.421875, -2.34375, -2.265625, -2.1875, -2.109375, -2.03125, -1.953125, -1.875, -1.796875, -1.71875, -1.640625, -1.5625, -1.484375, -1.40625, -1.328125, -1.25, -1.171875, -1.09375, -1.015625, -0.9375, -0.859375, -0.78125, -0.703125, -0.625, -0.546875, -0.46875, -0.390625, -0.3125, -0.234375, -0.15625, -0.078125, 0.0, 0.078125, 0.15625, 0.234375, 0.3125, 0.390625, 0.46875, 0.546875, 0.625, 0.703125, 0.78125, 0.859375, 0.9375, 1.015625, 1.09375, 1.171875, 1.25, 1.328125, 1.40625, 1.484375, 1.5625, 1.640625, 1.71875, 1.796875, 1.875, 1.953125, 2.03125, 2.109375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 2.0, 10.0, 14.0, 32.0, 68.0, 200.0, 315.0, 230.0, 79.0, 30.0, 12.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.82553100585938, -117.14591217041016, -114.4662857055664, -111.78666687011719, -109.10704040527344, -106.42742156982422, -103.747802734375, -101.06817626953125, -98.38855743408203, -95.70893859863281, -93.02931213378906, -90.34969329833984, -87.67007446289062, -84.99044799804688, -82.31082916259766, -79.63121032714844, -76.95158386230469, -74.27196502685547, -71.59233856201172, -68.9127197265625, -66.23309326171875, -63.55347442626953, -60.87385559082031, -58.19423294067383, -55.514610290527344, -52.83498764038086, -50.155364990234375, -47.475746154785156, -44.79612350463867, -42.11650085449219, -39.43688201904297, -36.757259368896484, -34.07763671875, -31.398014068603516, -28.718393325805664, -26.038772583007812, -23.359149932861328, -20.679527282714844, -17.999906539916992, -15.32028579711914, -12.640663146972656, -9.961041450500488, -7.28141975402832, -4.601798057556152, -1.9221763610839844, 0.7574453353881836, 3.4370670318603516, 6.116687774658203, 8.796310424804688, 11.475932121276855, 14.155553817749023, 16.835174560546875, 19.51479721069336, 22.194419860839844, 24.874040603637695, 27.553661346435547, 30.23328399658203, 32.912906646728516, 35.592529296875, 38.27214813232422, 40.9517707824707, 43.63139343261719, 46.311012268066406, 48.99063491821289, 51.670257568359375]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 9.0, 10.0, 19.0, 11.0, 16.0, 27.0, 27.0, 38.0, 35.0, 52.0, 58.0, 56.0, 88.0, 91.0, 82.0, 75.0, 65.0, 41.0, 36.0, 41.0, 27.0, 21.0, 20.0, 18.0, 9.0, 7.0, 7.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-64.48323059082031, -62.764495849609375, -61.04575729370117, -59.32701873779297, -57.60828399658203, -55.889549255371094, -54.17081069946289, -52.45207214355469, -50.73333740234375, -49.01460266113281, -47.29586410522461, -45.577125549316406, -43.85839080810547, -42.13965606689453, -40.42091751098633, -38.702178955078125, -36.98344421386719, -35.26470947265625, -33.54597091674805, -31.827234268188477, -30.108497619628906, -28.389760971069336, -26.671024322509766, -24.952287673950195, -23.233551025390625, -21.514814376831055, -19.796077728271484, -18.077341079711914, -16.358604431152344, -14.639867782592773, -12.921131134033203, -11.202394485473633, -9.483657836914062, -7.764921188354492, -6.046184539794922, -4.327447891235352, -2.6087112426757812, -0.8899745941162109, 0.8287620544433594, 2.5474987030029297, 4.2662353515625, 5.98497200012207, 7.703708648681641, 9.422445297241211, 11.141181945800781, 12.859918594360352, 14.578655242919922, 16.297391891479492, 18.016128540039062, 19.734865188598633, 21.453601837158203, 23.172338485717773, 24.891075134277344, 26.609811782836914, 28.328548431396484, 30.047285079956055, 31.766021728515625, 33.48475646972656, 35.203495025634766, 36.92223358154297, 38.640968322753906, 40.359703063964844, 42.07844161987305, 43.79718017578125, 45.51591491699219]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 6.0, 5.0, 5.0, 5.0, 7.0, 10.0, 20.0, 13.0, 21.0, 20.0, 43.0, 49.0, 61.0, 95.0, 199.0, 355.0, 860.0, 2698.0, 14322.0, 402824.0, 3723715.0, 39249.0, 6621.0, 1888.0, 662.0, 237.0, 99.0, 63.0, 37.0, 20.0, 14.0, 18.0, 15.0, 7.0, 3.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.5625, -7.33477783203125, -7.1070556640625, -6.87933349609375, -6.651611328125, -6.42388916015625, -6.1961669921875, -5.96844482421875, -5.74072265625, -5.51300048828125, -5.2852783203125, -5.05755615234375, -4.829833984375, -4.60211181640625, -4.3743896484375, -4.14666748046875, -3.9189453125, -3.69122314453125, -3.4635009765625, -3.23577880859375, -3.008056640625, -2.78033447265625, -2.5526123046875, -2.32489013671875, -2.09716796875, -1.86944580078125, -1.6417236328125, -1.41400146484375, -1.186279296875, -0.95855712890625, -0.7308349609375, -0.50311279296875, -0.275390625, -0.04766845703125, 0.1800537109375, 0.40777587890625, 0.635498046875, 0.86322021484375, 1.0909423828125, 1.31866455078125, 1.54638671875, 1.77410888671875, 2.0018310546875, 2.22955322265625, 2.457275390625, 2.68499755859375, 2.9127197265625, 3.14044189453125, 3.3681640625, 3.59588623046875, 3.8236083984375, 4.05133056640625, 4.279052734375, 4.50677490234375, 4.7344970703125, 4.96221923828125, 5.18994140625, 5.41766357421875, 5.6453857421875, 5.87310791015625, 6.100830078125, 6.32855224609375, 6.5562744140625, 6.78399658203125, 7.01171875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 18.0, 32.0, 69.0, 120.0, 152.0, 172.0, 190.0, 118.0, 68.0, 44.0, 13.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-11.1640625, -10.93389892578125, -10.7037353515625, -10.47357177734375, -10.243408203125, -10.01324462890625, -9.7830810546875, -9.55291748046875, -9.32275390625, -9.09259033203125, -8.8624267578125, -8.63226318359375, -8.402099609375, -8.17193603515625, -7.9417724609375, -7.71160888671875, -7.4814453125, -7.25128173828125, -7.0211181640625, -6.79095458984375, -6.560791015625, -6.33062744140625, -6.1004638671875, -5.87030029296875, -5.64013671875, -5.40997314453125, -5.1798095703125, -4.94964599609375, -4.719482421875, -4.48931884765625, -4.2591552734375, -4.02899169921875, -3.798828125, -3.56866455078125, -3.3385009765625, -3.10833740234375, -2.878173828125, -2.64801025390625, -2.4178466796875, -2.18768310546875, -1.95751953125, -1.72735595703125, -1.4971923828125, -1.26702880859375, -1.036865234375, -0.80670166015625, -0.5765380859375, -0.34637451171875, -0.1162109375, 0.11395263671875, 0.3441162109375, 0.57427978515625, 0.804443359375, 1.03460693359375, 1.2647705078125, 1.49493408203125, 1.72509765625, 1.95526123046875, 2.1854248046875, 2.41558837890625, 2.645751953125, 2.87591552734375, 3.1060791015625, 3.33624267578125, 3.56640625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 8.0, 18.0, 18.0, 33.0, 61.0, 96.0, 139.0, 303.0, 592.0, 1609.0, 4861.0, 16354.0, 81639.0, 3271251.0, 756643.0, 45196.0, 10653.0, 2966.0, 995.0, 430.0, 176.0, 101.0, 59.0, 36.0, 19.0, 4.0, 8.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.6875, -7.508056640625, -7.32861328125, -7.149169921875, -6.9697265625, -6.790283203125, -6.61083984375, -6.431396484375, -6.251953125, -6.072509765625, -5.89306640625, -5.713623046875, -5.5341796875, -5.354736328125, -5.17529296875, -4.995849609375, -4.81640625, -4.636962890625, -4.45751953125, -4.278076171875, -4.0986328125, -3.919189453125, -3.73974609375, -3.560302734375, -3.380859375, -3.201416015625, -3.02197265625, -2.842529296875, -2.6630859375, -2.483642578125, -2.30419921875, -2.124755859375, -1.9453125, -1.765869140625, -1.58642578125, -1.406982421875, -1.2275390625, -1.048095703125, -0.86865234375, -0.689208984375, -0.509765625, -0.330322265625, -0.15087890625, 0.028564453125, 0.2080078125, 0.387451171875, 0.56689453125, 0.746337890625, 0.92578125, 1.105224609375, 1.28466796875, 1.464111328125, 1.6435546875, 1.822998046875, 2.00244140625, 2.181884765625, 2.361328125, 2.540771484375, 2.72021484375, 2.899658203125, 3.0791015625, 3.258544921875, 3.43798828125, 3.617431640625, 3.796875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 7.0, 3.0, 6.0, 11.0, 7.0, 6.0, 11.0, 18.0, 17.0, 31.0, 47.0, 71.0, 128.0, 303.0, 684.0, 1133.0, 764.0, 335.0, 170.0, 112.0, 54.0, 33.0, 31.0, 17.0, 11.0, 12.0, 14.0, 6.0, 4.0, 5.0, 3.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-5.76171875, -5.608642578125, -5.45556640625, -5.302490234375, -5.1494140625, -4.996337890625, -4.84326171875, -4.690185546875, -4.537109375, -4.384033203125, -4.23095703125, -4.077880859375, -3.9248046875, -3.771728515625, -3.61865234375, -3.465576171875, -3.3125, -3.159423828125, -3.00634765625, -2.853271484375, -2.7001953125, -2.547119140625, -2.39404296875, -2.240966796875, -2.087890625, -1.934814453125, -1.78173828125, -1.628662109375, -1.4755859375, -1.322509765625, -1.16943359375, -1.016357421875, -0.86328125, -0.710205078125, -0.55712890625, -0.404052734375, -0.2509765625, -0.097900390625, 0.05517578125, 0.208251953125, 0.361328125, 0.514404296875, 0.66748046875, 0.820556640625, 0.9736328125, 1.126708984375, 1.27978515625, 1.432861328125, 1.5859375, 1.739013671875, 1.89208984375, 2.045166015625, 2.1982421875, 2.351318359375, 2.50439453125, 2.657470703125, 2.810546875, 2.963623046875, 3.11669921875, 3.269775390625, 3.4228515625, 3.575927734375, 3.72900390625, 3.882080078125, 4.03515625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 6.0, 14.0, 43.0, 116.0, 282.0, 288.0, 161.0, 47.0, 23.0, 10.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.48533630371094, -64.64071655273438, -62.79609298706055, -60.951473236083984, -59.106849670410156, -57.262229919433594, -55.41761016845703, -53.5729866027832, -51.72836685180664, -49.88374710083008, -48.03912353515625, -46.19450378417969, -44.34988021850586, -42.5052604675293, -40.66063690185547, -38.816017150878906, -36.971397399902344, -35.12677764892578, -33.28215408325195, -31.43753433227539, -29.592912673950195, -27.748291015625, -25.903669357299805, -24.05904769897461, -22.21442413330078, -20.369802474975586, -18.52518081665039, -16.680561065673828, -14.835939407348633, -12.991317749023438, -11.146696090698242, -9.302075386047363, -7.457454681396484, -5.612833499908447, -3.768212080001831, -1.9235906600952148, -0.07896947860717773, 1.7656517028808594, 3.6102733612060547, 5.454894065856934, 7.299515724182129, 9.144137382507324, 10.988758087158203, 12.833379745483398, 14.678001403808594, 16.522621154785156, 18.367244720458984, 20.211864471435547, 22.056486129760742, 23.901107788085938, 25.745729446411133, 27.590351104736328, 29.43497085571289, 31.279592514038086, 33.12421417236328, 34.968833923339844, 36.81345748901367, 38.658077239990234, 40.50270080566406, 42.347320556640625, 44.19194412231445, 46.036563873291016, 47.881187438964844, 49.725807189941406, 51.57042694091797]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 3.0, 8.0, 3.0, 5.0, 11.0, 18.0, 25.0, 47.0, 55.0, 63.0, 108.0, 78.0, 95.0, 92.0, 79.0, 73.0, 60.0, 48.0, 39.0, 30.0, 17.0, 21.0, 11.0, 7.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.922029495239258, -23.755842208862305, -22.58965492248535, -21.4234676361084, -20.257280349731445, -19.091093063354492, -17.92490577697754, -16.758718490600586, -15.592531204223633, -14.42634391784668, -13.260156631469727, -12.093969345092773, -10.92778205871582, -9.761594772338867, -8.595407485961914, -7.429220199584961, -6.263032913208008, -5.096845626831055, -3.9306583404541016, -2.7644710540771484, -1.5982837677001953, -0.4320964813232422, 0.7340908050537109, 1.900278091430664, 3.066465377807617, 4.23265266418457, 5.398839950561523, 6.565027236938477, 7.73121452331543, 8.897401809692383, 10.063589096069336, 11.229776382446289, 12.39596176147461, 13.562149047851562, 14.728336334228516, 15.894523620605469, 17.060710906982422, 18.226898193359375, 19.393085479736328, 20.55927276611328, 21.725460052490234, 22.891647338867188, 24.05783462524414, 25.224021911621094, 26.390209197998047, 27.556396484375, 28.722583770751953, 29.888771057128906, 31.05495834350586, 32.22114562988281, 33.387332916259766, 34.55352020263672, 35.71970748901367, 36.885894775390625, 38.05208206176758, 39.21826934814453, 40.384456634521484, 41.55064392089844, 42.71683120727539, 43.883018493652344, 45.0492057800293, 46.21539306640625, 47.3815803527832, 48.547767639160156, 49.71395492553711]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 4.0, 6.0, 3.0, 1.0, 7.0, 10.0, 6.0, 12.0, 17.0, 21.0, 43.0, 61.0, 87.0, 143.0, 259.0, 417.0, 827.0, 1530.0, 3186.0, 6971.0, 17007.0, 44838.0, 133563.0, 385122.0, 300367.0, 96488.0, 33360.0, 12976.0, 5736.0, 2553.0, 1259.0, 645.0, 400.0, 217.0, 156.0, 75.0, 60.0, 38.0, 20.0, 20.0, 12.0, 15.0, 5.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.06640625, -2.956329345703125, -2.84625244140625, -2.736175537109375, -2.6260986328125, -2.516021728515625, -2.40594482421875, -2.295867919921875, -2.185791015625, -2.075714111328125, -1.96563720703125, -1.855560302734375, -1.7454833984375, -1.635406494140625, -1.52532958984375, -1.415252685546875, -1.30517578125, -1.195098876953125, -1.08502197265625, -0.974945068359375, -0.8648681640625, -0.754791259765625, -0.64471435546875, -0.534637451171875, -0.424560546875, -0.314483642578125, -0.20440673828125, -0.094329833984375, 0.0157470703125, 0.125823974609375, 0.23590087890625, 0.345977783203125, 0.4560546875, 0.566131591796875, 0.67620849609375, 0.786285400390625, 0.8963623046875, 1.006439208984375, 1.11651611328125, 1.226593017578125, 1.336669921875, 1.446746826171875, 1.55682373046875, 1.666900634765625, 1.7769775390625, 1.887054443359375, 1.99713134765625, 2.107208251953125, 2.21728515625, 2.327362060546875, 2.43743896484375, 2.547515869140625, 2.6575927734375, 2.767669677734375, 2.87774658203125, 2.987823486328125, 3.097900390625, 3.207977294921875, 3.31805419921875, 3.428131103515625, 3.5382080078125, 3.648284912109375, 3.75836181640625, 3.868438720703125, 3.978515625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 5.0, 6.0, 7.0, 12.0, 16.0, 19.0, 37.0, 39.0, 58.0, 89.0, 81.0, 76.0, 99.0, 80.0, 74.0, 81.0, 61.0, 49.0, 31.0, 28.0, 25.0, 10.0, 10.0, 3.0, 8.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.16015625, -4.052215576171875, -3.94427490234375, -3.836334228515625, -3.7283935546875, -3.620452880859375, -3.51251220703125, -3.404571533203125, -3.296630859375, -3.188690185546875, -3.08074951171875, -2.972808837890625, -2.8648681640625, -2.756927490234375, -2.64898681640625, -2.541046142578125, -2.43310546875, -2.325164794921875, -2.21722412109375, -2.109283447265625, -2.0013427734375, -1.893402099609375, -1.78546142578125, -1.677520751953125, -1.569580078125, -1.461639404296875, -1.35369873046875, -1.245758056640625, -1.1378173828125, -1.029876708984375, -0.92193603515625, -0.813995361328125, -0.7060546875, -0.598114013671875, -0.49017333984375, -0.382232666015625, -0.2742919921875, -0.166351318359375, -0.05841064453125, 0.049530029296875, 0.157470703125, 0.265411376953125, 0.37335205078125, 0.481292724609375, 0.5892333984375, 0.697174072265625, 0.80511474609375, 0.913055419921875, 1.02099609375, 1.128936767578125, 1.23687744140625, 1.344818115234375, 1.4527587890625, 1.560699462890625, 1.66864013671875, 1.776580810546875, 1.884521484375, 1.992462158203125, 2.10040283203125, 2.208343505859375, 2.3162841796875, 2.424224853515625, 2.53216552734375, 2.640106201171875, 2.748046875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 7.0, 1.0, 5.0, 2.0, 9.0, 12.0, 8.0, 19.0, 35.0, 53.0, 68.0, 106.0, 225.0, 413.0, 854.0, 2353.0, 11623.0, 172420.0, 803064.0, 48757.0, 5776.0, 1391.0, 629.0, 290.0, 154.0, 91.0, 54.0, 40.0, 35.0, 12.0, 11.0, 10.0, 10.0, 2.0, 7.0, 1.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.296875, -7.992919921875, -7.68896484375, -7.385009765625, -7.0810546875, -6.777099609375, -6.47314453125, -6.169189453125, -5.865234375, -5.561279296875, -5.25732421875, -4.953369140625, -4.6494140625, -4.345458984375, -4.04150390625, -3.737548828125, -3.43359375, -3.129638671875, -2.82568359375, -2.521728515625, -2.2177734375, -1.913818359375, -1.60986328125, -1.305908203125, -1.001953125, -0.697998046875, -0.39404296875, -0.090087890625, 0.2138671875, 0.517822265625, 0.82177734375, 1.125732421875, 1.4296875, 1.733642578125, 2.03759765625, 2.341552734375, 2.6455078125, 2.949462890625, 3.25341796875, 3.557373046875, 3.861328125, 4.165283203125, 4.46923828125, 4.773193359375, 5.0771484375, 5.381103515625, 5.68505859375, 5.989013671875, 6.29296875, 6.596923828125, 6.90087890625, 7.204833984375, 7.5087890625, 7.812744140625, 8.11669921875, 8.420654296875, 8.724609375, 9.028564453125, 9.33251953125, 9.636474609375, 9.9404296875, 10.244384765625, 10.54833984375, 10.852294921875, 11.15625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 3.0, 4.0, 9.0, 9.0, 13.0, 13.0, 14.0, 30.0, 24.0, 31.0, 54.0, 43.0, 61.0, 58.0, 74.0, 71.0, 71.0, 62.0, 48.0, 63.0, 54.0, 55.0, 34.0, 21.0, 19.0, 16.0, 12.0, 8.0, 8.0, 4.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.859375, -9.5184326171875, -9.177490234375, -8.8365478515625, -8.49560546875, -8.1546630859375, -7.813720703125, -7.4727783203125, -7.1318359375, -6.7908935546875, -6.449951171875, -6.1090087890625, -5.76806640625, -5.4271240234375, -5.086181640625, -4.7452392578125, -4.404296875, -4.0633544921875, -3.722412109375, -3.3814697265625, -3.04052734375, -2.6995849609375, -2.358642578125, -2.0177001953125, -1.6767578125, -1.3358154296875, -0.994873046875, -0.6539306640625, -0.31298828125, 0.0279541015625, 0.368896484375, 0.7098388671875, 1.05078125, 1.3917236328125, 1.732666015625, 2.0736083984375, 2.41455078125, 2.7554931640625, 3.096435546875, 3.4373779296875, 3.7783203125, 4.1192626953125, 4.460205078125, 4.8011474609375, 5.14208984375, 5.4830322265625, 5.823974609375, 6.1649169921875, 6.505859375, 6.8468017578125, 7.187744140625, 7.5286865234375, 7.86962890625, 8.2105712890625, 8.551513671875, 8.8924560546875, 9.2333984375, 9.5743408203125, 9.915283203125, 10.2562255859375, 10.59716796875, 10.9381103515625, 11.279052734375, 11.6199951171875, 11.9609375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 3.0, 7.0, 10.0, 8.0, 18.0, 43.0, 62.0, 159.0, 497.0, 2727.0, 49786.0, 944777.0, 46973.0, 2667.0, 498.0, 162.0, 73.0, 34.0, 17.0, 10.0, 6.0, 9.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.078125, -3.93499755859375, -3.7918701171875, -3.64874267578125, -3.505615234375, -3.36248779296875, -3.2193603515625, -3.07623291015625, -2.93310546875, -2.78997802734375, -2.6468505859375, -2.50372314453125, -2.360595703125, -2.21746826171875, -2.0743408203125, -1.93121337890625, -1.7880859375, -1.64495849609375, -1.5018310546875, -1.35870361328125, -1.215576171875, -1.07244873046875, -0.9293212890625, -0.78619384765625, -0.64306640625, -0.49993896484375, -0.3568115234375, -0.21368408203125, -0.070556640625, 0.07257080078125, 0.2156982421875, 0.35882568359375, 0.501953125, 0.64508056640625, 0.7882080078125, 0.93133544921875, 1.074462890625, 1.21759033203125, 1.3607177734375, 1.50384521484375, 1.64697265625, 1.79010009765625, 1.9332275390625, 2.07635498046875, 2.219482421875, 2.36260986328125, 2.5057373046875, 2.64886474609375, 2.7919921875, 2.93511962890625, 3.0782470703125, 3.22137451171875, 3.364501953125, 3.50762939453125, 3.6507568359375, 3.79388427734375, 3.93701171875, 4.08013916015625, 4.2232666015625, 4.36639404296875, 4.509521484375, 4.65264892578125, 4.7957763671875, 4.93890380859375, 5.08203125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 3.0, 4.0, 6.0, 6.0, 6.0, 17.0, 21.0, 44.0, 66.0, 86.0, 116.0, 151.0, 134.0, 106.0, 69.0, 70.0, 39.0, 28.0, 13.0, 10.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005373954772949219, -0.0005175024271011353, -0.0004976093769073486, -0.000477716326713562, -0.0004578232765197754, -0.00043793022632598877, -0.00041803717613220215, -0.00039814412593841553, -0.0003782510757446289, -0.0003583580255508423, -0.00033846497535705566, -0.00031857192516326904, -0.0002986788749694824, -0.0002787858247756958, -0.0002588927745819092, -0.00023899972438812256, -0.00021910667419433594, -0.00019921362400054932, -0.0001793205738067627, -0.00015942752361297607, -0.00013953447341918945, -0.00011964142322540283, -9.974837303161621e-05, -7.985532283782959e-05, -5.996227264404297e-05, -4.006922245025635e-05, -2.0176172256469727e-05, -2.8312206268310547e-07, 1.9609928131103516e-05, 3.950297832489014e-05, 5.939602851867676e-05, 7.928907871246338e-05, 9.918212890625e-05, 0.00011907517910003662, 0.00013896822929382324, 0.00015886127948760986, 0.00017875432968139648, 0.0001986473798751831, 0.00021854043006896973, 0.00023843348026275635, 0.00025832653045654297, 0.0002782195806503296, 0.0002981126308441162, 0.00031800568103790283, 0.00033789873123168945, 0.0003577917814254761, 0.0003776848316192627, 0.0003975778818130493, 0.00041747093200683594, 0.00043736398220062256, 0.0004572570323944092, 0.0004771500825881958, 0.0004970431327819824, 0.000516936182975769, 0.0005368292331695557, 0.0005567222833633423, 0.0005766153335571289, 0.0005965083837509155, 0.0006164014339447021, 0.0006362944841384888, 0.0006561875343322754, 0.000676080584526062, 0.0006959736347198486, 0.0007158666849136353, 0.0007357597351074219]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 12.0, 10.0, 5.0, 22.0, 31.0, 45.0, 75.0, 143.0, 273.0, 604.0, 1720.0, 7364.0, 78773.0, 809375.0, 136373.0, 10222.0, 2162.0, 690.0, 305.0, 141.0, 79.0, 41.0, 30.0, 24.0, 7.0, 11.0, 9.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.17578125, -2.09075927734375, -2.0057373046875, -1.92071533203125, -1.835693359375, -1.75067138671875, -1.6656494140625, -1.58062744140625, -1.49560546875, -1.41058349609375, -1.3255615234375, -1.24053955078125, -1.155517578125, -1.07049560546875, -0.9854736328125, -0.90045166015625, -0.8154296875, -0.73040771484375, -0.6453857421875, -0.56036376953125, -0.475341796875, -0.39031982421875, -0.3052978515625, -0.22027587890625, -0.13525390625, -0.05023193359375, 0.0347900390625, 0.11981201171875, 0.204833984375, 0.28985595703125, 0.3748779296875, 0.45989990234375, 0.544921875, 0.62994384765625, 0.7149658203125, 0.79998779296875, 0.885009765625, 0.97003173828125, 1.0550537109375, 1.14007568359375, 1.22509765625, 1.31011962890625, 1.3951416015625, 1.48016357421875, 1.565185546875, 1.65020751953125, 1.7352294921875, 1.82025146484375, 1.9052734375, 1.99029541015625, 2.0753173828125, 2.16033935546875, 2.245361328125, 2.33038330078125, 2.4154052734375, 2.50042724609375, 2.58544921875, 2.67047119140625, 2.7554931640625, 2.84051513671875, 2.925537109375, 3.01055908203125, 3.0955810546875, 3.18060302734375, 3.265625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 7.0, 7.0, 18.0, 13.0, 34.0, 31.0, 40.0, 52.0, 51.0, 82.0, 81.0, 88.0, 80.0, 72.0, 76.0, 58.0, 56.0, 41.0, 36.0, 22.0, 11.0, 13.0, 10.0, 7.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 1.0], "bins": [-2.849609375, -2.7817840576171875, -2.713958740234375, -2.6461334228515625, -2.57830810546875, -2.5104827880859375, -2.442657470703125, -2.3748321533203125, -2.3070068359375, -2.2391815185546875, -2.171356201171875, -2.1035308837890625, -2.03570556640625, -1.9678802490234375, -1.900054931640625, -1.8322296142578125, -1.764404296875, -1.6965789794921875, -1.628753662109375, -1.5609283447265625, -1.49310302734375, -1.4252777099609375, -1.357452392578125, -1.2896270751953125, -1.2218017578125, -1.1539764404296875, -1.086151123046875, -1.0183258056640625, -0.95050048828125, -0.8826751708984375, -0.814849853515625, -0.7470245361328125, -0.67919921875, -0.6113739013671875, -0.543548583984375, -0.4757232666015625, -0.40789794921875, -0.3400726318359375, -0.272247314453125, -0.2044219970703125, -0.1365966796875, -0.0687713623046875, -0.000946044921875, 0.0668792724609375, 0.13470458984375, 0.2025299072265625, 0.270355224609375, 0.3381805419921875, 0.406005859375, 0.4738311767578125, 0.541656494140625, 0.6094818115234375, 0.67730712890625, 0.7451324462890625, 0.812957763671875, 0.8807830810546875, 0.9486083984375, 1.0164337158203125, 1.084259033203125, 1.1520843505859375, 1.21990966796875, 1.2877349853515625, 1.355560302734375, 1.4233856201171875, 1.4912109375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 2.0, 2.0, 4.0, 6.0, 10.0, 39.0, 83.0, 187.0, 281.0, 209.0, 107.0, 44.0, 15.0, 9.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.718894958496094, -30.642587661743164, -28.566280364990234, -26.489974975585938, -24.413667678833008, -22.337360382080078, -20.26105499267578, -18.18474769592285, -16.108440399169922, -14.032133102416992, -11.955826759338379, -9.879520416259766, -7.803213119506836, -5.726905822753906, -3.650599479675293, -1.5742931365966797, 0.50201416015625, 2.5783209800720215, 4.654627799987793, 6.7309346199035645, 8.807241439819336, 10.883548736572266, 12.959855079650879, 15.036161422729492, 17.112468719482422, 19.18877601623535, 21.26508331298828, 23.341388702392578, 25.417695999145508, 27.494003295898438, 29.570308685302734, 31.646615982055664, 33.72291564941406, 35.79922103881836, 37.87553024291992, 39.95183563232422, 42.02814483642578, 44.10445022583008, 46.180755615234375, 48.25706481933594, 50.333370208740234, 52.40967559814453, 54.485984802246094, 56.56229019165039, 58.63859558105469, 60.71490478515625, 62.79121017456055, 64.86751556396484, 66.9438247680664, 69.02013397216797, 71.096435546875, 73.17274475097656, 75.24905395507812, 77.32536315917969, 79.40166473388672, 81.47797393798828, 83.55427551269531, 85.63058471679688, 87.7068862915039, 89.78319549560547, 91.85950469970703, 93.93580627441406, 96.01211547851562, 98.08842468261719, 100.16473388671875]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 7.0, 10.0, 8.0, 10.0, 11.0, 13.0, 12.0, 19.0, 25.0, 21.0, 21.0, 35.0, 43.0, 37.0, 49.0, 53.0, 51.0, 67.0, 63.0, 66.0, 56.0, 36.0, 53.0, 28.0, 34.0, 38.0, 32.0, 17.0, 19.0, 22.0, 10.0, 10.0, 7.0, 4.0, 7.0, 2.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-42.638832092285156, -41.41974639892578, -40.20066452026367, -38.9815788269043, -37.76249694824219, -36.54341125488281, -35.3243293762207, -34.10524368286133, -32.88616180419922, -31.667078018188477, -30.447994232177734, -29.228910446166992, -28.00982666015625, -26.790740966796875, -25.571657180786133, -24.35257339477539, -23.133487701416016, -21.914403915405273, -20.69532012939453, -19.47623634338379, -18.257152557373047, -17.038066864013672, -15.81898307800293, -14.599899291992188, -13.380815505981445, -12.161731719970703, -10.942647933959961, -9.723563194274902, -8.50447940826416, -7.285395622253418, -6.066311359405518, -4.847227096557617, -3.6281471252441406, -2.4090631008148193, -1.189979076385498, 0.029104948043823242, 1.2481889724731445, 2.4672727584838867, 3.686357021331787, 4.9054412841796875, 6.12452507019043, 7.343608856201172, 8.562692642211914, 9.781777381896973, 11.000861167907715, 12.219944953918457, 13.439029693603516, 14.658113479614258, 15.877197265625, 17.096281051635742, 18.315364837646484, 19.534448623657227, 20.75353240966797, 21.972618103027344, 23.191701889038086, 24.410785675048828, 25.62986946105957, 26.848953247070312, 28.068037033081055, 29.287120819091797, 30.506206512451172, 31.72528839111328, 32.944374084472656, 34.16345977783203, 35.38254165649414]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 8.0, 9.0, 11.0, 26.0, 32.0, 47.0, 75.0, 81.0, 137.0, 236.0, 360.0, 705.0, 1456.0, 3344.0, 9695.0, 36552.0, 255176.0, 2583755.0, 1153484.0, 113190.0, 23603.0, 7110.0, 2700.0, 1176.0, 558.0, 315.0, 173.0, 101.0, 62.0, 42.0, 24.0, 16.0, 7.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0], "bins": [-3.626953125, -3.540191650390625, -3.45343017578125, -3.366668701171875, -3.2799072265625, -3.193145751953125, -3.10638427734375, -3.019622802734375, -2.932861328125, -2.846099853515625, -2.75933837890625, -2.672576904296875, -2.5858154296875, -2.499053955078125, -2.41229248046875, -2.325531005859375, -2.23876953125, -2.152008056640625, -2.06524658203125, -1.978485107421875, -1.8917236328125, -1.804962158203125, -1.71820068359375, -1.631439208984375, -1.544677734375, -1.457916259765625, -1.37115478515625, -1.284393310546875, -1.1976318359375, -1.110870361328125, -1.02410888671875, -0.937347412109375, -0.8505859375, -0.763824462890625, -0.67706298828125, -0.590301513671875, -0.5035400390625, -0.416778564453125, -0.33001708984375, -0.243255615234375, -0.156494140625, -0.069732666015625, 0.01702880859375, 0.103790283203125, 0.1905517578125, 0.277313232421875, 0.36407470703125, 0.450836181640625, 0.53759765625, 0.624359130859375, 0.71112060546875, 0.797882080078125, 0.8846435546875, 0.971405029296875, 1.05816650390625, 1.144927978515625, 1.231689453125, 1.318450927734375, 1.40521240234375, 1.491973876953125, 1.5787353515625, 1.665496826171875, 1.75225830078125, 1.839019775390625, 1.92578125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 4.0, 1.0, 4.0, 7.0, 6.0, 13.0, 13.0, 31.0, 29.0, 17.0, 29.0, 54.0, 59.0, 65.0, 76.0, 71.0, 83.0, 65.0, 68.0, 69.0, 43.0, 53.0, 31.0, 26.0, 27.0, 20.0, 11.0, 10.0, 10.0, 6.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-3.51171875, -3.4322357177734375, -3.352752685546875, -3.2732696533203125, -3.19378662109375, -3.1143035888671875, -3.034820556640625, -2.9553375244140625, -2.8758544921875, -2.7963714599609375, -2.716888427734375, -2.6374053955078125, -2.55792236328125, -2.4784393310546875, -2.398956298828125, -2.3194732666015625, -2.239990234375, -2.1605072021484375, -2.081024169921875, -2.0015411376953125, -1.92205810546875, -1.8425750732421875, -1.763092041015625, -1.6836090087890625, -1.6041259765625, -1.5246429443359375, -1.445159912109375, -1.3656768798828125, -1.28619384765625, -1.2067108154296875, -1.127227783203125, -1.0477447509765625, -0.96826171875, -0.8887786865234375, -0.809295654296875, -0.7298126220703125, -0.65032958984375, -0.5708465576171875, -0.491363525390625, -0.4118804931640625, -0.3323974609375, -0.2529144287109375, -0.173431396484375, -0.0939483642578125, -0.01446533203125, 0.0650177001953125, 0.144500732421875, 0.2239837646484375, 0.303466796875, 0.3829498291015625, 0.462432861328125, 0.5419158935546875, 0.62139892578125, 0.7008819580078125, 0.780364990234375, 0.8598480224609375, 0.9393310546875, 1.0188140869140625, 1.098297119140625, 1.1777801513671875, 1.25726318359375, 1.3367462158203125, 1.416229248046875, 1.4957122802734375, 1.5751953125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 3.0, 7.0, 10.0, 22.0, 26.0, 40.0, 64.0, 94.0, 174.0, 250.0, 465.0, 856.0, 2015.0, 5923.0, 24517.0, 146115.0, 3099233.0, 826351.0, 67333.0, 14102.0, 3901.0, 1404.0, 595.0, 273.0, 176.0, 98.0, 70.0, 46.0, 33.0, 21.0, 20.0, 12.0, 5.0, 4.0, 3.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.6171875, -4.491729736328125, -4.36627197265625, -4.240814208984375, -4.1153564453125, -3.989898681640625, -3.86444091796875, -3.738983154296875, -3.613525390625, -3.488067626953125, -3.36260986328125, -3.237152099609375, -3.1116943359375, -2.986236572265625, -2.86077880859375, -2.735321044921875, -2.60986328125, -2.484405517578125, -2.35894775390625, -2.233489990234375, -2.1080322265625, -1.982574462890625, -1.85711669921875, -1.731658935546875, -1.606201171875, -1.480743408203125, -1.35528564453125, -1.229827880859375, -1.1043701171875, -0.978912353515625, -0.85345458984375, -0.727996826171875, -0.6025390625, -0.477081298828125, -0.35162353515625, -0.226165771484375, -0.1007080078125, 0.024749755859375, 0.15020751953125, 0.275665283203125, 0.401123046875, 0.526580810546875, 0.65203857421875, 0.777496337890625, 0.9029541015625, 1.028411865234375, 1.15386962890625, 1.279327392578125, 1.40478515625, 1.530242919921875, 1.65570068359375, 1.781158447265625, 1.9066162109375, 2.032073974609375, 2.15753173828125, 2.282989501953125, 2.408447265625, 2.533905029296875, 2.65936279296875, 2.784820556640625, 2.9102783203125, 3.035736083984375, 3.16119384765625, 3.286651611328125, 3.412109375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 8.0, 7.0, 9.0, 21.0, 23.0, 35.0, 47.0, 61.0, 79.0, 128.0, 259.0, 580.0, 1028.0, 803.0, 421.0, 201.0, 106.0, 92.0, 41.0, 29.0, 27.0, 17.0, 13.0, 11.0, 9.0, 5.0, 6.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.18359375, -6.028045654296875, -5.87249755859375, -5.716949462890625, -5.5614013671875, -5.405853271484375, -5.25030517578125, -5.094757080078125, -4.939208984375, -4.783660888671875, -4.62811279296875, -4.472564697265625, -4.3170166015625, -4.161468505859375, -4.00592041015625, -3.850372314453125, -3.69482421875, -3.539276123046875, -3.38372802734375, -3.228179931640625, -3.0726318359375, -2.917083740234375, -2.76153564453125, -2.605987548828125, -2.450439453125, -2.294891357421875, -2.13934326171875, -1.983795166015625, -1.8282470703125, -1.672698974609375, -1.51715087890625, -1.361602783203125, -1.2060546875, -1.050506591796875, -0.89495849609375, -0.739410400390625, -0.5838623046875, -0.428314208984375, -0.27276611328125, -0.117218017578125, 0.038330078125, 0.193878173828125, 0.34942626953125, 0.504974365234375, 0.6605224609375, 0.816070556640625, 0.97161865234375, 1.127166748046875, 1.28271484375, 1.438262939453125, 1.59381103515625, 1.749359130859375, 1.9049072265625, 2.060455322265625, 2.21600341796875, 2.371551513671875, 2.527099609375, 2.682647705078125, 2.83819580078125, 2.993743896484375, 3.1492919921875, 3.304840087890625, 3.46038818359375, 3.615936279296875, 3.771484375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 5.0, 2.0, 24.0, 90.0, 225.0, 295.0, 233.0, 72.0, 25.0, 11.0, 14.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-71.75726318359375, -69.92715454101562, -68.09705352783203, -66.2669448852539, -64.43683624267578, -62.60673522949219, -60.77662658691406, -58.9465217590332, -57.116416931152344, -55.286312103271484, -53.45620346069336, -51.6260986328125, -49.79599380493164, -47.96588897705078, -46.135780334472656, -44.3056755065918, -42.47556686401367, -40.64546203613281, -38.81535339355469, -36.98524856567383, -35.15514373779297, -33.325035095214844, -31.494930267333984, -29.664825439453125, -27.834718704223633, -26.00461196899414, -24.17450714111328, -22.34440040588379, -20.514293670654297, -18.684188842773438, -16.854082107543945, -15.02397632598877, -13.193866729736328, -11.363760948181152, -9.533655166625977, -7.703548431396484, -5.873442649841309, -4.043336868286133, -2.2132301330566406, -0.38312435150146484, 1.446981430053711, 3.277087450027466, 5.107193470001221, 6.937299728393555, 8.76740550994873, 10.597511291503906, 12.427618026733398, 14.257723808288574, 16.08782958984375, 17.917936325073242, 19.7480411529541, 21.578147888183594, 23.408252716064453, 25.238359451293945, 27.068466186523438, 28.898571014404297, 30.72867774963379, 32.55878448486328, 34.38888931274414, 36.218994140625, 38.049102783203125, 39.879207611083984, 41.709312438964844, 43.53942108154297, 45.36952590942383]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 11.0, 7.0, 9.0, 14.0, 16.0, 20.0, 16.0, 29.0, 43.0, 33.0, 35.0, 49.0, 55.0, 61.0, 57.0, 53.0, 48.0, 60.0, 49.0, 45.0, 52.0, 45.0, 35.0, 24.0, 34.0, 17.0, 12.0, 15.0, 13.0, 12.0, 8.0, 5.0, 5.0, 6.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.823684692382812, -16.08842658996582, -15.353168487548828, -14.617911338806152, -13.88265323638916, -13.147395133972168, -12.412137985229492, -11.6768798828125, -10.941621780395508, -10.206363677978516, -9.471105575561523, -8.735848426818848, -8.000590324401855, -7.265332221984863, -6.530074596405029, -5.794816970825195, -5.059558868408203, -4.324300765991211, -3.589043140411377, -2.853785276412964, -2.118527412414551, -1.3832695484161377, -0.6480116844177246, 0.08724594116210938, 0.8225040435791016, 1.5577619075775146, 2.2930197715759277, 3.028277635574341, 3.763535499572754, 4.498793601989746, 5.23405122756958, 5.969308853149414, 6.704566955566406, 7.439825057983398, 8.17508316040039, 8.910340309143066, 9.645598411560059, 10.38085651397705, 11.116113662719727, 11.851371765136719, 12.586629867553711, 13.321887969970703, 14.057146072387695, 14.792403221130371, 15.527661323547363, 16.26291847229004, 16.99817657470703, 17.733434677124023, 18.468692779541016, 19.203950881958008, 19.939208984375, 20.674467086791992, 21.409725189208984, 22.144981384277344, 22.880239486694336, 23.615497589111328, 24.35075569152832, 25.086013793945312, 25.821271896362305, 26.556529998779297, 27.291786193847656, 28.02704429626465, 28.76230239868164, 29.497560501098633, 30.232818603515625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 5.0, 10.0, 17.0, 15.0, 38.0, 55.0, 64.0, 126.0, 178.0, 310.0, 508.0, 905.0, 1418.0, 2596.0, 4410.0, 8115.0, 15049.0, 28337.0, 54099.0, 104352.0, 191618.0, 256878.0, 177281.0, 95467.0, 49564.0, 26126.0, 13755.0, 7443.0, 4122.0, 2314.0, 1266.0, 783.0, 480.0, 308.0, 192.0, 114.0, 79.0, 60.0, 31.0, 28.0, 8.0, 15.0, 11.0, 4.0, 3.0, 2.0, 2.0], "bins": [-2.162109375, -2.1058502197265625, -2.049591064453125, -1.9933319091796875, -1.93707275390625, -1.8808135986328125, -1.824554443359375, -1.7682952880859375, -1.7120361328125, -1.6557769775390625, -1.599517822265625, -1.5432586669921875, -1.48699951171875, -1.4307403564453125, -1.374481201171875, -1.3182220458984375, -1.261962890625, -1.2057037353515625, -1.149444580078125, -1.0931854248046875, -1.03692626953125, -0.9806671142578125, -0.924407958984375, -0.8681488037109375, -0.8118896484375, -0.7556304931640625, -0.699371337890625, -0.6431121826171875, -0.58685302734375, -0.5305938720703125, -0.474334716796875, -0.4180755615234375, -0.36181640625, -0.3055572509765625, -0.249298095703125, -0.1930389404296875, -0.13677978515625, -0.0805206298828125, -0.024261474609375, 0.0319976806640625, 0.0882568359375, 0.1445159912109375, 0.200775146484375, 0.2570343017578125, 0.31329345703125, 0.3695526123046875, 0.425811767578125, 0.4820709228515625, 0.538330078125, 0.5945892333984375, 0.650848388671875, 0.7071075439453125, 0.76336669921875, 0.8196258544921875, 0.875885009765625, 0.9321441650390625, 0.9884033203125, 1.0446624755859375, 1.100921630859375, 1.1571807861328125, 1.21343994140625, 1.2696990966796875, 1.325958251953125, 1.3822174072265625, 1.4384765625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 7.0, 7.0, 4.0, 5.0, 7.0, 7.0, 14.0, 15.0, 18.0, 19.0, 18.0, 32.0, 33.0, 24.0, 34.0, 40.0, 35.0, 39.0, 49.0, 54.0, 52.0, 40.0, 44.0, 39.0, 35.0, 43.0, 40.0, 38.0, 34.0, 28.0, 22.0, 19.0, 23.0, 17.0, 11.0, 10.0, 13.0, 11.0, 5.0, 4.0, 4.0, 4.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6201171875, -1.571014404296875, -1.52191162109375, -1.472808837890625, -1.4237060546875, -1.374603271484375, -1.32550048828125, -1.276397705078125, -1.227294921875, -1.178192138671875, -1.12908935546875, -1.079986572265625, -1.0308837890625, -0.981781005859375, -0.93267822265625, -0.883575439453125, -0.83447265625, -0.785369873046875, -0.73626708984375, -0.687164306640625, -0.6380615234375, -0.588958740234375, -0.53985595703125, -0.490753173828125, -0.441650390625, -0.392547607421875, -0.34344482421875, -0.294342041015625, -0.2452392578125, -0.196136474609375, -0.14703369140625, -0.097930908203125, -0.048828125, 0.000274658203125, 0.04937744140625, 0.098480224609375, 0.1475830078125, 0.196685791015625, 0.24578857421875, 0.294891357421875, 0.343994140625, 0.393096923828125, 0.44219970703125, 0.491302490234375, 0.5404052734375, 0.589508056640625, 0.63861083984375, 0.687713623046875, 0.73681640625, 0.785919189453125, 0.83502197265625, 0.884124755859375, 0.9332275390625, 0.982330322265625, 1.03143310546875, 1.080535888671875, 1.129638671875, 1.178741455078125, 1.22784423828125, 1.276947021484375, 1.3260498046875, 1.375152587890625, 1.42425537109375, 1.473358154296875, 1.5224609375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 1.0, 10.0, 13.0, 6.0, 12.0, 8.0, 24.0, 23.0, 24.0, 38.0, 45.0, 77.0, 89.0, 115.0, 154.0, 209.0, 280.0, 376.0, 555.0, 873.0, 1558.0, 3098.0, 9593.0, 51052.0, 377936.0, 524142.0, 59547.0, 10687.0, 3397.0, 1572.0, 950.0, 606.0, 397.0, 274.0, 195.0, 144.0, 105.0, 78.0, 60.0, 61.0, 47.0, 26.0, 22.0, 14.0, 19.0, 15.0, 10.0, 6.0, 5.0, 7.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.79296875, -4.64337158203125, -4.4937744140625, -4.34417724609375, -4.194580078125, -4.04498291015625, -3.8953857421875, -3.74578857421875, -3.59619140625, -3.44659423828125, -3.2969970703125, -3.14739990234375, -2.997802734375, -2.84820556640625, -2.6986083984375, -2.54901123046875, -2.3994140625, -2.24981689453125, -2.1002197265625, -1.95062255859375, -1.801025390625, -1.65142822265625, -1.5018310546875, -1.35223388671875, -1.20263671875, -1.05303955078125, -0.9034423828125, -0.75384521484375, -0.604248046875, -0.45465087890625, -0.3050537109375, -0.15545654296875, -0.005859375, 0.14373779296875, 0.2933349609375, 0.44293212890625, 0.592529296875, 0.74212646484375, 0.8917236328125, 1.04132080078125, 1.19091796875, 1.34051513671875, 1.4901123046875, 1.63970947265625, 1.789306640625, 1.93890380859375, 2.0885009765625, 2.23809814453125, 2.3876953125, 2.53729248046875, 2.6868896484375, 2.83648681640625, 2.986083984375, 3.13568115234375, 3.2852783203125, 3.43487548828125, 3.58447265625, 3.73406982421875, 3.8836669921875, 4.03326416015625, 4.182861328125, 4.33245849609375, 4.4820556640625, 4.63165283203125, 4.78125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 4.0, 2.0, 11.0, 4.0, 9.0, 11.0, 8.0, 26.0, 19.0, 29.0, 23.0, 28.0, 36.0, 39.0, 36.0, 49.0, 40.0, 53.0, 40.0, 51.0, 48.0, 39.0, 50.0, 36.0, 34.0, 46.0, 30.0, 37.0, 28.0, 25.0, 18.0, 17.0, 15.0, 13.0, 12.0, 4.0, 7.0, 8.0, 4.0, 2.0, 2.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0], "bins": [-8.3515625, -8.12310791015625, -7.8946533203125, -7.66619873046875, -7.437744140625, -7.20928955078125, -6.9808349609375, -6.75238037109375, -6.52392578125, -6.29547119140625, -6.0670166015625, -5.83856201171875, -5.610107421875, -5.38165283203125, -5.1531982421875, -4.92474365234375, -4.6962890625, -4.46783447265625, -4.2393798828125, -4.01092529296875, -3.782470703125, -3.55401611328125, -3.3255615234375, -3.09710693359375, -2.86865234375, -2.64019775390625, -2.4117431640625, -2.18328857421875, -1.954833984375, -1.72637939453125, -1.4979248046875, -1.26947021484375, -1.041015625, -0.81256103515625, -0.5841064453125, -0.35565185546875, -0.127197265625, 0.10125732421875, 0.3297119140625, 0.55816650390625, 0.78662109375, 1.01507568359375, 1.2435302734375, 1.47198486328125, 1.700439453125, 1.92889404296875, 2.1573486328125, 2.38580322265625, 2.6142578125, 2.84271240234375, 3.0711669921875, 3.29962158203125, 3.528076171875, 3.75653076171875, 3.9849853515625, 4.21343994140625, 4.44189453125, 4.67034912109375, 4.8988037109375, 5.12725830078125, 5.355712890625, 5.58416748046875, 5.8126220703125, 6.04107666015625, 6.26953125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 10.0, 6.0, 5.0, 18.0, 33.0, 62.0, 168.0, 476.0, 2074.0, 26797.0, 932457.0, 81852.0, 3511.0, 724.0, 210.0, 73.0, 42.0, 17.0, 10.0, 5.0, 3.0, 4.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.05859375, -3.95355224609375, -3.8485107421875, -3.74346923828125, -3.638427734375, -3.53338623046875, -3.4283447265625, -3.32330322265625, -3.21826171875, -3.11322021484375, -3.0081787109375, -2.90313720703125, -2.798095703125, -2.69305419921875, -2.5880126953125, -2.48297119140625, -2.3779296875, -2.27288818359375, -2.1678466796875, -2.06280517578125, -1.957763671875, -1.85272216796875, -1.7476806640625, -1.64263916015625, -1.53759765625, -1.43255615234375, -1.3275146484375, -1.22247314453125, -1.117431640625, -1.01239013671875, -0.9073486328125, -0.80230712890625, -0.697265625, -0.59222412109375, -0.4871826171875, -0.38214111328125, -0.277099609375, -0.17205810546875, -0.0670166015625, 0.03802490234375, 0.14306640625, 0.24810791015625, 0.3531494140625, 0.45819091796875, 0.563232421875, 0.66827392578125, 0.7733154296875, 0.87835693359375, 0.9833984375, 1.08843994140625, 1.1934814453125, 1.29852294921875, 1.403564453125, 1.50860595703125, 1.6136474609375, 1.71868896484375, 1.82373046875, 1.92877197265625, 2.0338134765625, 2.13885498046875, 2.243896484375, 2.34893798828125, 2.4539794921875, 2.55902099609375, 2.6640625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 5.0, 4.0, 13.0, 11.0, 10.0, 15.0, 28.0, 27.0, 21.0, 29.0, 39.0, 47.0, 65.0, 69.0, 75.0, 65.0, 75.0, 71.0, 55.0, 60.0, 49.0, 30.0, 23.0, 23.0, 19.0, 8.0, 9.0, 8.0, 10.0, 9.0, 6.0, 8.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000263214111328125, -0.00025454163551330566, -0.00024586915969848633, -0.000237196683883667, -0.00022852420806884766, -0.00021985173225402832, -0.00021117925643920898, -0.00020250678062438965, -0.0001938343048095703, -0.00018516182899475098, -0.00017648935317993164, -0.0001678168773651123, -0.00015914440155029297, -0.00015047192573547363, -0.0001417994499206543, -0.00013312697410583496, -0.00012445449829101562, -0.00011578202247619629, -0.00010710954666137695, -9.843707084655762e-05, -8.976459503173828e-05, -8.109211921691895e-05, -7.241964340209961e-05, -6.374716758728027e-05, -5.507469177246094e-05, -4.64022159576416e-05, -3.7729740142822266e-05, -2.905726432800293e-05, -2.0384788513183594e-05, -1.1712312698364258e-05, -3.039836883544922e-06, 5.632638931274414e-06, 1.430511474609375e-05, 2.2977590560913086e-05, 3.165006637573242e-05, 4.032254219055176e-05, 4.8995018005371094e-05, 5.766749382019043e-05, 6.633996963500977e-05, 7.50124454498291e-05, 8.368492126464844e-05, 9.235739707946777e-05, 0.00010102987289428711, 0.00010970234870910645, 0.00011837482452392578, 0.00012704730033874512, 0.00013571977615356445, 0.0001443922519683838, 0.00015306472778320312, 0.00016173720359802246, 0.0001704096794128418, 0.00017908215522766113, 0.00018775463104248047, 0.0001964271068572998, 0.00020509958267211914, 0.00021377205848693848, 0.0002224445343017578, 0.00023111701011657715, 0.00023978948593139648, 0.0002484619617462158, 0.00025713443756103516, 0.0002658069133758545, 0.00027447938919067383, 0.00028315186500549316, 0.0002918243408203125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 0.0, 6.0, 6.0, 4.0, 12.0, 11.0, 12.0, 19.0, 35.0, 37.0, 46.0, 94.0, 129.0, 200.0, 380.0, 689.0, 1433.0, 3818.0, 14022.0, 95132.0, 734351.0, 167832.0, 21272.0, 5228.0, 1794.0, 827.0, 413.0, 236.0, 172.0, 103.0, 67.0, 45.0, 32.0, 32.0, 24.0, 11.0, 13.0, 5.0, 4.0, 3.0, 0.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2939453125, -1.247100830078125, -1.20025634765625, -1.153411865234375, -1.1065673828125, -1.059722900390625, -1.01287841796875, -0.966033935546875, -0.919189453125, -0.872344970703125, -0.82550048828125, -0.778656005859375, -0.7318115234375, -0.684967041015625, -0.63812255859375, -0.591278076171875, -0.54443359375, -0.497589111328125, -0.45074462890625, -0.403900146484375, -0.3570556640625, -0.310211181640625, -0.26336669921875, -0.216522216796875, -0.169677734375, -0.122833251953125, -0.07598876953125, -0.029144287109375, 0.0177001953125, 0.064544677734375, 0.11138916015625, 0.158233642578125, 0.205078125, 0.251922607421875, 0.29876708984375, 0.345611572265625, 0.3924560546875, 0.439300537109375, 0.48614501953125, 0.532989501953125, 0.579833984375, 0.626678466796875, 0.67352294921875, 0.720367431640625, 0.7672119140625, 0.814056396484375, 0.86090087890625, 0.907745361328125, 0.95458984375, 1.001434326171875, 1.04827880859375, 1.095123291015625, 1.1419677734375, 1.188812255859375, 1.23565673828125, 1.282501220703125, 1.329345703125, 1.376190185546875, 1.42303466796875, 1.469879150390625, 1.5167236328125, 1.563568115234375, 1.61041259765625, 1.657257080078125, 1.7041015625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 1.0, 7.0, 12.0, 11.0, 19.0, 11.0, 21.0, 35.0, 31.0, 28.0, 35.0, 49.0, 46.0, 57.0, 62.0, 67.0, 68.0, 70.0, 49.0, 45.0, 49.0, 39.0, 39.0, 21.0, 17.0, 22.0, 18.0, 9.0, 10.0, 5.0, 5.0, 7.0, 8.0, 7.0, 5.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-1.3359375, -1.2995376586914062, -1.2631378173828125, -1.2267379760742188, -1.190338134765625, -1.1539382934570312, -1.1175384521484375, -1.0811386108398438, -1.04473876953125, -1.0083389282226562, -0.9719390869140625, -0.9355392456054688, -0.899139404296875, -0.8627395629882812, -0.8263397216796875, -0.7899398803710938, -0.7535400390625, -0.7171401977539062, -0.6807403564453125, -0.6443405151367188, -0.607940673828125, -0.5715408325195312, -0.5351409912109375, -0.49874114990234375, -0.46234130859375, -0.42594146728515625, -0.3895416259765625, -0.35314178466796875, -0.316741943359375, -0.28034210205078125, -0.2439422607421875, -0.20754241943359375, -0.171142578125, -0.13474273681640625, -0.0983428955078125, -0.06194305419921875, -0.025543212890625, 0.01085662841796875, 0.0472564697265625, 0.08365631103515625, 0.12005615234375, 0.15645599365234375, 0.1928558349609375, 0.22925567626953125, 0.265655517578125, 0.30205535888671875, 0.3384552001953125, 0.37485504150390625, 0.4112548828125, 0.44765472412109375, 0.4840545654296875, 0.5204544067382812, 0.556854248046875, 0.5932540893554688, 0.6296539306640625, 0.6660537719726562, 0.70245361328125, 0.7388534545898438, 0.7752532958984375, 0.8116531372070312, 0.848052978515625, 0.8844528198242188, 0.9208526611328125, 0.9572525024414062, 0.99365234375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 2.0, 6.0, 10.0, 46.0, 115.0, 232.0, 274.0, 171.0, 74.0, 31.0, 24.0, 6.0, 2.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.99610137939453, -54.53335189819336, -53.07060241699219, -51.607852935791016, -50.145103454589844, -48.682350158691406, -47.219600677490234, -45.75685119628906, -44.29410171508789, -42.83135223388672, -41.36860275268555, -39.905853271484375, -38.44309997558594, -36.980350494384766, -35.517601013183594, -34.05485153198242, -32.59210205078125, -31.129352569580078, -29.666603088378906, -28.2038516998291, -26.74110221862793, -25.278352737426758, -23.815601348876953, -22.35285186767578, -20.89010238647461, -19.427352905273438, -17.964603424072266, -16.50185203552246, -15.039102554321289, -13.576353073120117, -12.113602638244629, -10.65085220336914, -9.188102722167969, -7.725352764129639, -6.262602806091309, -4.7998528480529785, -3.3371028900146484, -1.8743529319763184, -0.4116029739379883, 1.0511474609375, 2.513896942138672, 3.976646900177002, 5.439396858215332, 6.902146816253662, 8.364896774291992, 9.827646255493164, 11.290396690368652, 12.75314712524414, 14.215896606445312, 15.678646087646484, 17.141395568847656, 18.60414695739746, 20.066896438598633, 21.529645919799805, 22.99239730834961, 24.45514678955078, 25.917896270751953, 27.380645751953125, 28.843395233154297, 30.3061466217041, 31.768896102905273, 33.23164749145508, 34.69439697265625, 36.15714645385742, 37.619895935058594]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 1.0, 2.0, 6.0, 3.0, 8.0, 7.0, 9.0, 12.0, 13.0, 8.0, 20.0, 17.0, 11.0, 25.0, 32.0, 35.0, 36.0, 34.0, 44.0, 47.0, 66.0, 69.0, 57.0, 50.0, 37.0, 45.0, 27.0, 37.0, 27.0, 32.0, 30.0, 20.0, 22.0, 20.0, 17.0, 10.0, 17.0, 12.0, 7.0, 7.0, 4.0, 2.0, 6.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-23.298927307128906, -22.50018310546875, -21.701438903808594, -20.902694702148438, -20.10395050048828, -19.305204391479492, -18.506460189819336, -17.70771598815918, -16.908971786499023, -16.110227584838867, -15.311483383178711, -14.512738227844238, -13.713994026184082, -12.915249824523926, -12.116504669189453, -11.317760467529297, -10.51901626586914, -9.720272064208984, -8.921527862548828, -8.122782707214355, -7.324038505554199, -6.525294303894043, -5.7265496253967285, -4.927804946899414, -4.129060745239258, -3.3303163051605225, -2.531571865081787, -1.7328274250030518, -0.9340829849243164, -0.13533854484558105, 0.6634058952331543, 1.4621505737304688, 2.260896682739258, 3.059641122817993, 3.8583855628967285, 4.657130241394043, 5.455874443054199, 6.2546186447143555, 7.05336332321167, 7.852108001708984, 8.65085220336914, 9.449596405029297, 10.248340606689453, 11.047085762023926, 11.845829963684082, 12.644574165344238, 13.443319320678711, 14.242063522338867, 15.040807723999023, 15.83955192565918, 16.638296127319336, 17.437040328979492, 18.23578643798828, 19.034530639648438, 19.833274841308594, 20.63201904296875, 21.430763244628906, 22.229507446289062, 23.02825164794922, 23.826995849609375, 24.62574005126953, 25.42448616027832, 26.223230361938477, 27.021974563598633, 27.82071876525879]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 6.0, 2.0, 2.0, 14.0, 9.0, 11.0, 14.0, 19.0, 29.0, 44.0, 70.0, 99.0, 172.0, 312.0, 646.0, 1428.0, 3559.0, 10283.0, 36780.0, 213395.0, 1761377.0, 1882766.0, 227667.0, 38177.0, 10562.0, 3716.0, 1487.0, 726.0, 327.0, 221.0, 113.0, 83.0, 60.0, 37.0, 23.0, 22.0, 13.0, 9.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.931640625, -2.86016845703125, -2.7886962890625, -2.71722412109375, -2.645751953125, -2.57427978515625, -2.5028076171875, -2.43133544921875, -2.35986328125, -2.28839111328125, -2.2169189453125, -2.14544677734375, -2.073974609375, -2.00250244140625, -1.9310302734375, -1.85955810546875, -1.7880859375, -1.71661376953125, -1.6451416015625, -1.57366943359375, -1.502197265625, -1.43072509765625, -1.3592529296875, -1.28778076171875, -1.21630859375, -1.14483642578125, -1.0733642578125, -1.00189208984375, -0.930419921875, -0.85894775390625, -0.7874755859375, -0.71600341796875, -0.64453125, -0.57305908203125, -0.5015869140625, -0.43011474609375, -0.358642578125, -0.28717041015625, -0.2156982421875, -0.14422607421875, -0.07275390625, -0.00128173828125, 0.0701904296875, 0.14166259765625, 0.213134765625, 0.28460693359375, 0.3560791015625, 0.42755126953125, 0.4990234375, 0.57049560546875, 0.6419677734375, 0.71343994140625, 0.784912109375, 0.85638427734375, 0.9278564453125, 0.99932861328125, 1.07080078125, 1.14227294921875, 1.2137451171875, 1.28521728515625, 1.356689453125, 1.42816162109375, 1.4996337890625, 1.57110595703125, 1.642578125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 8.0, 6.0, 7.0, 9.0, 24.0, 22.0, 27.0, 32.0, 33.0, 48.0, 54.0, 53.0, 75.0, 73.0, 67.0, 70.0, 67.0, 59.0, 47.0, 51.0, 38.0, 42.0, 21.0, 28.0, 16.0, 9.0, 6.0, 6.0, 6.0, 3.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.609375, -1.537841796875, -1.46630859375, -1.394775390625, -1.3232421875, -1.251708984375, -1.18017578125, -1.108642578125, -1.037109375, -0.965576171875, -0.89404296875, -0.822509765625, -0.7509765625, -0.679443359375, -0.60791015625, -0.536376953125, -0.46484375, -0.393310546875, -0.32177734375, -0.250244140625, -0.1787109375, -0.107177734375, -0.03564453125, 0.035888671875, 0.107421875, 0.178955078125, 0.25048828125, 0.322021484375, 0.3935546875, 0.465087890625, 0.53662109375, 0.608154296875, 0.6796875, 0.751220703125, 0.82275390625, 0.894287109375, 0.9658203125, 1.037353515625, 1.10888671875, 1.180419921875, 1.251953125, 1.323486328125, 1.39501953125, 1.466552734375, 1.5380859375, 1.609619140625, 1.68115234375, 1.752685546875, 1.82421875, 1.895751953125, 1.96728515625, 2.038818359375, 2.1103515625, 2.181884765625, 2.25341796875, 2.324951171875, 2.396484375, 2.468017578125, 2.53955078125, 2.611083984375, 2.6826171875, 2.754150390625, 2.82568359375, 2.897216796875, 2.96875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 3.0, 2.0, 3.0, 7.0, 7.0, 8.0, 14.0, 21.0, 27.0, 37.0, 42.0, 61.0, 131.0, 138.0, 205.0, 358.0, 592.0, 1200.0, 2690.0, 6680.0, 19391.0, 67703.0, 381573.0, 3033680.0, 566851.0, 79937.0, 20828.0, 6760.0, 2706.0, 1184.0, 594.0, 318.0, 158.0, 126.0, 75.0, 38.0, 34.0, 24.0, 21.0, 15.0, 12.0, 9.0, 9.0, 0.0, 6.0, 2.0, 3.0, 3.0, 2.0], "bins": [-3.07421875, -2.994537353515625, -2.91485595703125, -2.835174560546875, -2.7554931640625, -2.675811767578125, -2.59613037109375, -2.516448974609375, -2.436767578125, -2.357086181640625, -2.27740478515625, -2.197723388671875, -2.1180419921875, -2.038360595703125, -1.95867919921875, -1.878997802734375, -1.79931640625, -1.719635009765625, -1.63995361328125, -1.560272216796875, -1.4805908203125, -1.400909423828125, -1.32122802734375, -1.241546630859375, -1.161865234375, -1.082183837890625, -1.00250244140625, -0.922821044921875, -0.8431396484375, -0.763458251953125, -0.68377685546875, -0.604095458984375, -0.5244140625, -0.444732666015625, -0.36505126953125, -0.285369873046875, -0.2056884765625, -0.126007080078125, -0.04632568359375, 0.033355712890625, 0.113037109375, 0.192718505859375, 0.27239990234375, 0.352081298828125, 0.4317626953125, 0.511444091796875, 0.59112548828125, 0.670806884765625, 0.75048828125, 0.830169677734375, 0.90985107421875, 0.989532470703125, 1.0692138671875, 1.148895263671875, 1.22857666015625, 1.308258056640625, 1.387939453125, 1.467620849609375, 1.54730224609375, 1.626983642578125, 1.7066650390625, 1.786346435546875, 1.86602783203125, 1.945709228515625, 2.025390625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 5.0, 5.0, 11.0, 11.0, 11.0, 18.0, 20.0, 25.0, 45.0, 56.0, 102.0, 131.0, 278.0, 435.0, 749.0, 836.0, 561.0, 313.0, 162.0, 107.0, 56.0, 46.0, 32.0, 19.0, 11.0, 9.0, 6.0, 4.0, 3.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9453125, -4.81573486328125, -4.6861572265625, -4.55657958984375, -4.427001953125, -4.29742431640625, -4.1678466796875, -4.03826904296875, -3.90869140625, -3.77911376953125, -3.6495361328125, -3.51995849609375, -3.390380859375, -3.26080322265625, -3.1312255859375, -3.00164794921875, -2.8720703125, -2.74249267578125, -2.6129150390625, -2.48333740234375, -2.353759765625, -2.22418212890625, -2.0946044921875, -1.96502685546875, -1.83544921875, -1.70587158203125, -1.5762939453125, -1.44671630859375, -1.317138671875, -1.18756103515625, -1.0579833984375, -0.92840576171875, -0.798828125, -0.66925048828125, -0.5396728515625, -0.41009521484375, -0.280517578125, -0.15093994140625, -0.0213623046875, 0.10821533203125, 0.23779296875, 0.36737060546875, 0.4969482421875, 0.62652587890625, 0.756103515625, 0.88568115234375, 1.0152587890625, 1.14483642578125, 1.2744140625, 1.40399169921875, 1.5335693359375, 1.66314697265625, 1.792724609375, 1.92230224609375, 2.0518798828125, 2.18145751953125, 2.31103515625, 2.44061279296875, 2.5701904296875, 2.69976806640625, 2.829345703125, 2.95892333984375, 3.0885009765625, 3.21807861328125, 3.34765625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 3.0, 5.0, 18.0, 56.0, 176.0, 340.0, 264.0, 96.0, 28.0, 3.0, 6.0, 4.0, 3.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 4.0], "bins": [-91.42184448242188, -89.58707427978516, -87.7522964477539, -85.91752624511719, -84.08275604248047, -82.24797821044922, -80.4132080078125, -78.57843780517578, -76.74365997314453, -74.90888977050781, -73.07411193847656, -71.23934173583984, -69.40457153320312, -67.56979370117188, -65.73502349853516, -63.90024948120117, -62.06547927856445, -60.23070526123047, -58.39593505859375, -56.561161041259766, -54.72638702392578, -52.89161682128906, -51.05684280395508, -49.222068786621094, -47.387298583984375, -45.55252456665039, -43.71775436401367, -41.88298034667969, -40.0482063293457, -38.21343231201172, -36.378662109375, -34.543888092041016, -32.7091178894043, -30.874345779418945, -29.03957176208496, -27.20479965209961, -25.370025634765625, -23.535253524780273, -21.700481414794922, -19.865707397460938, -18.030935287475586, -16.196163177490234, -14.36138916015625, -12.526617050170898, -10.69184398651123, -8.857070922851562, -7.022298812866211, -5.187525749206543, -3.352752685546875, -1.5179798603057861, 0.31679296493530273, 2.1515655517578125, 3.9863386154174805, 5.821111679077148, 7.6558837890625, 9.490656852722168, 11.325429916381836, 13.160202980041504, 14.994976043701172, 16.829748153686523, 18.664520263671875, 20.49929428100586, 22.33406639099121, 24.168838500976562, 26.003612518310547]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 6.0, 5.0, 5.0, 6.0, 9.0, 9.0, 19.0, 18.0, 26.0, 23.0, 29.0, 34.0, 55.0, 60.0, 54.0, 55.0, 53.0, 79.0, 65.0, 46.0, 42.0, 53.0, 38.0, 38.0, 47.0, 42.0, 21.0, 22.0, 15.0, 14.0, 5.0, 8.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.71340560913086, -24.034442901611328, -23.355480194091797, -22.676517486572266, -21.997554779052734, -21.318592071533203, -20.639629364013672, -19.96066665649414, -19.28170394897461, -18.602741241455078, -17.923778533935547, -17.244815826416016, -16.565853118896484, -15.886890411376953, -15.207927703857422, -14.52896499633789, -13.85000228881836, -13.171039581298828, -12.492076873779297, -11.813114166259766, -11.134151458740234, -10.455188751220703, -9.776226043701172, -9.09726333618164, -8.41830062866211, -7.739337921142578, -7.060375213623047, -6.381412506103516, -5.702449798583984, -5.023487091064453, -4.344524383544922, -3.6655616760253906, -2.986600875854492, -2.307638168334961, -1.6286754608154297, -0.9497127532958984, -0.2707500457763672, 0.40821266174316406, 1.0871753692626953, 1.7661380767822266, 2.445100784301758, 3.124063491821289, 3.8030261993408203, 4.481988906860352, 5.160951614379883, 5.839914321899414, 6.518877029418945, 7.197839736938477, 7.876802444458008, 8.555765151977539, 9.23472785949707, 9.913690567016602, 10.592653274536133, 11.271615982055664, 11.950578689575195, 12.629541397094727, 13.308504104614258, 13.987466812133789, 14.66642951965332, 15.345392227172852, 16.024354934692383, 16.703317642211914, 17.382280349731445, 18.061243057250977, 18.740205764770508]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 0.0, 3.0, 1.0, 10.0, 5.0, 9.0, 16.0, 24.0, 37.0, 51.0, 104.0, 137.0, 245.0, 403.0, 665.0, 1144.0, 2136.0, 3937.0, 7756.0, 15890.0, 33023.0, 69283.0, 150481.0, 280518.0, 249218.0, 122406.0, 56666.0, 27222.0, 12966.0, 6508.0, 3385.0, 1851.0, 981.0, 594.0, 337.0, 225.0, 111.0, 82.0, 56.0, 25.0, 15.0, 13.0, 9.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.09765625, -2.031829833984375, -1.96600341796875, -1.900177001953125, -1.8343505859375, -1.768524169921875, -1.70269775390625, -1.636871337890625, -1.571044921875, -1.505218505859375, -1.43939208984375, -1.373565673828125, -1.3077392578125, -1.241912841796875, -1.17608642578125, -1.110260009765625, -1.04443359375, -0.978607177734375, -0.91278076171875, -0.846954345703125, -0.7811279296875, -0.715301513671875, -0.64947509765625, -0.583648681640625, -0.517822265625, -0.451995849609375, -0.38616943359375, -0.320343017578125, -0.2545166015625, -0.188690185546875, -0.12286376953125, -0.057037353515625, 0.0087890625, 0.074615478515625, 0.14044189453125, 0.206268310546875, 0.2720947265625, 0.337921142578125, 0.40374755859375, 0.469573974609375, 0.535400390625, 0.601226806640625, 0.66705322265625, 0.732879638671875, 0.7987060546875, 0.864532470703125, 0.93035888671875, 0.996185302734375, 1.06201171875, 1.127838134765625, 1.19366455078125, 1.259490966796875, 1.3253173828125, 1.391143798828125, 1.45697021484375, 1.522796630859375, 1.588623046875, 1.654449462890625, 1.72027587890625, 1.786102294921875, 1.8519287109375, 1.917755126953125, 1.98358154296875, 2.049407958984375, 2.115234375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 4.0, 8.0, 3.0, 13.0, 14.0, 13.0, 10.0, 19.0, 21.0, 26.0, 25.0, 24.0, 39.0, 37.0, 47.0, 46.0, 51.0, 49.0, 38.0, 56.0, 48.0, 48.0, 37.0, 45.0, 35.0, 33.0, 45.0, 36.0, 29.0, 30.0, 12.0, 14.0, 13.0, 15.0, 7.0, 7.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.669921875, -1.61968994140625, -1.5694580078125, -1.51922607421875, -1.468994140625, -1.41876220703125, -1.3685302734375, -1.31829833984375, -1.26806640625, -1.21783447265625, -1.1676025390625, -1.11737060546875, -1.067138671875, -1.01690673828125, -0.9666748046875, -0.91644287109375, -0.8662109375, -0.81597900390625, -0.7657470703125, -0.71551513671875, -0.665283203125, -0.61505126953125, -0.5648193359375, -0.51458740234375, -0.46435546875, -0.41412353515625, -0.3638916015625, -0.31365966796875, -0.263427734375, -0.21319580078125, -0.1629638671875, -0.11273193359375, -0.0625, -0.01226806640625, 0.0379638671875, 0.08819580078125, 0.138427734375, 0.18865966796875, 0.2388916015625, 0.28912353515625, 0.33935546875, 0.38958740234375, 0.4398193359375, 0.49005126953125, 0.540283203125, 0.59051513671875, 0.6407470703125, 0.69097900390625, 0.7412109375, 0.79144287109375, 0.8416748046875, 0.89190673828125, 0.942138671875, 0.99237060546875, 1.0426025390625, 1.09283447265625, 1.14306640625, 1.19329833984375, 1.2435302734375, 1.29376220703125, 1.343994140625, 1.39422607421875, 1.4444580078125, 1.49468994140625, 1.544921875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 5.0, 9.0, 7.0, 12.0, 20.0, 29.0, 37.0, 37.0, 61.0, 90.0, 142.0, 188.0, 324.0, 466.0, 774.0, 1434.0, 3630.0, 15629.0, 132096.0, 759746.0, 112742.0, 13894.0, 3533.0, 1495.0, 751.0, 454.0, 296.0, 199.0, 149.0, 86.0, 72.0, 46.0, 31.0, 16.0, 21.0, 12.0, 6.0, 6.0, 6.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.0546875, -5.873779296875, -5.69287109375, -5.511962890625, -5.3310546875, -5.150146484375, -4.96923828125, -4.788330078125, -4.607421875, -4.426513671875, -4.24560546875, -4.064697265625, -3.8837890625, -3.702880859375, -3.52197265625, -3.341064453125, -3.16015625, -2.979248046875, -2.79833984375, -2.617431640625, -2.4365234375, -2.255615234375, -2.07470703125, -1.893798828125, -1.712890625, -1.531982421875, -1.35107421875, -1.170166015625, -0.9892578125, -0.808349609375, -0.62744140625, -0.446533203125, -0.265625, -0.084716796875, 0.09619140625, 0.277099609375, 0.4580078125, 0.638916015625, 0.81982421875, 1.000732421875, 1.181640625, 1.362548828125, 1.54345703125, 1.724365234375, 1.9052734375, 2.086181640625, 2.26708984375, 2.447998046875, 2.62890625, 2.809814453125, 2.99072265625, 3.171630859375, 3.3525390625, 3.533447265625, 3.71435546875, 3.895263671875, 4.076171875, 4.257080078125, 4.43798828125, 4.618896484375, 4.7998046875, 4.980712890625, 5.16162109375, 5.342529296875, 5.5234375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 3.0, 4.0, 2.0, 6.0, 3.0, 9.0, 11.0, 13.0, 13.0, 21.0, 18.0, 15.0, 23.0, 26.0, 26.0, 29.0, 32.0, 44.0, 56.0, 49.0, 44.0, 51.0, 51.0, 38.0, 45.0, 56.0, 34.0, 40.0, 39.0, 33.0, 19.0, 30.0, 18.0, 21.0, 19.0, 16.0, 9.0, 12.0, 3.0, 8.0, 4.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-6.19921875, -6.02728271484375, -5.8553466796875, -5.68341064453125, -5.511474609375, -5.33953857421875, -5.1676025390625, -4.99566650390625, -4.82373046875, -4.65179443359375, -4.4798583984375, -4.30792236328125, -4.135986328125, -3.96405029296875, -3.7921142578125, -3.62017822265625, -3.4482421875, -3.27630615234375, -3.1043701171875, -2.93243408203125, -2.760498046875, -2.58856201171875, -2.4166259765625, -2.24468994140625, -2.07275390625, -1.90081787109375, -1.7288818359375, -1.55694580078125, -1.385009765625, -1.21307373046875, -1.0411376953125, -0.86920166015625, -0.697265625, -0.52532958984375, -0.3533935546875, -0.18145751953125, -0.009521484375, 0.16241455078125, 0.3343505859375, 0.50628662109375, 0.67822265625, 0.85015869140625, 1.0220947265625, 1.19403076171875, 1.365966796875, 1.53790283203125, 1.7098388671875, 1.88177490234375, 2.0537109375, 2.22564697265625, 2.3975830078125, 2.56951904296875, 2.741455078125, 2.91339111328125, 3.0853271484375, 3.25726318359375, 3.42919921875, 3.60113525390625, 3.7730712890625, 3.94500732421875, 4.116943359375, 4.28887939453125, 4.4608154296875, 4.63275146484375, 4.8046875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 6.0, 13.0, 15.0, 35.0, 52.0, 110.0, 164.0, 371.0, 975.0, 3655.0, 22401.0, 220716.0, 719026.0, 69312.0, 8621.0, 1855.0, 655.0, 267.0, 136.0, 57.0, 47.0, 16.0, 18.0, 10.0, 9.0, 7.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5771484375, -1.5250244140625, -1.472900390625, -1.4207763671875, -1.36865234375, -1.3165283203125, -1.264404296875, -1.2122802734375, -1.16015625, -1.1080322265625, -1.055908203125, -1.0037841796875, -0.95166015625, -0.8995361328125, -0.847412109375, -0.7952880859375, -0.7431640625, -0.6910400390625, -0.638916015625, -0.5867919921875, -0.53466796875, -0.4825439453125, -0.430419921875, -0.3782958984375, -0.326171875, -0.2740478515625, -0.221923828125, -0.1697998046875, -0.11767578125, -0.0655517578125, -0.013427734375, 0.0386962890625, 0.0908203125, 0.1429443359375, 0.195068359375, 0.2471923828125, 0.29931640625, 0.3514404296875, 0.403564453125, 0.4556884765625, 0.5078125, 0.5599365234375, 0.612060546875, 0.6641845703125, 0.71630859375, 0.7684326171875, 0.820556640625, 0.8726806640625, 0.9248046875, 0.9769287109375, 1.029052734375, 1.0811767578125, 1.13330078125, 1.1854248046875, 1.237548828125, 1.2896728515625, 1.341796875, 1.3939208984375, 1.446044921875, 1.4981689453125, 1.55029296875, 1.6024169921875, 1.654541015625, 1.7066650390625, 1.7587890625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 5.0, 5.0, 5.0, 10.0, 16.0, 17.0, 24.0, 25.0, 45.0, 37.0, 58.0, 71.0, 79.0, 96.0, 107.0, 79.0, 55.0, 55.0, 48.0, 33.0, 37.0, 13.0, 20.0, 17.0, 14.0, 5.0, 6.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002989768981933594, -0.00028873980045318604, -0.0002785027027130127, -0.00026826560497283936, -0.000258028507232666, -0.0002477914094924927, -0.00023755431175231934, -0.000227317214012146, -0.00021708011627197266, -0.00020684301853179932, -0.00019660592079162598, -0.00018636882305145264, -0.0001761317253112793, -0.00016589462757110596, -0.00015565752983093262, -0.00014542043209075928, -0.00013518333435058594, -0.0001249462366104126, -0.00011470913887023926, -0.00010447204113006592, -9.423494338989258e-05, -8.399784564971924e-05, -7.37607479095459e-05, -6.352365016937256e-05, -5.328655242919922e-05, -4.304945468902588e-05, -3.281235694885254e-05, -2.25752592086792e-05, -1.233816146850586e-05, -2.1010637283325195e-06, 8.13603401184082e-06, 1.837313175201416e-05, 2.86102294921875e-05, 3.884732723236084e-05, 4.908442497253418e-05, 5.932152271270752e-05, 6.955862045288086e-05, 7.97957181930542e-05, 9.003281593322754e-05, 0.00010026991367340088, 0.00011050701141357422, 0.00012074410915374756, 0.0001309812068939209, 0.00014121830463409424, 0.00015145540237426758, 0.00016169250011444092, 0.00017192959785461426, 0.0001821666955947876, 0.00019240379333496094, 0.00020264089107513428, 0.00021287798881530762, 0.00022311508655548096, 0.0002333521842956543, 0.00024358928203582764, 0.000253826379776001, 0.0002640634775161743, 0.00027430057525634766, 0.000284537672996521, 0.00029477477073669434, 0.0003050118684768677, 0.000315248966217041, 0.00032548606395721436, 0.0003357231616973877, 0.00034596025943756104, 0.0003561973571777344]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 5.0, 7.0, 2.0, 9.0, 14.0, 13.0, 28.0, 45.0, 35.0, 83.0, 131.0, 207.0, 343.0, 665.0, 1353.0, 3654.0, 14804.0, 110819.0, 721585.0, 166089.0, 20778.0, 4541.0, 1603.0, 730.0, 396.0, 212.0, 153.0, 87.0, 55.0, 33.0, 25.0, 16.0, 13.0, 10.0, 8.0, 3.0, 4.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3251953125, -1.2818756103515625, -1.238555908203125, -1.1952362060546875, -1.15191650390625, -1.1085968017578125, -1.065277099609375, -1.0219573974609375, -0.9786376953125, -0.9353179931640625, -0.891998291015625, -0.8486785888671875, -0.80535888671875, -0.7620391845703125, -0.718719482421875, -0.6753997802734375, -0.632080078125, -0.5887603759765625, -0.545440673828125, -0.5021209716796875, -0.45880126953125, -0.4154815673828125, -0.372161865234375, -0.3288421630859375, -0.2855224609375, -0.2422027587890625, -0.198883056640625, -0.1555633544921875, -0.11224365234375, -0.0689239501953125, -0.025604248046875, 0.0177154541015625, 0.06103515625, 0.1043548583984375, 0.147674560546875, 0.1909942626953125, 0.23431396484375, 0.2776336669921875, 0.320953369140625, 0.3642730712890625, 0.4075927734375, 0.4509124755859375, 0.494232177734375, 0.5375518798828125, 0.58087158203125, 0.6241912841796875, 0.667510986328125, 0.7108306884765625, 0.754150390625, 0.7974700927734375, 0.840789794921875, 0.8841094970703125, 0.92742919921875, 0.9707489013671875, 1.014068603515625, 1.0573883056640625, 1.1007080078125, 1.1440277099609375, 1.187347412109375, 1.2306671142578125, 1.27398681640625, 1.3173065185546875, 1.360626220703125, 1.4039459228515625, 1.447265625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 6.0, 4.0, 4.0, 3.0, 5.0, 7.0, 7.0, 12.0, 11.0, 19.0, 16.0, 20.0, 20.0, 34.0, 43.0, 29.0, 38.0, 36.0, 47.0, 57.0, 52.0, 50.0, 46.0, 48.0, 45.0, 50.0, 43.0, 41.0, 34.0, 32.0, 22.0, 17.0, 13.0, 14.0, 17.0, 13.0, 5.0, 8.0, 5.0, 7.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.95361328125, -0.9252243041992188, -0.8968353271484375, -0.8684463500976562, -0.840057373046875, -0.8116683959960938, -0.7832794189453125, -0.7548904418945312, -0.72650146484375, -0.6981124877929688, -0.6697235107421875, -0.6413345336914062, -0.612945556640625, -0.5845565795898438, -0.5561676025390625, -0.5277786254882812, -0.4993896484375, -0.47100067138671875, -0.4426116943359375, -0.41422271728515625, -0.385833740234375, -0.35744476318359375, -0.3290557861328125, -0.30066680908203125, -0.27227783203125, -0.24388885498046875, -0.2154998779296875, -0.18711090087890625, -0.158721923828125, -0.13033294677734375, -0.1019439697265625, -0.07355499267578125, -0.045166015625, -0.01677703857421875, 0.0116119384765625, 0.04000091552734375, 0.068389892578125, 0.09677886962890625, 0.1251678466796875, 0.15355682373046875, 0.18194580078125, 0.21033477783203125, 0.2387237548828125, 0.26711273193359375, 0.295501708984375, 0.32389068603515625, 0.3522796630859375, 0.38066864013671875, 0.4090576171875, 0.43744659423828125, 0.4658355712890625, 0.49422454833984375, 0.522613525390625, 0.5510025024414062, 0.5793914794921875, 0.6077804565429688, 0.63616943359375, 0.6645584106445312, 0.6929473876953125, 0.7213363647460938, 0.749725341796875, 0.7781143188476562, 0.8065032958984375, 0.8348922729492188, 0.86328125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 7.0, 10.0, 14.0, 49.0, 97.0, 184.0, 313.0, 175.0, 76.0, 32.0, 18.0, 14.0, 4.0, 1.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.17835235595703, -32.7778434753418, -31.377338409423828, -29.976829528808594, -28.576324462890625, -27.17581558227539, -25.77530860900879, -24.374801635742188, -22.974294662475586, -21.573787689208984, -20.173280715942383, -18.77277374267578, -17.372264862060547, -15.971758842468262, -14.571250915527344, -13.170743942260742, -11.77023696899414, -10.369729995727539, -8.969223022460938, -7.5687150955200195, -6.168208122253418, -4.767701148986816, -3.3671932220458984, -1.9666862487792969, -0.5661792755126953, 0.8343279361724854, 2.234835147857666, 3.635342597961426, 5.035849571228027, 6.436356544494629, 7.836864471435547, 9.237371444702148, 10.63787841796875, 12.038385391235352, 13.438892364501953, 14.839400291442871, 16.239906311035156, 17.64041519165039, 19.040922164916992, 20.441429138183594, 21.841936111450195, 23.242443084716797, 24.6429500579834, 26.04345703125, 27.443965911865234, 28.844470977783203, 30.244979858398438, 31.64548683166504, 33.04599380493164, 34.446502685546875, 35.847007751464844, 37.24751663208008, 38.64802169799805, 40.04853057861328, 41.44903564453125, 42.849544525146484, 44.25005340576172, 45.65056228637695, 47.05106735229492, 48.451576232910156, 49.852081298828125, 51.25259017944336, 52.653099060058594, 54.05360412597656, 55.45410919189453]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 9.0, 3.0, 11.0, 13.0, 11.0, 11.0, 15.0, 17.0, 21.0, 22.0, 29.0, 28.0, 35.0, 40.0, 23.0, 49.0, 61.0, 79.0, 78.0, 56.0, 47.0, 43.0, 31.0, 27.0, 36.0, 34.0, 15.0, 16.0, 22.0, 28.0, 11.0, 12.0, 15.0, 15.0, 10.0, 10.0, 5.0, 6.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.484622955322266, -22.8031063079834, -22.12158966064453, -21.440073013305664, -20.758556365966797, -20.077037811279297, -19.39552116394043, -18.714004516601562, -18.032487869262695, -17.350971221923828, -16.66945457458496, -15.987936973571777, -15.30642032623291, -14.624903678894043, -13.94338607788086, -13.261869430541992, -12.580352783203125, -11.898836135864258, -11.21731948852539, -10.535801887512207, -9.85428524017334, -9.172768592834473, -8.491250991821289, -7.809734344482422, -7.128217697143555, -6.4467010498046875, -5.765183925628662, -5.083666801452637, -4.4021501541137695, -3.7206332683563232, -3.039116382598877, -2.3575992584228516, -1.6760845184326172, -0.9945676326751709, -0.3130507469177246, 0.3684661388397217, 1.049983024597168, 1.7314999103546143, 2.4130167961120605, 3.094533920288086, 3.776050567626953, 4.45756721496582, 5.139084339141846, 5.820601463317871, 6.502118110656738, 7.1836347579956055, 7.865151882171631, 8.546669006347656, 9.228185653686523, 9.90970230102539, 10.591218948364258, 11.272736549377441, 11.954253196716309, 12.635769844055176, 13.31728744506836, 13.998804092407227, 14.680320739746094, 15.361837387084961, 16.043354034423828, 16.724870681762695, 17.406387329101562, 18.087905883789062, 18.76942253112793, 19.450939178466797, 20.132455825805664]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 4.0, 8.0, 15.0, 9.0, 13.0, 21.0, 35.0, 56.0, 78.0, 139.0, 224.0, 455.0, 911.0, 1934.0, 4807.0, 16520.0, 93979.0, 986364.0, 2608126.0, 415555.0, 47048.0, 11055.0, 3685.0, 1529.0, 718.0, 394.0, 233.0, 145.0, 98.0, 42.0, 33.0, 21.0, 14.0, 9.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.32421875, -2.256500244140625, -2.18878173828125, -2.121063232421875, -2.0533447265625, -1.985626220703125, -1.91790771484375, -1.850189208984375, -1.782470703125, -1.714752197265625, -1.64703369140625, -1.579315185546875, -1.5115966796875, -1.443878173828125, -1.37615966796875, -1.308441162109375, -1.24072265625, -1.173004150390625, -1.10528564453125, -1.037567138671875, -0.9698486328125, -0.902130126953125, -0.83441162109375, -0.766693115234375, -0.698974609375, -0.631256103515625, -0.56353759765625, -0.495819091796875, -0.4281005859375, -0.360382080078125, -0.29266357421875, -0.224945068359375, -0.1572265625, -0.089508056640625, -0.02178955078125, 0.045928955078125, 0.1136474609375, 0.181365966796875, 0.24908447265625, 0.316802978515625, 0.384521484375, 0.452239990234375, 0.51995849609375, 0.587677001953125, 0.6553955078125, 0.723114013671875, 0.79083251953125, 0.858551025390625, 0.92626953125, 0.993988037109375, 1.06170654296875, 1.129425048828125, 1.1971435546875, 1.264862060546875, 1.33258056640625, 1.400299072265625, 1.468017578125, 1.535736083984375, 1.60345458984375, 1.671173095703125, 1.7388916015625, 1.806610107421875, 1.87432861328125, 1.942047119140625, 2.009765625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 1.0, 4.0, 8.0, 3.0, 8.0, 9.0, 11.0, 13.0, 28.0, 20.0, 26.0, 29.0, 29.0, 31.0, 45.0, 47.0, 45.0, 40.0, 48.0, 45.0, 50.0, 44.0, 47.0, 50.0, 45.0, 46.0, 43.0, 28.0, 27.0, 33.0, 19.0, 26.0, 13.0, 16.0, 3.0, 8.0, 5.0, 5.0, 2.0, 3.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.552734375, -1.5071258544921875, -1.461517333984375, -1.4159088134765625, -1.37030029296875, -1.3246917724609375, -1.279083251953125, -1.2334747314453125, -1.1878662109375, -1.1422576904296875, -1.096649169921875, -1.0510406494140625, -1.00543212890625, -0.9598236083984375, -0.914215087890625, -0.8686065673828125, -0.822998046875, -0.7773895263671875, -0.731781005859375, -0.6861724853515625, -0.64056396484375, -0.5949554443359375, -0.549346923828125, -0.5037384033203125, -0.4581298828125, -0.4125213623046875, -0.366912841796875, -0.3213043212890625, -0.27569580078125, -0.2300872802734375, -0.184478759765625, -0.1388702392578125, -0.09326171875, -0.0476531982421875, -0.002044677734375, 0.0435638427734375, 0.08917236328125, 0.1347808837890625, 0.180389404296875, 0.2259979248046875, 0.2716064453125, 0.3172149658203125, 0.362823486328125, 0.4084320068359375, 0.45404052734375, 0.4996490478515625, 0.545257568359375, 0.5908660888671875, 0.636474609375, 0.6820831298828125, 0.727691650390625, 0.7733001708984375, 0.81890869140625, 0.8645172119140625, 0.910125732421875, 0.9557342529296875, 1.0013427734375, 1.0469512939453125, 1.092559814453125, 1.1381683349609375, 1.18377685546875, 1.2293853759765625, 1.274993896484375, 1.3206024169921875, 1.3662109375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 3.0, 9.0, 10.0, 15.0, 35.0, 54.0, 113.0, 219.0, 456.0, 1263.0, 6896.0, 147303.0, 3958598.0, 72162.0, 5222.0, 1177.0, 426.0, 172.0, 68.0, 33.0, 18.0, 14.0, 8.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.03515625, -5.843017578125, -5.65087890625, -5.458740234375, -5.2666015625, -5.074462890625, -4.88232421875, -4.690185546875, -4.498046875, -4.305908203125, -4.11376953125, -3.921630859375, -3.7294921875, -3.537353515625, -3.34521484375, -3.153076171875, -2.9609375, -2.768798828125, -2.57666015625, -2.384521484375, -2.1923828125, -2.000244140625, -1.80810546875, -1.615966796875, -1.423828125, -1.231689453125, -1.03955078125, -0.847412109375, -0.6552734375, -0.463134765625, -0.27099609375, -0.078857421875, 0.11328125, 0.305419921875, 0.49755859375, 0.689697265625, 0.8818359375, 1.073974609375, 1.26611328125, 1.458251953125, 1.650390625, 1.842529296875, 2.03466796875, 2.226806640625, 2.4189453125, 2.611083984375, 2.80322265625, 2.995361328125, 3.1875, 3.379638671875, 3.57177734375, 3.763916015625, 3.9560546875, 4.148193359375, 4.34033203125, 4.532470703125, 4.724609375, 4.916748046875, 5.10888671875, 5.301025390625, 5.4931640625, 5.685302734375, 5.87744140625, 6.069580078125, 6.26171875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 6.0, 11.0, 14.0, 42.0, 63.0, 127.0, 326.0, 789.0, 1298.0, 798.0, 325.0, 134.0, 70.0, 25.0, 25.0, 5.0, 10.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.5, -6.32666015625, -6.1533203125, -5.97998046875, -5.806640625, -5.63330078125, -5.4599609375, -5.28662109375, -5.11328125, -4.93994140625, -4.7666015625, -4.59326171875, -4.419921875, -4.24658203125, -4.0732421875, -3.89990234375, -3.7265625, -3.55322265625, -3.3798828125, -3.20654296875, -3.033203125, -2.85986328125, -2.6865234375, -2.51318359375, -2.33984375, -2.16650390625, -1.9931640625, -1.81982421875, -1.646484375, -1.47314453125, -1.2998046875, -1.12646484375, -0.953125, -0.77978515625, -0.6064453125, -0.43310546875, -0.259765625, -0.08642578125, 0.0869140625, 0.26025390625, 0.43359375, 0.60693359375, 0.7802734375, 0.95361328125, 1.126953125, 1.30029296875, 1.4736328125, 1.64697265625, 1.8203125, 1.99365234375, 2.1669921875, 2.34033203125, 2.513671875, 2.68701171875, 2.8603515625, 3.03369140625, 3.20703125, 3.38037109375, 3.5537109375, 3.72705078125, 3.900390625, 4.07373046875, 4.2470703125, 4.42041015625, 4.59375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 15.0, 15.0, 61.0, 252.0, 425.0, 189.0, 29.0, 9.0, 6.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.84202575683594, -80.73775482177734, -78.63348388671875, -76.52922058105469, -74.4249496459961, -72.3206787109375, -70.2164077758789, -68.11213684082031, -66.00787353515625, -63.903602600097656, -61.79933547973633, -59.695064544677734, -57.590797424316406, -55.48652648925781, -53.38225555419922, -51.277984619140625, -49.17371368408203, -47.06944274902344, -44.96517562866211, -42.860904693603516, -40.75663757324219, -38.652366638183594, -36.548095703125, -34.443824768066406, -32.33955764770508, -30.235288619995117, -28.131019592285156, -26.026748657226562, -23.9224796295166, -21.81821060180664, -19.713939666748047, -17.609670639038086, -15.505401611328125, -13.401132583618164, -11.296862602233887, -9.19259262084961, -7.088323593139648, -4.9840545654296875, -2.87978458404541, -0.7755146026611328, 1.3287544250488281, 3.4330239295959473, 5.537293434143066, 7.6415629386901855, 9.745832443237305, 11.850101470947266, 13.954371452331543, 16.05864143371582, 18.16291046142578, 20.267179489135742, 22.371448516845703, 24.475719451904297, 26.579988479614258, 28.68425750732422, 30.788528442382812, 32.892799377441406, 34.997066497802734, 37.10133743286133, 39.205604553222656, 41.30987548828125, 43.414146423339844, 45.51841354370117, 47.622684478759766, 49.726951599121094, 51.83122253417969]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 7.0, 4.0, 6.0, 5.0, 8.0, 19.0, 18.0, 28.0, 34.0, 32.0, 62.0, 68.0, 90.0, 85.0, 76.0, 79.0, 81.0, 70.0, 57.0, 53.0, 31.0, 28.0, 23.0, 16.0, 13.0, 6.0, 5.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-25.743064880371094, -25.021820068359375, -24.30057716369629, -23.57933235168457, -22.85808753967285, -22.136844635009766, -21.415599822998047, -20.694355010986328, -19.97311019897461, -19.25186538696289, -18.530622482299805, -17.809377670288086, -17.088132858276367, -16.36688995361328, -15.645645141601562, -14.924400329589844, -14.203157424926758, -13.481913566589355, -12.760668754577637, -12.039424896240234, -11.318180084228516, -10.596936225891113, -9.875692367553711, -9.154447555541992, -8.43320369720459, -7.711959362030029, -6.990715026855469, -6.269471168518066, -5.548226833343506, -4.826982498168945, -4.105738639831543, -3.3844943046569824, -2.663249969482422, -1.9420057535171509, -1.2207615375518799, -0.49951744079589844, 0.2217268943786621, 0.9429712295532227, 1.664215087890625, 2.3854594230651855, 3.106703758239746, 3.8279480934143066, 4.549192428588867, 5.2704362869262695, 5.99168062210083, 6.712924957275391, 7.434168815612793, 8.155412673950195, 8.876657485961914, 9.597901344299316, 10.319146156311035, 11.040390014648438, 11.761634826660156, 12.482878684997559, 13.204122543334961, 13.92536735534668, 14.646611213684082, 15.367855072021484, 16.089099884033203, 16.810344696044922, 17.531587600708008, 18.252832412719727, 18.974075317382812, 19.69532012939453, 20.41656494140625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 8.0, 7.0, 15.0, 17.0, 26.0, 30.0, 62.0, 87.0, 124.0, 192.0, 319.0, 511.0, 875.0, 1666.0, 3189.0, 6128.0, 12679.0, 26780.0, 58710.0, 126152.0, 230512.0, 261957.0, 166922.0, 80189.0, 37025.0, 17149.0, 8079.0, 4061.0, 2094.0, 1188.0, 711.0, 398.0, 267.0, 146.0, 87.0, 68.0, 28.0, 30.0, 21.0, 14.0, 12.0, 12.0, 4.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.6982421875, -1.6470947265625, -1.595947265625, -1.5447998046875, -1.49365234375, -1.4425048828125, -1.391357421875, -1.3402099609375, -1.2890625, -1.2379150390625, -1.186767578125, -1.1356201171875, -1.08447265625, -1.0333251953125, -0.982177734375, -0.9310302734375, -0.8798828125, -0.8287353515625, -0.777587890625, -0.7264404296875, -0.67529296875, -0.6241455078125, -0.572998046875, -0.5218505859375, -0.470703125, -0.4195556640625, -0.368408203125, -0.3172607421875, -0.26611328125, -0.2149658203125, -0.163818359375, -0.1126708984375, -0.0615234375, -0.0103759765625, 0.040771484375, 0.0919189453125, 0.14306640625, 0.1942138671875, 0.245361328125, 0.2965087890625, 0.34765625, 0.3988037109375, 0.449951171875, 0.5010986328125, 0.55224609375, 0.6033935546875, 0.654541015625, 0.7056884765625, 0.7568359375, 0.8079833984375, 0.859130859375, 0.9102783203125, 0.96142578125, 1.0125732421875, 1.063720703125, 1.1148681640625, 1.166015625, 1.2171630859375, 1.268310546875, 1.3194580078125, 1.37060546875, 1.4217529296875, 1.472900390625, 1.5240478515625, 1.5751953125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 7.0, 2.0, 7.0, 10.0, 10.0, 14.0, 13.0, 19.0, 19.0, 15.0, 26.0, 30.0, 25.0, 43.0, 51.0, 43.0, 50.0, 46.0, 49.0, 52.0, 56.0, 55.0, 49.0, 40.0, 40.0, 40.0, 37.0, 22.0, 19.0, 34.0, 23.0, 11.0, 16.0, 9.0, 12.0, 4.0, 1.0, 3.0, 6.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.70703125, -1.658599853515625, -1.61016845703125, -1.561737060546875, -1.5133056640625, -1.464874267578125, -1.41644287109375, -1.368011474609375, -1.319580078125, -1.271148681640625, -1.22271728515625, -1.174285888671875, -1.1258544921875, -1.077423095703125, -1.02899169921875, -0.980560302734375, -0.93212890625, -0.883697509765625, -0.83526611328125, -0.786834716796875, -0.7384033203125, -0.689971923828125, -0.64154052734375, -0.593109130859375, -0.544677734375, -0.496246337890625, -0.44781494140625, -0.399383544921875, -0.3509521484375, -0.302520751953125, -0.25408935546875, -0.205657958984375, -0.1572265625, -0.108795166015625, -0.06036376953125, -0.011932373046875, 0.0364990234375, 0.084930419921875, 0.13336181640625, 0.181793212890625, 0.230224609375, 0.278656005859375, 0.32708740234375, 0.375518798828125, 0.4239501953125, 0.472381591796875, 0.52081298828125, 0.569244384765625, 0.61767578125, 0.666107177734375, 0.71453857421875, 0.762969970703125, 0.8114013671875, 0.859832763671875, 0.90826416015625, 0.956695556640625, 1.005126953125, 1.053558349609375, 1.10198974609375, 1.150421142578125, 1.1988525390625, 1.247283935546875, 1.29571533203125, 1.344146728515625, 1.392578125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 6.0, 7.0, 8.0, 6.0, 13.0, 9.0, 9.0, 19.0, 30.0, 44.0, 55.0, 79.0, 131.0, 184.0, 330.0, 689.0, 1712.0, 5857.0, 26382.0, 140861.0, 628764.0, 196066.0, 35622.0, 7712.0, 2115.0, 800.0, 350.0, 218.0, 132.0, 92.0, 56.0, 34.0, 38.0, 25.0, 19.0, 11.0, 12.0, 10.0, 8.0, 6.0, 4.0, 5.0, 2.0, 5.0, 1.0, 2.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-3.513671875, -3.4058837890625, -3.298095703125, -3.1903076171875, -3.08251953125, -2.9747314453125, -2.866943359375, -2.7591552734375, -2.6513671875, -2.5435791015625, -2.435791015625, -2.3280029296875, -2.22021484375, -2.1124267578125, -2.004638671875, -1.8968505859375, -1.7890625, -1.6812744140625, -1.573486328125, -1.4656982421875, -1.35791015625, -1.2501220703125, -1.142333984375, -1.0345458984375, -0.9267578125, -0.8189697265625, -0.711181640625, -0.6033935546875, -0.49560546875, -0.3878173828125, -0.280029296875, -0.1722412109375, -0.064453125, 0.0433349609375, 0.151123046875, 0.2589111328125, 0.36669921875, 0.4744873046875, 0.582275390625, 0.6900634765625, 0.7978515625, 0.9056396484375, 1.013427734375, 1.1212158203125, 1.22900390625, 1.3367919921875, 1.444580078125, 1.5523681640625, 1.66015625, 1.7679443359375, 1.875732421875, 1.9835205078125, 2.09130859375, 2.1990966796875, 2.306884765625, 2.4146728515625, 2.5224609375, 2.6302490234375, 2.738037109375, 2.8458251953125, 2.95361328125, 3.0614013671875, 3.169189453125, 3.2769775390625, 3.384765625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 2.0, 0.0, 11.0, 9.0, 6.0, 3.0, 12.0, 12.0, 16.0, 18.0, 22.0, 20.0, 23.0, 28.0, 35.0, 28.0, 29.0, 46.0, 26.0, 36.0, 36.0, 38.0, 41.0, 42.0, 38.0, 40.0, 39.0, 35.0, 40.0, 44.0, 24.0, 26.0, 26.0, 20.0, 20.0, 13.0, 14.0, 18.0, 13.0, 13.0, 13.0, 2.0, 4.0, 8.0, 3.0, 0.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-3.9296875, -3.80230712890625, -3.6749267578125, -3.54754638671875, -3.420166015625, -3.29278564453125, -3.1654052734375, -3.03802490234375, -2.91064453125, -2.78326416015625, -2.6558837890625, -2.52850341796875, -2.401123046875, -2.27374267578125, -2.1463623046875, -2.01898193359375, -1.8916015625, -1.76422119140625, -1.6368408203125, -1.50946044921875, -1.382080078125, -1.25469970703125, -1.1273193359375, -0.99993896484375, -0.87255859375, -0.74517822265625, -0.6177978515625, -0.49041748046875, -0.363037109375, -0.23565673828125, -0.1082763671875, 0.01910400390625, 0.146484375, 0.27386474609375, 0.4012451171875, 0.52862548828125, 0.656005859375, 0.78338623046875, 0.9107666015625, 1.03814697265625, 1.16552734375, 1.29290771484375, 1.4202880859375, 1.54766845703125, 1.675048828125, 1.80242919921875, 1.9298095703125, 2.05718994140625, 2.1845703125, 2.31195068359375, 2.4393310546875, 2.56671142578125, 2.694091796875, 2.82147216796875, 2.9488525390625, 3.07623291015625, 3.20361328125, 3.33099365234375, 3.4583740234375, 3.58575439453125, 3.713134765625, 3.84051513671875, 3.9678955078125, 4.09527587890625, 4.22265625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 2.0, 2.0, 9.0, 8.0, 9.0, 13.0, 13.0, 17.0, 25.0, 48.0, 50.0, 86.0, 124.0, 253.0, 428.0, 874.0, 1648.0, 4087.0, 10767.0, 31330.0, 101467.0, 463225.0, 294158.0, 93546.0, 28928.0, 9995.0, 3867.0, 1703.0, 822.0, 419.0, 207.0, 137.0, 90.0, 56.0, 45.0, 24.0, 17.0, 10.0, 12.0, 12.0, 9.0, 3.0, 2.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6923828125, -0.6707229614257812, -0.6490631103515625, -0.6274032592773438, -0.605743408203125, -0.5840835571289062, -0.5624237060546875, -0.5407638549804688, -0.51910400390625, -0.49744415283203125, -0.4757843017578125, -0.45412445068359375, -0.432464599609375, -0.41080474853515625, -0.3891448974609375, -0.36748504638671875, -0.3458251953125, -0.32416534423828125, -0.3025054931640625, -0.28084564208984375, -0.259185791015625, -0.23752593994140625, -0.2158660888671875, -0.19420623779296875, -0.17254638671875, -0.15088653564453125, -0.1292266845703125, -0.10756683349609375, -0.085906982421875, -0.06424713134765625, -0.0425872802734375, -0.02092742919921875, 0.000732421875, 0.02239227294921875, 0.0440521240234375, 0.06571197509765625, 0.087371826171875, 0.10903167724609375, 0.1306915283203125, 0.15235137939453125, 0.17401123046875, 0.19567108154296875, 0.2173309326171875, 0.23899078369140625, 0.260650634765625, 0.28231048583984375, 0.3039703369140625, 0.32563018798828125, 0.3472900390625, 0.36894989013671875, 0.3906097412109375, 0.41226959228515625, 0.433929443359375, 0.45558929443359375, 0.4772491455078125, 0.49890899658203125, 0.52056884765625, 0.5422286987304688, 0.5638885498046875, 0.5855484008789062, 0.607208251953125, 0.6288681030273438, 0.6505279541015625, 0.6721878051757812, 0.69384765625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 2.0, 5.0, 4.0, 2.0, 2.0, 6.0, 4.0, 8.0, 10.0, 14.0, 14.0, 23.0, 35.0, 45.0, 37.0, 49.0, 54.0, 84.0, 66.0, 85.0, 73.0, 73.0, 72.0, 53.0, 43.0, 26.0, 19.0, 22.0, 15.0, 11.0, 11.0, 8.0, 4.0, 6.0, 4.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0002655982971191406, -0.00025773048400878906, -0.0002498626708984375, -0.00024199485778808594, -0.00023412704467773438, -0.0002262592315673828, -0.00021839141845703125, -0.0002105236053466797, -0.00020265579223632812, -0.00019478797912597656, -0.000186920166015625, -0.00017905235290527344, -0.00017118453979492188, -0.0001633167266845703, -0.00015544891357421875, -0.0001475811004638672, -0.00013971328735351562, -0.00013184547424316406, -0.0001239776611328125, -0.00011610984802246094, -0.00010824203491210938, -0.00010037422180175781, -9.250640869140625e-05, -8.463859558105469e-05, -7.677078247070312e-05, -6.890296936035156e-05, -6.103515625e-05, -5.316734313964844e-05, -4.5299530029296875e-05, -3.743171691894531e-05, -2.956390380859375e-05, -2.1696090698242188e-05, -1.3828277587890625e-05, -5.9604644775390625e-06, 1.9073486328125e-06, 9.775161743164062e-06, 1.7642974853515625e-05, 2.5510787963867188e-05, 3.337860107421875e-05, 4.124641418457031e-05, 4.9114227294921875e-05, 5.698204040527344e-05, 6.4849853515625e-05, 7.271766662597656e-05, 8.058547973632812e-05, 8.845329284667969e-05, 9.632110595703125e-05, 0.00010418891906738281, 0.00011205673217773438, 0.00011992454528808594, 0.0001277923583984375, 0.00013566017150878906, 0.00014352798461914062, 0.0001513957977294922, 0.00015926361083984375, 0.0001671314239501953, 0.00017499923706054688, 0.00018286705017089844, 0.00019073486328125, 0.00019860267639160156, 0.00020647048950195312, 0.0002143383026123047, 0.00022220611572265625, 0.0002300739288330078, 0.00023794174194335938]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 1.0, 8.0, 2.0, 10.0, 18.0, 30.0, 40.0, 69.0, 172.0, 398.0, 1183.0, 5012.0, 38422.0, 575039.0, 387274.0, 34284.0, 4766.0, 1117.0, 359.0, 175.0, 74.0, 38.0, 25.0, 15.0, 11.0, 6.0, 4.0, 7.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7734375, -0.727874755859375, -0.68231201171875, -0.636749267578125, -0.5911865234375, -0.545623779296875, -0.50006103515625, -0.454498291015625, -0.408935546875, -0.363372802734375, -0.31781005859375, -0.272247314453125, -0.2266845703125, -0.181121826171875, -0.13555908203125, -0.089996337890625, -0.04443359375, 0.001129150390625, 0.04669189453125, 0.092254638671875, 0.1378173828125, 0.183380126953125, 0.22894287109375, 0.274505615234375, 0.320068359375, 0.365631103515625, 0.41119384765625, 0.456756591796875, 0.5023193359375, 0.547882080078125, 0.59344482421875, 0.639007568359375, 0.6845703125, 0.730133056640625, 0.77569580078125, 0.821258544921875, 0.8668212890625, 0.912384033203125, 0.95794677734375, 1.003509521484375, 1.049072265625, 1.094635009765625, 1.14019775390625, 1.185760498046875, 1.2313232421875, 1.276885986328125, 1.32244873046875, 1.368011474609375, 1.41357421875, 1.459136962890625, 1.50469970703125, 1.550262451171875, 1.5958251953125, 1.641387939453125, 1.68695068359375, 1.732513427734375, 1.778076171875, 1.823638916015625, 1.86920166015625, 1.914764404296875, 1.9603271484375, 2.005889892578125, 2.05145263671875, 2.097015380859375, 2.142578125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 8.0, 3.0, 3.0, 5.0, 3.0, 6.0, 8.0, 15.0, 17.0, 11.0, 20.0, 28.0, 32.0, 45.0, 55.0, 49.0, 75.0, 77.0, 74.0, 78.0, 76.0, 59.0, 57.0, 54.0, 36.0, 27.0, 17.0, 18.0, 13.0, 8.0, 6.0, 6.0, 5.0, 3.0, 2.0, 2.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7255859375, -0.696075439453125, -0.66656494140625, -0.637054443359375, -0.6075439453125, -0.578033447265625, -0.54852294921875, -0.519012451171875, -0.489501953125, -0.459991455078125, -0.43048095703125, -0.400970458984375, -0.3714599609375, -0.341949462890625, -0.31243896484375, -0.282928466796875, -0.25341796875, -0.223907470703125, -0.19439697265625, -0.164886474609375, -0.1353759765625, -0.105865478515625, -0.07635498046875, -0.046844482421875, -0.017333984375, 0.012176513671875, 0.04168701171875, 0.071197509765625, 0.1007080078125, 0.130218505859375, 0.15972900390625, 0.189239501953125, 0.21875, 0.248260498046875, 0.27777099609375, 0.307281494140625, 0.3367919921875, 0.366302490234375, 0.39581298828125, 0.425323486328125, 0.454833984375, 0.484344482421875, 0.51385498046875, 0.543365478515625, 0.5728759765625, 0.602386474609375, 0.63189697265625, 0.661407470703125, 0.69091796875, 0.720428466796875, 0.74993896484375, 0.779449462890625, 0.8089599609375, 0.838470458984375, 0.86798095703125, 0.897491455078125, 0.927001953125, 0.956512451171875, 0.98602294921875, 1.015533447265625, 1.0450439453125, 1.074554443359375, 1.10406494140625, 1.133575439453125, 1.1630859375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 1.0, 3.0, 9.0, 12.0, 17.0, 30.0, 51.0, 83.0, 126.0, 233.0, 168.0, 103.0, 71.0, 40.0, 23.0, 14.0, 6.0, 6.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.356487274169922, -30.635723114013672, -29.914958953857422, -29.194194793701172, -28.473432540893555, -27.752668380737305, -27.031904220581055, -26.311140060424805, -25.590377807617188, -24.869613647460938, -24.148849487304688, -23.428085327148438, -22.70732307434082, -21.98655891418457, -21.26579475402832, -20.54503059387207, -19.82426643371582, -19.10350227355957, -18.38273811340332, -17.661975860595703, -16.941211700439453, -16.220447540283203, -15.499683380126953, -14.778919219970703, -14.05815601348877, -13.33739185333252, -12.616628646850586, -11.895864486694336, -11.175100326538086, -10.454337120056152, -9.733572959899902, -9.012809753417969, -8.292047500610352, -7.57128381729126, -6.850520133972168, -6.129755973815918, -5.408992290496826, -4.688228607177734, -3.9674644470214844, -3.2467007637023926, -2.525937080383301, -1.8051732778549194, -1.084409475326538, -0.3636455535888672, 0.3571181297302246, 1.0778818130493164, 1.7986459732055664, 2.519409656524658, 3.24017333984375, 3.960937023162842, 4.681700706481934, 5.402464866638184, 6.123228549957275, 6.843992233276367, 7.564756393432617, 8.285520553588867, 9.0062837600708, 9.72704792022705, 10.447811126708984, 11.168575286865234, 11.889339447021484, 12.610102653503418, 13.330866813659668, 14.051630020141602, 14.772394180297852]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 6.0, 5.0, 6.0, 4.0, 5.0, 14.0, 5.0, 8.0, 11.0, 16.0, 15.0, 13.0, 24.0, 21.0, 30.0, 23.0, 26.0, 35.0, 36.0, 34.0, 50.0, 60.0, 66.0, 69.0, 71.0, 49.0, 33.0, 40.0, 32.0, 23.0, 35.0, 17.0, 16.0, 16.0, 12.0, 18.0, 15.0, 6.0, 8.0, 11.0, 7.0, 7.0, 6.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.443256378173828, -15.896008491516113, -15.348760604858398, -14.801513671875, -14.254265785217285, -13.70701789855957, -13.159770965576172, -12.612523078918457, -12.065275192260742, -11.518027305603027, -10.970779418945312, -10.423532485961914, -9.8762845993042, -9.329036712646484, -8.781789779663086, -8.234541893005371, -7.687294006347656, -7.140046119689941, -6.592798709869385, -6.045551300048828, -5.498303413391113, -4.951055526733398, -4.403808116912842, -3.856560468673706, -3.3093128204345703, -2.7620651721954346, -2.214817523956299, -1.667569875717163, -1.1203222274780273, -0.5730745792388916, -0.02582693099975586, 0.5214207172393799, 1.0686702728271484, 1.6159179210662842, 2.16316556930542, 2.7104132175445557, 3.2576608657836914, 3.804908514022827, 4.352156162261963, 4.8994035720825195, 5.446651458740234, 5.993899345397949, 6.541146755218506, 7.0883941650390625, 7.635642051696777, 8.182889938354492, 8.73013687133789, 9.277384757995605, 9.82463264465332, 10.371880531311035, 10.91912841796875, 11.466375350952148, 12.013623237609863, 12.560871124267578, 13.108118057250977, 13.655365943908691, 14.202613830566406, 14.749861717224121, 15.297109603881836, 15.844356536865234, 16.391605377197266, 16.938852310180664, 17.486099243164062, 18.033348083496094, 18.580595016479492]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 9.0, 1.0, 6.0, 10.0, 9.0, 16.0, 16.0, 28.0, 32.0, 33.0, 52.0, 59.0, 89.0, 158.0, 317.0, 750.0, 2018.0, 6925.0, 45217.0, 714912.0, 2973162.0, 409687.0, 31778.0, 5809.0, 1724.0, 653.0, 317.0, 163.0, 96.0, 77.0, 37.0, 30.0, 30.0, 14.0, 12.0, 9.0, 5.0, 6.0, 6.0, 9.0, 6.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.681640625, -2.60369873046875, -2.5257568359375, -2.44781494140625, -2.369873046875, -2.29193115234375, -2.2139892578125, -2.13604736328125, -2.05810546875, -1.98016357421875, -1.9022216796875, -1.82427978515625, -1.746337890625, -1.66839599609375, -1.5904541015625, -1.51251220703125, -1.4345703125, -1.35662841796875, -1.2786865234375, -1.20074462890625, -1.122802734375, -1.04486083984375, -0.9669189453125, -0.88897705078125, -0.81103515625, -0.73309326171875, -0.6551513671875, -0.57720947265625, -0.499267578125, -0.42132568359375, -0.3433837890625, -0.26544189453125, -0.1875, -0.10955810546875, -0.0316162109375, 0.04632568359375, 0.124267578125, 0.20220947265625, 0.2801513671875, 0.35809326171875, 0.43603515625, 0.51397705078125, 0.5919189453125, 0.66986083984375, 0.747802734375, 0.82574462890625, 0.9036865234375, 0.98162841796875, 1.0595703125, 1.13751220703125, 1.2154541015625, 1.29339599609375, 1.371337890625, 1.44927978515625, 1.5272216796875, 1.60516357421875, 1.68310546875, 1.76104736328125, 1.8389892578125, 1.91693115234375, 1.994873046875, 2.07281494140625, 2.1507568359375, 2.22869873046875, 2.306640625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 3.0, 8.0, 1.0, 19.0, 8.0, 10.0, 25.0, 30.0, 17.0, 35.0, 33.0, 41.0, 42.0, 53.0, 60.0, 44.0, 58.0, 51.0, 52.0, 50.0, 40.0, 44.0, 36.0, 36.0, 41.0, 35.0, 27.0, 37.0, 15.0, 7.0, 10.0, 8.0, 8.0, 7.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6328125, -1.58514404296875, -1.5374755859375, -1.48980712890625, -1.442138671875, -1.39447021484375, -1.3468017578125, -1.29913330078125, -1.25146484375, -1.20379638671875, -1.1561279296875, -1.10845947265625, -1.060791015625, -1.01312255859375, -0.9654541015625, -0.91778564453125, -0.8701171875, -0.82244873046875, -0.7747802734375, -0.72711181640625, -0.679443359375, -0.63177490234375, -0.5841064453125, -0.53643798828125, -0.48876953125, -0.44110107421875, -0.3934326171875, -0.34576416015625, -0.298095703125, -0.25042724609375, -0.2027587890625, -0.15509033203125, -0.107421875, -0.05975341796875, -0.0120849609375, 0.03558349609375, 0.083251953125, 0.13092041015625, 0.1785888671875, 0.22625732421875, 0.27392578125, 0.32159423828125, 0.3692626953125, 0.41693115234375, 0.464599609375, 0.51226806640625, 0.5599365234375, 0.60760498046875, 0.6552734375, 0.70294189453125, 0.7506103515625, 0.79827880859375, 0.845947265625, 0.89361572265625, 0.9412841796875, 0.98895263671875, 1.03662109375, 1.08428955078125, 1.1319580078125, 1.17962646484375, 1.227294921875, 1.27496337890625, 1.3226318359375, 1.37030029296875, 1.41796875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 7.0, 6.0, 9.0, 7.0, 13.0, 22.0, 29.0, 42.0, 55.0, 130.0, 184.0, 410.0, 987.0, 2891.0, 12710.0, 123948.0, 3519040.0, 500935.0, 25777.0, 4636.0, 1297.0, 550.0, 256.0, 141.0, 66.0, 39.0, 23.0, 20.0, 13.0, 11.0, 9.0, 3.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.107421875, -2.995208740234375, -2.88299560546875, -2.770782470703125, -2.6585693359375, -2.546356201171875, -2.43414306640625, -2.321929931640625, -2.209716796875, -2.097503662109375, -1.98529052734375, -1.873077392578125, -1.7608642578125, -1.648651123046875, -1.53643798828125, -1.424224853515625, -1.31201171875, -1.199798583984375, -1.08758544921875, -0.975372314453125, -0.8631591796875, -0.750946044921875, -0.63873291015625, -0.526519775390625, -0.414306640625, -0.302093505859375, -0.18988037109375, -0.077667236328125, 0.0345458984375, 0.146759033203125, 0.25897216796875, 0.371185302734375, 0.4833984375, 0.595611572265625, 0.70782470703125, 0.820037841796875, 0.9322509765625, 1.044464111328125, 1.15667724609375, 1.268890380859375, 1.381103515625, 1.493316650390625, 1.60552978515625, 1.717742919921875, 1.8299560546875, 1.942169189453125, 2.05438232421875, 2.166595458984375, 2.27880859375, 2.391021728515625, 2.50323486328125, 2.615447998046875, 2.7276611328125, 2.839874267578125, 2.95208740234375, 3.064300537109375, 3.176513671875, 3.288726806640625, 3.40093994140625, 3.513153076171875, 3.6253662109375, 3.737579345703125, 3.84979248046875, 3.962005615234375, 4.07421875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 6.0, 5.0, 11.0, 5.0, 22.0, 26.0, 36.0, 65.0, 98.0, 200.0, 411.0, 708.0, 858.0, 650.0, 432.0, 241.0, 114.0, 80.0, 35.0, 22.0, 22.0, 15.0, 2.0, 5.0, 2.0, 0.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.375, -4.261566162109375, -4.14813232421875, -4.034698486328125, -3.9212646484375, -3.807830810546875, -3.69439697265625, -3.580963134765625, -3.467529296875, -3.354095458984375, -3.24066162109375, -3.127227783203125, -3.0137939453125, -2.900360107421875, -2.78692626953125, -2.673492431640625, -2.56005859375, -2.446624755859375, -2.33319091796875, -2.219757080078125, -2.1063232421875, -1.992889404296875, -1.87945556640625, -1.766021728515625, -1.652587890625, -1.539154052734375, -1.42572021484375, -1.312286376953125, -1.1988525390625, -1.085418701171875, -0.97198486328125, -0.858551025390625, -0.7451171875, -0.631683349609375, -0.51824951171875, -0.404815673828125, -0.2913818359375, -0.177947998046875, -0.06451416015625, 0.048919677734375, 0.162353515625, 0.275787353515625, 0.38922119140625, 0.502655029296875, 0.6160888671875, 0.729522705078125, 0.84295654296875, 0.956390380859375, 1.06982421875, 1.183258056640625, 1.29669189453125, 1.410125732421875, 1.5235595703125, 1.636993408203125, 1.75042724609375, 1.863861083984375, 1.977294921875, 2.090728759765625, 2.20416259765625, 2.317596435546875, 2.4310302734375, 2.544464111328125, 2.65789794921875, 2.771331787109375, 2.884765625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 8.0, 10.0, 21.0, 118.0, 270.0, 363.0, 158.0, 42.0, 11.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.22658157348633, -52.63948440551758, -51.05238723754883, -49.465293884277344, -47.878196716308594, -46.291099548339844, -44.704002380371094, -43.116905212402344, -41.529808044433594, -39.942710876464844, -38.355613708496094, -36.768516540527344, -35.18142318725586, -33.59432601928711, -32.00722885131836, -30.42013168334961, -28.833036422729492, -27.245939254760742, -25.658843994140625, -24.071746826171875, -22.484649658203125, -20.897552490234375, -19.310457229614258, -17.723360061645508, -16.13626480102539, -14.549168586730957, -12.962071418762207, -11.374975204467773, -9.787878036499023, -8.20078182220459, -6.613685607910156, -5.026588439941406, -3.4394912719726562, -1.852394700050354, -0.26529812812805176, 1.321798324584961, 2.9088950157165527, 4.4959917068481445, 6.083087921142578, 7.670185089111328, 9.257281303405762, 10.844377517700195, 12.431474685668945, 14.018570899963379, 15.605667114257812, 17.192764282226562, 18.779861450195312, 20.366958618164062, 21.95405387878418, 23.54115104675293, 25.128246307373047, 26.715343475341797, 28.302440643310547, 29.889537811279297, 31.476633071899414, 33.06372833251953, 34.65082550048828, 36.23792266845703, 37.82501983642578, 39.41211700439453, 40.999210357666016, 42.586307525634766, 44.173404693603516, 45.760501861572266, 47.347599029541016]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 6.0, 11.0, 6.0, 19.0, 19.0, 29.0, 24.0, 30.0, 28.0, 32.0, 33.0, 28.0, 52.0, 37.0, 52.0, 63.0, 51.0, 44.0, 57.0, 39.0, 45.0, 43.0, 30.0, 28.0, 33.0, 21.0, 29.0, 14.0, 18.0, 15.0, 15.0, 12.0, 7.0, 5.0, 5.0, 8.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-12.642155647277832, -12.2734956741333, -11.904836654663086, -11.536176681518555, -11.167516708374023, -10.798857688903809, -10.430197715759277, -10.061538696289062, -9.692878723144531, -9.32421875, -8.955559730529785, -8.586899757385254, -8.218240737915039, -7.849580764770508, -7.480920791625977, -7.1122612953186035, -6.7436017990112305, -6.374942302703857, -6.006282806396484, -5.637622833251953, -5.26896333694458, -4.900303840637207, -4.531643867492676, -4.162984371185303, -3.7943248748779297, -3.4256653785705566, -3.0570056438446045, -2.6883459091186523, -2.3196864128112793, -1.9510267972946167, -1.582367181777954, -1.213707447052002, -0.8450489044189453, -0.4763892889022827, -0.10772967338562012, 0.2609299421310425, 0.6295895576477051, 0.9982491731643677, 1.3669087886810303, 1.7355685234069824, 2.1042280197143555, 2.4728875160217285, 2.8415472507476807, 3.210206985473633, 3.578866481781006, 3.947525978088379, 4.31618595123291, 4.684845447540283, 5.053504943847656, 5.422164440155029, 5.790823936462402, 6.159483909606934, 6.528143405914307, 6.89680290222168, 7.265462875366211, 7.634122371673584, 8.002781867980957, 8.371441841125488, 8.740100860595703, 9.108760833740234, 9.477420806884766, 9.84607982635498, 10.214739799499512, 10.583398818969727, 10.952058792114258]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 5.0, 4.0, 2.0, 5.0, 16.0, 27.0, 21.0, 40.0, 61.0, 102.0, 172.0, 318.0, 538.0, 934.0, 1779.0, 3405.0, 6657.0, 13645.0, 27917.0, 59099.0, 125357.0, 236469.0, 267479.0, 158256.0, 75797.0, 35851.0, 17173.0, 8327.0, 4249.0, 2138.0, 1141.0, 635.0, 351.0, 232.0, 130.0, 85.0, 59.0, 31.0, 17.0, 9.0, 14.0, 7.0, 0.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0], "bins": [-1.7783203125, -1.73046875, -1.6826171875, -1.634765625, -1.5869140625, -1.5390625, -1.4912109375, -1.443359375, -1.3955078125, -1.34765625, -1.2998046875, -1.251953125, -1.2041015625, -1.15625, -1.1083984375, -1.060546875, -1.0126953125, -0.96484375, -0.9169921875, -0.869140625, -0.8212890625, -0.7734375, -0.7255859375, -0.677734375, -0.6298828125, -0.58203125, -0.5341796875, -0.486328125, -0.4384765625, -0.390625, -0.3427734375, -0.294921875, -0.2470703125, -0.19921875, -0.1513671875, -0.103515625, -0.0556640625, -0.0078125, 0.0400390625, 0.087890625, 0.1357421875, 0.18359375, 0.2314453125, 0.279296875, 0.3271484375, 0.375, 0.4228515625, 0.470703125, 0.5185546875, 0.56640625, 0.6142578125, 0.662109375, 0.7099609375, 0.7578125, 0.8056640625, 0.853515625, 0.9013671875, 0.94921875, 0.9970703125, 1.044921875, 1.0927734375, 1.140625, 1.1884765625, 1.236328125, 1.2841796875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 4.0, 5.0, 6.0, 7.0, 14.0, 14.0, 23.0, 22.0, 23.0, 17.0, 33.0, 34.0, 55.0, 34.0, 42.0, 44.0, 37.0, 51.0, 48.0, 44.0, 47.0, 53.0, 35.0, 33.0, 42.0, 42.0, 35.0, 21.0, 30.0, 26.0, 11.0, 13.0, 5.0, 13.0, 14.0, 4.0, 6.0, 3.0, 6.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3681640625, -1.3248748779296875, -1.281585693359375, -1.2382965087890625, -1.19500732421875, -1.1517181396484375, -1.108428955078125, -1.0651397705078125, -1.0218505859375, -0.9785614013671875, -0.935272216796875, -0.8919830322265625, -0.84869384765625, -0.8054046630859375, -0.762115478515625, -0.7188262939453125, -0.675537109375, -0.6322479248046875, -0.588958740234375, -0.5456695556640625, -0.50238037109375, -0.4590911865234375, -0.415802001953125, -0.3725128173828125, -0.3292236328125, -0.2859344482421875, -0.242645263671875, -0.1993560791015625, -0.15606689453125, -0.1127777099609375, -0.069488525390625, -0.0261993408203125, 0.01708984375, 0.0603790283203125, 0.103668212890625, 0.1469573974609375, 0.19024658203125, 0.2335357666015625, 0.276824951171875, 0.3201141357421875, 0.3634033203125, 0.4066925048828125, 0.449981689453125, 0.4932708740234375, 0.53656005859375, 0.5798492431640625, 0.623138427734375, 0.6664276123046875, 0.709716796875, 0.7530059814453125, 0.796295166015625, 0.8395843505859375, 0.88287353515625, 0.9261627197265625, 0.969451904296875, 1.0127410888671875, 1.0560302734375, 1.0993194580078125, 1.142608642578125, 1.1858978271484375, 1.22918701171875, 1.2724761962890625, 1.315765380859375, 1.3590545654296875, 1.40234375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 5.0, 7.0, 6.0, 6.0, 11.0, 11.0, 9.0, 14.0, 22.0, 31.0, 38.0, 46.0, 79.0, 95.0, 148.0, 211.0, 301.0, 424.0, 706.0, 1188.0, 2876.0, 9046.0, 40272.0, 218525.0, 644569.0, 100555.0, 19657.0, 5121.0, 1940.0, 897.0, 520.0, 333.0, 227.0, 171.0, 112.0, 85.0, 65.0, 54.0, 46.0, 34.0, 21.0, 20.0, 10.0, 17.0, 6.0, 8.0, 3.0, 2.0, 2.0, 2.0, 4.0, 2.0, 1.0], "bins": [-3.513671875, -3.4140625, -3.314453125, -3.21484375, -3.115234375, -3.015625, -2.916015625, -2.81640625, -2.716796875, -2.6171875, -2.517578125, -2.41796875, -2.318359375, -2.21875, -2.119140625, -2.01953125, -1.919921875, -1.8203125, -1.720703125, -1.62109375, -1.521484375, -1.421875, -1.322265625, -1.22265625, -1.123046875, -1.0234375, -0.923828125, -0.82421875, -0.724609375, -0.625, -0.525390625, -0.42578125, -0.326171875, -0.2265625, -0.126953125, -0.02734375, 0.072265625, 0.171875, 0.271484375, 0.37109375, 0.470703125, 0.5703125, 0.669921875, 0.76953125, 0.869140625, 0.96875, 1.068359375, 1.16796875, 1.267578125, 1.3671875, 1.466796875, 1.56640625, 1.666015625, 1.765625, 1.865234375, 1.96484375, 2.064453125, 2.1640625, 2.263671875, 2.36328125, 2.462890625, 2.5625, 2.662109375, 2.76171875, 2.861328125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 9.0, 4.0, 10.0, 7.0, 9.0, 16.0, 16.0, 24.0, 18.0, 24.0, 29.0, 29.0, 35.0, 44.0, 51.0, 48.0, 57.0, 58.0, 43.0, 59.0, 45.0, 39.0, 51.0, 39.0, 33.0, 27.0, 35.0, 28.0, 27.0, 15.0, 16.0, 16.0, 5.0, 5.0, 6.0, 6.0, 7.0, 3.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-5.1640625, -5.01556396484375, -4.8670654296875, -4.71856689453125, -4.570068359375, -4.42156982421875, -4.2730712890625, -4.12457275390625, -3.97607421875, -3.82757568359375, -3.6790771484375, -3.53057861328125, -3.382080078125, -3.23358154296875, -3.0850830078125, -2.93658447265625, -2.7880859375, -2.63958740234375, -2.4910888671875, -2.34259033203125, -2.194091796875, -2.04559326171875, -1.8970947265625, -1.74859619140625, -1.60009765625, -1.45159912109375, -1.3031005859375, -1.15460205078125, -1.006103515625, -0.85760498046875, -0.7091064453125, -0.56060791015625, -0.412109375, -0.26361083984375, -0.1151123046875, 0.03338623046875, 0.181884765625, 0.33038330078125, 0.4788818359375, 0.62738037109375, 0.77587890625, 0.92437744140625, 1.0728759765625, 1.22137451171875, 1.369873046875, 1.51837158203125, 1.6668701171875, 1.81536865234375, 1.9638671875, 2.11236572265625, 2.2608642578125, 2.40936279296875, 2.557861328125, 2.70635986328125, 2.8548583984375, 3.00335693359375, 3.15185546875, 3.30035400390625, 3.4488525390625, 3.59735107421875, 3.745849609375, 3.89434814453125, 4.0428466796875, 4.19134521484375, 4.33984375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 10.0, 12.0, 6.0, 18.0, 18.0, 23.0, 34.0, 57.0, 75.0, 132.0, 183.0, 309.0, 547.0, 901.0, 1948.0, 4608.0, 11701.0, 35551.0, 126322.0, 619562.0, 174697.0, 46275.0, 15146.0, 5601.0, 2248.0, 1046.0, 590.0, 324.0, 188.0, 135.0, 80.0, 58.0, 43.0, 30.0, 20.0, 13.0, 11.0, 9.0, 10.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73828125, -0.7149276733398438, -0.6915740966796875, -0.6682205200195312, -0.644866943359375, -0.6215133666992188, -0.5981597900390625, -0.5748062133789062, -0.55145263671875, -0.5280990600585938, -0.5047454833984375, -0.48139190673828125, -0.458038330078125, -0.43468475341796875, -0.4113311767578125, -0.38797760009765625, -0.3646240234375, -0.34127044677734375, -0.3179168701171875, -0.29456329345703125, -0.271209716796875, -0.24785614013671875, -0.2245025634765625, -0.20114898681640625, -0.17779541015625, -0.15444183349609375, -0.1310882568359375, -0.10773468017578125, -0.084381103515625, -0.06102752685546875, -0.0376739501953125, -0.01432037353515625, 0.009033203125, 0.03238677978515625, 0.0557403564453125, 0.07909393310546875, 0.102447509765625, 0.12580108642578125, 0.1491546630859375, 0.17250823974609375, 0.19586181640625, 0.21921539306640625, 0.2425689697265625, 0.26592254638671875, 0.289276123046875, 0.31262969970703125, 0.3359832763671875, 0.35933685302734375, 0.3826904296875, 0.40604400634765625, 0.4293975830078125, 0.45275115966796875, 0.476104736328125, 0.49945831298828125, 0.5228118896484375, 0.5461654663085938, 0.56951904296875, 0.5928726196289062, 0.6162261962890625, 0.6395797729492188, 0.662933349609375, 0.6862869262695312, 0.7096405029296875, 0.7329940795898438, 0.75634765625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 6.0, 2.0, 7.0, 5.0, 13.0, 4.0, 11.0, 12.0, 22.0, 24.0, 26.0, 41.0, 33.0, 46.0, 60.0, 88.0, 101.0, 91.0, 91.0, 59.0, 47.0, 40.0, 25.0, 25.0, 24.0, 20.0, 13.0, 16.0, 12.0, 6.0, 11.0, 6.0, 6.0, 3.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.00028967857360839844, -0.00028168410062789917, -0.0002736896276473999, -0.00026569515466690063, -0.00025770068168640137, -0.0002497062087059021, -0.00024171173572540283, -0.00023371726274490356, -0.0002257227897644043, -0.00021772831678390503, -0.00020973384380340576, -0.0002017393708229065, -0.00019374489784240723, -0.00018575042486190796, -0.0001777559518814087, -0.00016976147890090942, -0.00016176700592041016, -0.0001537725329399109, -0.00014577805995941162, -0.00013778358697891235, -0.00012978911399841309, -0.00012179464101791382, -0.00011380016803741455, -0.00010580569505691528, -9.781122207641602e-05, -8.981674909591675e-05, -8.182227611541748e-05, -7.382780313491821e-05, -6.583333015441895e-05, -5.783885717391968e-05, -4.984438419342041e-05, -4.184991121292114e-05, -3.3855438232421875e-05, -2.5860965251922607e-05, -1.786649227142334e-05, -9.872019290924072e-06, -1.8775463104248047e-06, 6.116926670074463e-06, 1.411139965057373e-05, 2.2105872631072998e-05, 3.0100345611572266e-05, 3.809481859207153e-05, 4.60892915725708e-05, 5.408376455307007e-05, 6.207823753356934e-05, 7.00727105140686e-05, 7.806718349456787e-05, 8.606165647506714e-05, 9.40561294555664e-05, 0.00010205060243606567, 0.00011004507541656494, 0.00011803954839706421, 0.00012603402137756348, 0.00013402849435806274, 0.000142022967338562, 0.00015001744031906128, 0.00015801191329956055, 0.00016600638628005981, 0.00017400085926055908, 0.00018199533224105835, 0.00018998980522155762, 0.00019798427820205688, 0.00020597875118255615, 0.00021397322416305542, 0.0002219676971435547]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 4.0, 2.0, 10.0, 6.0, 13.0, 21.0, 27.0, 47.0, 89.0, 158.0, 265.0, 519.0, 1308.0, 3567.0, 13481.0, 77822.0, 706738.0, 205097.0, 29320.0, 6402.0, 2008.0, 821.0, 342.0, 192.0, 118.0, 68.0, 42.0, 23.0, 16.0, 8.0, 6.0, 4.0, 3.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.9970703125, -0.962371826171875, -0.92767333984375, -0.892974853515625, -0.8582763671875, -0.823577880859375, -0.78887939453125, -0.754180908203125, -0.719482421875, -0.684783935546875, -0.65008544921875, -0.615386962890625, -0.5806884765625, -0.545989990234375, -0.51129150390625, -0.476593017578125, -0.44189453125, -0.407196044921875, -0.37249755859375, -0.337799072265625, -0.3031005859375, -0.268402099609375, -0.23370361328125, -0.199005126953125, -0.164306640625, -0.129608154296875, -0.09490966796875, -0.060211181640625, -0.0255126953125, 0.009185791015625, 0.04388427734375, 0.078582763671875, 0.11328125, 0.147979736328125, 0.18267822265625, 0.217376708984375, 0.2520751953125, 0.286773681640625, 0.32147216796875, 0.356170654296875, 0.390869140625, 0.425567626953125, 0.46026611328125, 0.494964599609375, 0.5296630859375, 0.564361572265625, 0.59906005859375, 0.633758544921875, 0.66845703125, 0.703155517578125, 0.73785400390625, 0.772552490234375, 0.8072509765625, 0.841949462890625, 0.87664794921875, 0.911346435546875, 0.946044921875, 0.980743408203125, 1.01544189453125, 1.050140380859375, 1.0848388671875, 1.119537353515625, 1.15423583984375, 1.188934326171875, 1.2236328125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 4.0, 4.0, 10.0, 13.0, 9.0, 16.0, 22.0, 41.0, 42.0, 58.0, 56.0, 89.0, 111.0, 91.0, 85.0, 68.0, 60.0, 59.0, 39.0, 28.0, 24.0, 23.0, 16.0, 8.0, 8.0, 7.0, 4.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0517578125, -1.0192108154296875, -0.986663818359375, -0.9541168212890625, -0.92156982421875, -0.8890228271484375, -0.856475830078125, -0.8239288330078125, -0.7913818359375, -0.7588348388671875, -0.726287841796875, -0.6937408447265625, -0.66119384765625, -0.6286468505859375, -0.596099853515625, -0.5635528564453125, -0.531005859375, -0.4984588623046875, -0.465911865234375, -0.4333648681640625, -0.40081787109375, -0.3682708740234375, -0.335723876953125, -0.3031768798828125, -0.2706298828125, -0.2380828857421875, -0.205535888671875, -0.1729888916015625, -0.14044189453125, -0.1078948974609375, -0.075347900390625, -0.0428009033203125, -0.01025390625, 0.0222930908203125, 0.054840087890625, 0.0873870849609375, 0.11993408203125, 0.1524810791015625, 0.185028076171875, 0.2175750732421875, 0.2501220703125, 0.2826690673828125, 0.315216064453125, 0.3477630615234375, 0.38031005859375, 0.4128570556640625, 0.445404052734375, 0.4779510498046875, 0.510498046875, 0.5430450439453125, 0.575592041015625, 0.6081390380859375, 0.64068603515625, 0.6732330322265625, 0.705780029296875, 0.7383270263671875, 0.7708740234375, 0.8034210205078125, 0.835968017578125, 0.8685150146484375, 0.90106201171875, 0.9336090087890625, 0.966156005859375, 0.9987030029296875, 1.03125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 2.0, 5.0, 13.0, 22.0, 44.0, 75.0, 134.0, 292.0, 160.0, 88.0, 49.0, 58.0, 19.0, 11.0, 14.0, 4.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.96166229248047, -23.26805305480957, -22.574445724487305, -21.880836486816406, -21.187227249145508, -20.49361801147461, -19.800010681152344, -19.106401443481445, -18.412792205810547, -17.71918296813965, -17.025575637817383, -16.331966400146484, -15.638357162475586, -14.944748878479004, -14.251140594482422, -13.557531356811523, -12.863924026489258, -12.170315742492676, -11.476706504821777, -10.783098220825195, -10.089488983154297, -9.395880699157715, -8.702272415161133, -8.008663177490234, -7.315054893493652, -6.621446132659912, -5.927837371826172, -5.23422908782959, -4.54062032699585, -3.8470115661621094, -3.1534032821655273, -2.459794521331787, -1.7661876678466797, -1.072579026222229, -0.3789703845977783, 0.3146381378173828, 1.008246898651123, 1.7018556594848633, 2.3954639434814453, 3.0890727043151855, 3.782681465148926, 4.476290225982666, 5.169898986816406, 5.863507270812988, 6.5571160316467285, 7.250724792480469, 7.944333076477051, 8.637941360473633, 9.331550598144531, 10.025158882141113, 10.718768119812012, 11.412376403808594, 12.105985641479492, 12.799593925476074, 13.493202209472656, 14.186811447143555, 14.880419731140137, 15.574028015136719, 16.267637252807617, 16.961246490478516, 17.65485382080078, 18.34846305847168, 19.042072296142578, 19.735679626464844, 20.429288864135742]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 7.0, 4.0, 7.0, 0.0, 9.0, 13.0, 14.0, 5.0, 11.0, 16.0, 21.0, 23.0, 24.0, 28.0, 32.0, 40.0, 35.0, 50.0, 64.0, 97.0, 112.0, 63.0, 45.0, 39.0, 29.0, 25.0, 34.0, 26.0, 16.0, 25.0, 17.0, 15.0, 11.0, 6.0, 6.0, 10.0, 3.0, 6.0, 4.0, 3.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-19.079418182373047, -18.53337860107422, -17.98733901977539, -17.441299438476562, -16.895259857177734, -16.349220275878906, -15.803180694580078, -15.25714111328125, -14.711101531982422, -14.165061950683594, -13.619022369384766, -13.072982788085938, -12.52694320678711, -11.980903625488281, -11.434864044189453, -10.888824462890625, -10.34278392791748, -9.796744346618652, -9.250704765319824, -8.704665184020996, -8.158625602722168, -7.61258602142334, -7.0665459632873535, -6.520506381988525, -5.974466800689697, -5.428427219390869, -4.882387638092041, -4.336347579956055, -3.7903082370758057, -3.2442686557769775, -2.6982288360595703, -2.152189254760742, -1.606149673461914, -1.060110092163086, -0.5140703916549683, 0.031969308853149414, 0.5780088901519775, 1.1240484714508057, 1.670088291168213, 2.216127872467041, 2.762167453765869, 3.3082070350646973, 3.8542466163635254, 4.400286674499512, 4.94632625579834, 5.492365837097168, 6.038405418395996, 6.584444999694824, 7.130484580993652, 7.6765241622924805, 8.222563743591309, 8.768603324890137, 9.314642906188965, 9.860682487487793, 10.406723022460938, 10.952762603759766, 11.498802185058594, 12.044841766357422, 12.59088134765625, 13.136920928955078, 13.682960510253906, 14.229000091552734, 14.775039672851562, 15.32107925415039, 15.867118835449219]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 3.0, 4.0, 3.0, 2.0, 8.0, 10.0, 13.0, 12.0, 24.0, 31.0, 26.0, 47.0, 65.0, 92.0, 183.0, 289.0, 483.0, 802.0, 1495.0, 3016.0, 6723.0, 17922.0, 61545.0, 277610.0, 1233456.0, 1840686.0, 571741.0, 125839.0, 31919.0, 10794.0, 4552.0, 2165.0, 1125.0, 610.0, 349.0, 219.0, 144.0, 92.0, 52.0, 38.0, 32.0, 15.0, 17.0, 11.0, 11.0, 8.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.548828125, -1.5048675537109375, -1.460906982421875, -1.4169464111328125, -1.37298583984375, -1.3290252685546875, -1.285064697265625, -1.2411041259765625, -1.1971435546875, -1.1531829833984375, -1.109222412109375, -1.0652618408203125, -1.02130126953125, -0.9773406982421875, -0.933380126953125, -0.8894195556640625, -0.845458984375, -0.8014984130859375, -0.757537841796875, -0.7135772705078125, -0.66961669921875, -0.6256561279296875, -0.581695556640625, -0.5377349853515625, -0.4937744140625, -0.4498138427734375, -0.405853271484375, -0.3618927001953125, -0.31793212890625, -0.2739715576171875, -0.230010986328125, -0.1860504150390625, -0.14208984375, -0.0981292724609375, -0.054168701171875, -0.0102081298828125, 0.03375244140625, 0.0777130126953125, 0.121673583984375, 0.1656341552734375, 0.2095947265625, 0.2535552978515625, 0.297515869140625, 0.3414764404296875, 0.38543701171875, 0.4293975830078125, 0.473358154296875, 0.5173187255859375, 0.561279296875, 0.6052398681640625, 0.649200439453125, 0.6931610107421875, 0.73712158203125, 0.7810821533203125, 0.825042724609375, 0.8690032958984375, 0.9129638671875, 0.9569244384765625, 1.000885009765625, 1.0448455810546875, 1.08880615234375, 1.1327667236328125, 1.176727294921875, 1.2206878662109375, 1.2646484375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 5.0, 7.0, 4.0, 7.0, 9.0, 12.0, 22.0, 21.0, 13.0, 26.0, 36.0, 23.0, 28.0, 48.0, 40.0, 44.0, 50.0, 36.0, 65.0, 55.0, 49.0, 55.0, 42.0, 38.0, 48.0, 41.0, 35.0, 39.0, 29.0, 17.0, 3.0, 14.0, 7.0, 11.0, 6.0, 4.0, 4.0, 2.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.470703125, -1.42572021484375, -1.3807373046875, -1.33575439453125, -1.290771484375, -1.24578857421875, -1.2008056640625, -1.15582275390625, -1.11083984375, -1.06585693359375, -1.0208740234375, -0.97589111328125, -0.930908203125, -0.88592529296875, -0.8409423828125, -0.79595947265625, -0.7509765625, -0.70599365234375, -0.6610107421875, -0.61602783203125, -0.571044921875, -0.52606201171875, -0.4810791015625, -0.43609619140625, -0.39111328125, -0.34613037109375, -0.3011474609375, -0.25616455078125, -0.211181640625, -0.16619873046875, -0.1212158203125, -0.07623291015625, -0.03125, 0.01373291015625, 0.0587158203125, 0.10369873046875, 0.148681640625, 0.19366455078125, 0.2386474609375, 0.28363037109375, 0.32861328125, 0.37359619140625, 0.4185791015625, 0.46356201171875, 0.508544921875, 0.55352783203125, 0.5985107421875, 0.64349365234375, 0.6884765625, 0.73345947265625, 0.7784423828125, 0.82342529296875, 0.868408203125, 0.91339111328125, 0.9583740234375, 1.00335693359375, 1.04833984375, 1.09332275390625, 1.1383056640625, 1.18328857421875, 1.228271484375, 1.27325439453125, 1.3182373046875, 1.36322021484375, 1.408203125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 2.0, 9.0, 15.0, 16.0, 25.0, 41.0, 77.0, 119.0, 256.0, 619.0, 2159.0, 11202.0, 149032.0, 3799461.0, 214379.0, 13237.0, 2397.0, 702.0, 255.0, 130.0, 61.0, 28.0, 19.0, 9.0, 12.0, 5.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.775390625, -3.638336181640625, -3.50128173828125, -3.364227294921875, -3.2271728515625, -3.090118408203125, -2.95306396484375, -2.816009521484375, -2.678955078125, -2.541900634765625, -2.40484619140625, -2.267791748046875, -2.1307373046875, -1.993682861328125, -1.85662841796875, -1.719573974609375, -1.58251953125, -1.445465087890625, -1.30841064453125, -1.171356201171875, -1.0343017578125, -0.897247314453125, -0.76019287109375, -0.623138427734375, -0.486083984375, -0.349029541015625, -0.21197509765625, -0.074920654296875, 0.0621337890625, 0.199188232421875, 0.33624267578125, 0.473297119140625, 0.6103515625, 0.747406005859375, 0.88446044921875, 1.021514892578125, 1.1585693359375, 1.295623779296875, 1.43267822265625, 1.569732666015625, 1.706787109375, 1.843841552734375, 1.98089599609375, 2.117950439453125, 2.2550048828125, 2.392059326171875, 2.52911376953125, 2.666168212890625, 2.80322265625, 2.940277099609375, 3.07733154296875, 3.214385986328125, 3.3514404296875, 3.488494873046875, 3.62554931640625, 3.762603759765625, 3.899658203125, 4.036712646484375, 4.17376708984375, 4.310821533203125, 4.4478759765625, 4.584930419921875, 4.72198486328125, 4.859039306640625, 4.99609375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 6.0, 9.0, 9.0, 19.0, 15.0, 25.0, 30.0, 57.0, 86.0, 148.0, 251.0, 380.0, 573.0, 723.0, 642.0, 428.0, 256.0, 169.0, 89.0, 52.0, 31.0, 24.0, 17.0, 10.0, 10.0, 7.0, 5.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.982421875, -3.878936767578125, -3.77545166015625, -3.671966552734375, -3.5684814453125, -3.464996337890625, -3.36151123046875, -3.258026123046875, -3.154541015625, -3.051055908203125, -2.94757080078125, -2.844085693359375, -2.7406005859375, -2.637115478515625, -2.53363037109375, -2.430145263671875, -2.32666015625, -2.223175048828125, -2.11968994140625, -2.016204833984375, -1.9127197265625, -1.809234619140625, -1.70574951171875, -1.602264404296875, -1.498779296875, -1.395294189453125, -1.29180908203125, -1.188323974609375, -1.0848388671875, -0.981353759765625, -0.87786865234375, -0.774383544921875, -0.6708984375, -0.567413330078125, -0.46392822265625, -0.360443115234375, -0.2569580078125, -0.153472900390625, -0.04998779296875, 0.053497314453125, 0.156982421875, 0.260467529296875, 0.36395263671875, 0.467437744140625, 0.5709228515625, 0.674407958984375, 0.77789306640625, 0.881378173828125, 0.98486328125, 1.088348388671875, 1.19183349609375, 1.295318603515625, 1.3988037109375, 1.502288818359375, 1.60577392578125, 1.709259033203125, 1.812744140625, 1.916229248046875, 2.01971435546875, 2.123199462890625, 2.2266845703125, 2.330169677734375, 2.43365478515625, 2.537139892578125, 2.640625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 2.0, 9.0, 11.0, 19.0, 79.0, 237.0, 342.0, 194.0, 77.0, 30.0, 3.0, 0.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.531721115112305, -23.98343849182129, -22.435155868530273, -20.886873245239258, -19.338590621948242, -17.790307998657227, -16.242023468017578, -14.693741798400879, -13.145459175109863, -11.597176551818848, -10.048893928527832, -8.5006103515625, -6.952328205108643, -5.404045581817627, -3.855762481689453, -2.3074798583984375, -0.7591972351074219, 0.7890855073928833, 2.3373682498931885, 3.885651111602783, 5.433933734893799, 6.9822163581848145, 8.530499458312988, 10.078782081604004, 11.62706470489502, 13.175347328186035, 14.72362995147705, 16.271913528442383, 17.8201961517334, 19.368478775024414, 20.91676139831543, 22.465044021606445, 24.013324737548828, 25.561607360839844, 27.10988998413086, 28.658172607421875, 30.20645523071289, 31.754737854003906, 33.30302047729492, 34.85130310058594, 36.39958572387695, 37.94786834716797, 39.496150970458984, 41.04443359375, 42.592716217041016, 44.14099884033203, 45.68928146362305, 47.23756408691406, 48.785850524902344, 50.33413314819336, 51.882415771484375, 53.43069839477539, 54.978981018066406, 56.52726364135742, 58.07554626464844, 59.62382888793945, 61.17211151123047, 62.720394134521484, 64.2686767578125, 65.81696319580078, 67.36524200439453, 68.91352844238281, 70.46180725097656, 72.01009368896484, 73.5583724975586]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 8.0, 8.0, 5.0, 10.0, 6.0, 17.0, 20.0, 17.0, 28.0, 34.0, 35.0, 30.0, 44.0, 31.0, 34.0, 54.0, 51.0, 46.0, 55.0, 58.0, 48.0, 48.0, 34.0, 32.0, 33.0, 26.0, 32.0, 25.0, 27.0, 27.0, 22.0, 9.0, 9.0, 11.0, 5.0, 4.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.722419738769531, -10.330253601074219, -9.938087463378906, -9.545921325683594, -9.153755187988281, -8.761589050292969, -8.369422912597656, -7.97725772857666, -7.585091590881348, -7.192925453186035, -6.800759315490723, -6.40859317779541, -6.016427516937256, -5.624261379241943, -5.232095241546631, -4.839929580688477, -4.447762966156006, -4.055596828460693, -3.66343092918396, -3.2712647914886475, -2.879098892211914, -2.4869327545166016, -2.094766616821289, -1.7026007175445557, -1.3104345798492432, -0.9182685613632202, -0.5261024832725525, -0.13393640518188477, 0.2582296133041382, 0.6503956317901611, 1.0425617694854736, 1.434727668762207, 1.8268938064575195, 2.219059944152832, 2.6112258434295654, 3.003391981124878, 3.3955578804016113, 3.787724018096924, 4.179890155792236, 4.572055816650391, 4.964221954345703, 5.356388092041016, 5.748554229736328, 6.140720367431641, 6.532886028289795, 6.925052165985107, 7.31721830368042, 7.709383964538574, 8.101551055908203, 8.493717193603516, 8.885883331298828, 9.27804946899414, 9.670215606689453, 10.062381744384766, 10.454547882080078, 10.846713066101074, 11.238879203796387, 11.6310453414917, 12.023211479187012, 12.415377616882324, 12.807543754577637, 13.199708938598633, 13.591875076293945, 13.984041213989258, 14.37620735168457]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 15.0, 14.0, 26.0, 32.0, 41.0, 64.0, 99.0, 165.0, 265.0, 329.0, 615.0, 1007.0, 1653.0, 2877.0, 5159.0, 9102.0, 17191.0, 32841.0, 67796.0, 145375.0, 276893.0, 247213.0, 121122.0, 56820.0, 28202.0, 14704.0, 7945.0, 4440.0, 2572.0, 1533.0, 978.0, 509.0, 348.0, 209.0, 131.0, 85.0, 75.0, 34.0, 22.0, 16.0, 15.0, 11.0, 5.0, 6.0, 3.0, 1.0, 2.0, 2.0], "bins": [-1.9990234375, -1.94482421875, -1.890625, -1.83642578125, -1.7822265625, -1.72802734375, -1.673828125, -1.61962890625, -1.5654296875, -1.51123046875, -1.45703125, -1.40283203125, -1.3486328125, -1.29443359375, -1.240234375, -1.18603515625, -1.1318359375, -1.07763671875, -1.0234375, -0.96923828125, -0.9150390625, -0.86083984375, -0.806640625, -0.75244140625, -0.6982421875, -0.64404296875, -0.58984375, -0.53564453125, -0.4814453125, -0.42724609375, -0.373046875, -0.31884765625, -0.2646484375, -0.21044921875, -0.15625, -0.10205078125, -0.0478515625, 0.00634765625, 0.060546875, 0.11474609375, 0.1689453125, 0.22314453125, 0.27734375, 0.33154296875, 0.3857421875, 0.43994140625, 0.494140625, 0.54833984375, 0.6025390625, 0.65673828125, 0.7109375, 0.76513671875, 0.8193359375, 0.87353515625, 0.927734375, 0.98193359375, 1.0361328125, 1.09033203125, 1.14453125, 1.19873046875, 1.2529296875, 1.30712890625, 1.361328125, 1.41552734375, 1.4697265625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 6.0, 2.0, 1.0, 4.0, 4.0, 6.0, 7.0, 10.0, 13.0, 14.0, 15.0, 9.0, 22.0, 19.0, 26.0, 29.0, 33.0, 25.0, 46.0, 36.0, 32.0, 37.0, 34.0, 36.0, 35.0, 41.0, 43.0, 44.0, 39.0, 43.0, 39.0, 36.0, 29.0, 22.0, 36.0, 30.0, 18.0, 17.0, 13.0, 9.0, 6.0, 8.0, 9.0, 7.0, 6.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-1.1787109375, -1.1412811279296875, -1.103851318359375, -1.0664215087890625, -1.02899169921875, -0.9915618896484375, -0.954132080078125, -0.9167022705078125, -0.8792724609375, -0.8418426513671875, -0.804412841796875, -0.7669830322265625, -0.72955322265625, -0.6921234130859375, -0.654693603515625, -0.6172637939453125, -0.579833984375, -0.5424041748046875, -0.504974365234375, -0.4675445556640625, -0.43011474609375, -0.3926849365234375, -0.355255126953125, -0.3178253173828125, -0.2803955078125, -0.2429656982421875, -0.205535888671875, -0.1681060791015625, -0.13067626953125, -0.0932464599609375, -0.055816650390625, -0.0183868408203125, 0.01904296875, 0.0564727783203125, 0.093902587890625, 0.1313323974609375, 0.16876220703125, 0.2061920166015625, 0.243621826171875, 0.2810516357421875, 0.3184814453125, 0.3559112548828125, 0.393341064453125, 0.4307708740234375, 0.46820068359375, 0.5056304931640625, 0.543060302734375, 0.5804901123046875, 0.617919921875, 0.6553497314453125, 0.692779541015625, 0.7302093505859375, 0.76763916015625, 0.8050689697265625, 0.842498779296875, 0.8799285888671875, 0.9173583984375, 0.9547882080078125, 0.992218017578125, 1.0296478271484375, 1.06707763671875, 1.1045074462890625, 1.141937255859375, 1.1793670654296875, 1.216796875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 10.0, 8.0, 13.0, 16.0, 27.0, 35.0, 42.0, 57.0, 92.0, 158.0, 231.0, 314.0, 456.0, 820.0, 1523.0, 3607.0, 15205.0, 126732.0, 800906.0, 80861.0, 11101.0, 2996.0, 1265.0, 694.0, 452.0, 298.0, 184.0, 136.0, 95.0, 61.0, 45.0, 35.0, 25.0, 14.0, 15.0, 10.0, 4.0, 9.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.51953125, -4.38006591796875, -4.2406005859375, -4.10113525390625, -3.961669921875, -3.82220458984375, -3.6827392578125, -3.54327392578125, -3.40380859375, -3.26434326171875, -3.1248779296875, -2.98541259765625, -2.845947265625, -2.70648193359375, -2.5670166015625, -2.42755126953125, -2.2880859375, -2.14862060546875, -2.0091552734375, -1.86968994140625, -1.730224609375, -1.59075927734375, -1.4512939453125, -1.31182861328125, -1.17236328125, -1.03289794921875, -0.8934326171875, -0.75396728515625, -0.614501953125, -0.47503662109375, -0.3355712890625, -0.19610595703125, -0.056640625, 0.08282470703125, 0.2222900390625, 0.36175537109375, 0.501220703125, 0.64068603515625, 0.7801513671875, 0.91961669921875, 1.05908203125, 1.19854736328125, 1.3380126953125, 1.47747802734375, 1.616943359375, 1.75640869140625, 1.8958740234375, 2.03533935546875, 2.1748046875, 2.31427001953125, 2.4537353515625, 2.59320068359375, 2.732666015625, 2.87213134765625, 3.0115966796875, 3.15106201171875, 3.29052734375, 3.42999267578125, 3.5694580078125, 3.70892333984375, 3.848388671875, 3.98785400390625, 4.1273193359375, 4.26678466796875, 4.40625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 2.0, 5.0, 11.0, 11.0, 11.0, 14.0, 16.0, 15.0, 14.0, 28.0, 23.0, 31.0, 35.0, 44.0, 29.0, 53.0, 43.0, 44.0, 41.0, 35.0, 40.0, 63.0, 41.0, 37.0, 50.0, 41.0, 32.0, 30.0, 23.0, 25.0, 16.0, 14.0, 19.0, 11.0, 6.0, 15.0, 11.0, 6.0, 5.0, 2.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-4.6640625, -4.52984619140625, -4.3956298828125, -4.26141357421875, -4.127197265625, -3.99298095703125, -3.8587646484375, -3.72454833984375, -3.59033203125, -3.45611572265625, -3.3218994140625, -3.18768310546875, -3.053466796875, -2.91925048828125, -2.7850341796875, -2.65081787109375, -2.5166015625, -2.38238525390625, -2.2481689453125, -2.11395263671875, -1.979736328125, -1.84552001953125, -1.7113037109375, -1.57708740234375, -1.44287109375, -1.30865478515625, -1.1744384765625, -1.04022216796875, -0.906005859375, -0.77178955078125, -0.6375732421875, -0.50335693359375, -0.369140625, -0.23492431640625, -0.1007080078125, 0.03350830078125, 0.167724609375, 0.30194091796875, 0.4361572265625, 0.57037353515625, 0.70458984375, 0.83880615234375, 0.9730224609375, 1.10723876953125, 1.241455078125, 1.37567138671875, 1.5098876953125, 1.64410400390625, 1.7783203125, 1.91253662109375, 2.0467529296875, 2.18096923828125, 2.315185546875, 2.44940185546875, 2.5836181640625, 2.71783447265625, 2.85205078125, 2.98626708984375, 3.1204833984375, 3.25469970703125, 3.388916015625, 3.52313232421875, 3.6573486328125, 3.79156494140625, 3.92578125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 5.0, 4.0, 6.0, 6.0, 13.0, 21.0, 19.0, 20.0, 24.0, 43.0, 66.0, 97.0, 142.0, 188.0, 329.0, 659.0, 1268.0, 3021.0, 8466.0, 32355.0, 160490.0, 705459.0, 102485.0, 22163.0, 6320.0, 2393.0, 1039.0, 550.0, 309.0, 184.0, 119.0, 74.0, 73.0, 35.0, 25.0, 18.0, 14.0, 16.0, 13.0, 4.0, 5.0, 6.0, 6.0, 1.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.85400390625, -0.8276214599609375, -0.801239013671875, -0.7748565673828125, -0.74847412109375, -0.7220916748046875, -0.695709228515625, -0.6693267822265625, -0.6429443359375, -0.6165618896484375, -0.590179443359375, -0.5637969970703125, -0.53741455078125, -0.5110321044921875, -0.484649658203125, -0.4582672119140625, -0.431884765625, -0.4055023193359375, -0.379119873046875, -0.3527374267578125, -0.32635498046875, -0.2999725341796875, -0.273590087890625, -0.2472076416015625, -0.2208251953125, -0.1944427490234375, -0.168060302734375, -0.1416778564453125, -0.11529541015625, -0.0889129638671875, -0.062530517578125, -0.0361480712890625, -0.009765625, 0.0166168212890625, 0.042999267578125, 0.0693817138671875, 0.09576416015625, 0.1221466064453125, 0.148529052734375, 0.1749114990234375, 0.2012939453125, 0.2276763916015625, 0.254058837890625, 0.2804412841796875, 0.30682373046875, 0.3332061767578125, 0.359588623046875, 0.3859710693359375, 0.412353515625, 0.4387359619140625, 0.465118408203125, 0.4915008544921875, 0.51788330078125, 0.5442657470703125, 0.570648193359375, 0.5970306396484375, 0.6234130859375, 0.6497955322265625, 0.676177978515625, 0.7025604248046875, 0.72894287109375, 0.7553253173828125, 0.781707763671875, 0.8080902099609375, 0.83447265625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 7.0, 2.0, 4.0, 4.0, 8.0, 8.0, 2.0, 11.0, 11.0, 25.0, 31.0, 34.0, 43.0, 67.0, 122.0, 127.0, 104.0, 93.0, 75.0, 58.0, 46.0, 34.0, 34.0, 16.0, 10.0, 5.0, 6.0, 6.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0004191398620605469, -0.00040678679943084717, -0.00039443373680114746, -0.00038208067417144775, -0.00036972761154174805, -0.00035737454891204834, -0.00034502148628234863, -0.0003326684236526489, -0.0003203153610229492, -0.0003079622983932495, -0.0002956092357635498, -0.0002832561731338501, -0.0002709031105041504, -0.0002585500478744507, -0.000246196985244751, -0.00023384392261505127, -0.00022149085998535156, -0.00020913779735565186, -0.00019678473472595215, -0.00018443167209625244, -0.00017207860946655273, -0.00015972554683685303, -0.00014737248420715332, -0.0001350194215774536, -0.0001226663589477539, -0.0001103132963180542, -9.796023368835449e-05, -8.560717105865479e-05, -7.325410842895508e-05, -6.090104579925537e-05, -4.8547983169555664e-05, -3.619492053985596e-05, -2.384185791015625e-05, -1.1488795280456543e-05, 8.642673492431641e-07, 1.3217329978942871e-05, 2.5570392608642578e-05, 3.7923455238342285e-05, 5.027651786804199e-05, 6.26295804977417e-05, 7.49826431274414e-05, 8.733570575714111e-05, 9.968876838684082e-05, 0.00011204183101654053, 0.00012439489364624023, 0.00013674795627593994, 0.00014910101890563965, 0.00016145408153533936, 0.00017380714416503906, 0.00018616020679473877, 0.00019851326942443848, 0.00021086633205413818, 0.0002232193946838379, 0.0002355724573135376, 0.0002479255199432373, 0.000260278582572937, 0.0002726316452026367, 0.0002849847078323364, 0.00029733777046203613, 0.00030969083309173584, 0.00032204389572143555, 0.00033439695835113525, 0.00034675002098083496, 0.00035910308361053467, 0.0003714561462402344]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 8.0, 12.0, 21.0, 22.0, 32.0, 56.0, 82.0, 165.0, 317.0, 576.0, 1220.0, 3616.0, 15209.0, 107147.0, 779013.0, 118096.0, 16574.0, 3798.0, 1270.0, 568.0, 302.0, 157.0, 107.0, 69.0, 42.0, 21.0, 13.0, 17.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0009765625, -0.967071533203125, -0.93316650390625, -0.899261474609375, -0.8653564453125, -0.831451416015625, -0.79754638671875, -0.763641357421875, -0.729736328125, -0.695831298828125, -0.66192626953125, -0.628021240234375, -0.5941162109375, -0.560211181640625, -0.52630615234375, -0.492401123046875, -0.45849609375, -0.424591064453125, -0.39068603515625, -0.356781005859375, -0.3228759765625, -0.288970947265625, -0.25506591796875, -0.221160888671875, -0.187255859375, -0.153350830078125, -0.11944580078125, -0.085540771484375, -0.0516357421875, -0.017730712890625, 0.01617431640625, 0.050079345703125, 0.083984375, 0.117889404296875, 0.15179443359375, 0.185699462890625, 0.2196044921875, 0.253509521484375, 0.28741455078125, 0.321319580078125, 0.355224609375, 0.389129638671875, 0.42303466796875, 0.456939697265625, 0.4908447265625, 0.524749755859375, 0.55865478515625, 0.592559814453125, 0.62646484375, 0.660369873046875, 0.69427490234375, 0.728179931640625, 0.7620849609375, 0.795989990234375, 0.82989501953125, 0.863800048828125, 0.897705078125, 0.931610107421875, 0.96551513671875, 0.999420166015625, 1.0333251953125, 1.067230224609375, 1.10113525390625, 1.135040283203125, 1.1689453125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 2.0, 4.0, 3.0, 15.0, 9.0, 12.0, 16.0, 25.0, 40.0, 47.0, 69.0, 71.0, 95.0, 91.0, 110.0, 86.0, 74.0, 65.0, 44.0, 35.0, 18.0, 20.0, 19.0, 7.0, 12.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83544921875, -0.8017349243164062, -0.7680206298828125, -0.7343063354492188, -0.700592041015625, -0.6668777465820312, -0.6331634521484375, -0.5994491577148438, -0.56573486328125, -0.5320205688476562, -0.4983062744140625, -0.46459197998046875, -0.430877685546875, -0.39716339111328125, -0.3634490966796875, -0.32973480224609375, -0.2960205078125, -0.26230621337890625, -0.2285919189453125, -0.19487762451171875, -0.161163330078125, -0.12744903564453125, -0.0937347412109375, -0.06002044677734375, -0.02630615234375, 0.00740814208984375, 0.0411224365234375, 0.07483673095703125, 0.108551025390625, 0.14226531982421875, 0.1759796142578125, 0.20969390869140625, 0.243408203125, 0.27712249755859375, 0.3108367919921875, 0.34455108642578125, 0.378265380859375, 0.41197967529296875, 0.4456939697265625, 0.47940826416015625, 0.51312255859375, 0.5468368530273438, 0.5805511474609375, 0.6142654418945312, 0.647979736328125, 0.6816940307617188, 0.7154083251953125, 0.7491226196289062, 0.7828369140625, 0.8165512084960938, 0.8502655029296875, 0.8839797973632812, 0.917694091796875, 0.9514083862304688, 0.9851226806640625, 1.0188369750976562, 1.05255126953125, 1.0862655639648438, 1.1199798583984375, 1.1536941528320312, 1.187408447265625, 1.2211227416992188, 1.2548370361328125, 1.2885513305664062, 1.322265625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 7.0, 30.0, 50.0, 111.0, 435.0, 242.0, 79.0, 29.0, 8.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-46.56085205078125, -45.22489547729492, -43.888938903808594, -42.552978515625, -41.21702194213867, -39.881065368652344, -38.545108795166016, -37.20915222167969, -35.87319564819336, -34.53723907470703, -33.2012825012207, -31.865324020385742, -30.529367446899414, -29.193408966064453, -27.857452392578125, -26.521495819091797, -25.185537338256836, -23.849580764770508, -22.513622283935547, -21.17766571044922, -19.84170913696289, -18.505752563476562, -17.1697940826416, -15.833837509155273, -14.497879981994629, -13.161922454833984, -11.825965881347656, -10.490008354187012, -9.154050827026367, -7.818094253540039, -6.4821367263793945, -5.146180152893066, -3.810222625732422, -2.4742655754089355, -1.1383082866668701, 0.1976490020751953, 1.5336060523986816, 2.869563102722168, 4.2055206298828125, 5.541477203369141, 6.877434730529785, 8.21339225769043, 9.549348831176758, 10.885306358337402, 12.221263885498047, 13.557220458984375, 14.89317798614502, 16.22913360595703, 17.565092086791992, 18.90104866027832, 20.23700714111328, 21.57296371459961, 22.908920288085938, 24.244876861572266, 25.580835342407227, 26.916791915893555, 28.252750396728516, 29.588706970214844, 30.924665451049805, 32.2606201171875, 33.596580505371094, 34.93253707885742, 36.26849365234375, 37.60445022583008, 38.940406799316406]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 0.0, 5.0, 3.0, 8.0, 6.0, 6.0, 6.0, 8.0, 17.0, 18.0, 14.0, 34.0, 18.0, 37.0, 39.0, 37.0, 30.0, 40.0, 93.0, 169.0, 110.0, 50.0, 39.0, 31.0, 27.0, 24.0, 23.0, 18.0, 18.0, 11.0, 13.0, 9.0, 12.0, 9.0, 7.0, 3.0, 10.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.820205688476562, -20.216535568237305, -19.61286735534668, -19.009197235107422, -18.405527114868164, -17.801856994628906, -17.19818878173828, -16.594518661499023, -15.990849494934082, -15.38718032836914, -14.783510208129883, -14.179841041564941, -13.576171875, -12.972501754760742, -12.3688325881958, -11.76516342163086, -11.161493301391602, -10.55782413482666, -9.954154014587402, -9.350484848022461, -8.746814727783203, -8.143145561218262, -7.53947639465332, -6.935806751251221, -6.332137107849121, -5.7284674644470215, -5.124797821044922, -4.5211286544799805, -3.917459011077881, -3.3137893676757812, -2.7101199626922607, -2.1064505577087402, -1.5027790069580078, -0.8991094827651978, -0.2954399585723877, 0.30822956562042236, 0.9118990898132324, 1.515568733215332, 2.1192381381988525, 2.722907543182373, 3.3265771865844727, 3.9302468299865723, 4.533916473388672, 5.137585639953613, 5.741255283355713, 6.3449249267578125, 6.948594093322754, 7.5522637367248535, 8.155933380126953, 8.759602546691895, 9.363272666931152, 9.966941833496094, 10.570611953735352, 11.174281120300293, 11.777950286865234, 12.381620407104492, 12.985289573669434, 13.588958740234375, 14.192628860473633, 14.796298027038574, 15.399967193603516, 16.003637313842773, 16.60730743408203, 17.210975646972656, 17.814645767211914]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 10.0, 9.0, 6.0, 9.0, 12.0, 22.0, 25.0, 41.0, 68.0, 65.0, 130.0, 210.0, 304.0, 472.0, 899.0, 1696.0, 3754.0, 10507.0, 41537.0, 257777.0, 1479665.0, 1909092.0, 400133.0, 63106.0, 15107.0, 5099.0, 2014.0, 1009.0, 566.0, 315.0, 222.0, 148.0, 88.0, 42.0, 42.0, 23.0, 18.0, 15.0, 10.0, 2.0, 9.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.505859375, -2.432403564453125, -2.35894775390625, -2.285491943359375, -2.2120361328125, -2.138580322265625, -2.06512451171875, -1.991668701171875, -1.918212890625, -1.844757080078125, -1.77130126953125, -1.697845458984375, -1.6243896484375, -1.550933837890625, -1.47747802734375, -1.404022216796875, -1.33056640625, -1.257110595703125, -1.18365478515625, -1.110198974609375, -1.0367431640625, -0.963287353515625, -0.88983154296875, -0.816375732421875, -0.742919921875, -0.669464111328125, -0.59600830078125, -0.522552490234375, -0.4490966796875, -0.375640869140625, -0.30218505859375, -0.228729248046875, -0.1552734375, -0.081817626953125, -0.00836181640625, 0.065093994140625, 0.1385498046875, 0.212005615234375, 0.28546142578125, 0.358917236328125, 0.432373046875, 0.505828857421875, 0.57928466796875, 0.652740478515625, 0.7261962890625, 0.799652099609375, 0.87310791015625, 0.946563720703125, 1.02001953125, 1.093475341796875, 1.16693115234375, 1.240386962890625, 1.3138427734375, 1.387298583984375, 1.46075439453125, 1.534210205078125, 1.607666015625, 1.681121826171875, 1.75457763671875, 1.828033447265625, 1.9014892578125, 1.974945068359375, 2.04840087890625, 2.121856689453125, 2.1953125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 5.0, 1.0, 4.0, 4.0, 5.0, 5.0, 6.0, 14.0, 13.0, 17.0, 12.0, 30.0, 31.0, 31.0, 41.0, 51.0, 51.0, 62.0, 46.0, 58.0, 53.0, 48.0, 58.0, 62.0, 48.0, 49.0, 45.0, 22.0, 36.0, 26.0, 26.0, 8.0, 11.0, 11.0, 5.0, 4.0, 5.0, 1.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.9482421875, -1.89862060546875, -1.8489990234375, -1.79937744140625, -1.749755859375, -1.70013427734375, -1.6505126953125, -1.60089111328125, -1.55126953125, -1.50164794921875, -1.4520263671875, -1.40240478515625, -1.352783203125, -1.30316162109375, -1.2535400390625, -1.20391845703125, -1.154296875, -1.10467529296875, -1.0550537109375, -1.00543212890625, -0.955810546875, -0.90618896484375, -0.8565673828125, -0.80694580078125, -0.75732421875, -0.70770263671875, -0.6580810546875, -0.60845947265625, -0.558837890625, -0.50921630859375, -0.4595947265625, -0.40997314453125, -0.3603515625, -0.31072998046875, -0.2611083984375, -0.21148681640625, -0.161865234375, -0.11224365234375, -0.0626220703125, -0.01300048828125, 0.03662109375, 0.08624267578125, 0.1358642578125, 0.18548583984375, 0.235107421875, 0.28472900390625, 0.3343505859375, 0.38397216796875, 0.43359375, 0.48321533203125, 0.5328369140625, 0.58245849609375, 0.632080078125, 0.68170166015625, 0.7313232421875, 0.78094482421875, 0.83056640625, 0.88018798828125, 0.9298095703125, 0.97943115234375, 1.029052734375, 1.07867431640625, 1.1282958984375, 1.17791748046875, 1.2275390625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 7.0, 7.0, 18.0, 18.0, 23.0, 78.0, 152.0, 351.0, 948.0, 3418.0, 53858.0, 4097770.0, 33405.0, 2803.0, 864.0, 330.0, 107.0, 57.0, 29.0, 16.0, 10.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3203125, -9.95751953125, -9.5947265625, -9.23193359375, -8.869140625, -8.50634765625, -8.1435546875, -7.78076171875, -7.41796875, -7.05517578125, -6.6923828125, -6.32958984375, -5.966796875, -5.60400390625, -5.2412109375, -4.87841796875, -4.515625, -4.15283203125, -3.7900390625, -3.42724609375, -3.064453125, -2.70166015625, -2.3388671875, -1.97607421875, -1.61328125, -1.25048828125, -0.8876953125, -0.52490234375, -0.162109375, 0.20068359375, 0.5634765625, 0.92626953125, 1.2890625, 1.65185546875, 2.0146484375, 2.37744140625, 2.740234375, 3.10302734375, 3.4658203125, 3.82861328125, 4.19140625, 4.55419921875, 4.9169921875, 5.27978515625, 5.642578125, 6.00537109375, 6.3681640625, 6.73095703125, 7.09375, 7.45654296875, 7.8193359375, 8.18212890625, 8.544921875, 8.90771484375, 9.2705078125, 9.63330078125, 9.99609375, 10.35888671875, 10.7216796875, 11.08447265625, 11.447265625, 11.81005859375, 12.1728515625, 12.53564453125, 12.8984375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 7.0, 18.0, 24.0, 29.0, 69.0, 130.0, 188.0, 280.0, 549.0, 893.0, 817.0, 432.0, 273.0, 142.0, 95.0, 60.0, 26.0, 17.0, 9.0, 7.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-8.8671875, -8.664794921875, -8.46240234375, -8.260009765625, -8.0576171875, -7.855224609375, -7.65283203125, -7.450439453125, -7.248046875, -7.045654296875, -6.84326171875, -6.640869140625, -6.4384765625, -6.236083984375, -6.03369140625, -5.831298828125, -5.62890625, -5.426513671875, -5.22412109375, -5.021728515625, -4.8193359375, -4.616943359375, -4.41455078125, -4.212158203125, -4.009765625, -3.807373046875, -3.60498046875, -3.402587890625, -3.2001953125, -2.997802734375, -2.79541015625, -2.593017578125, -2.390625, -2.188232421875, -1.98583984375, -1.783447265625, -1.5810546875, -1.378662109375, -1.17626953125, -0.973876953125, -0.771484375, -0.569091796875, -0.36669921875, -0.164306640625, 0.0380859375, 0.240478515625, 0.44287109375, 0.645263671875, 0.84765625, 1.050048828125, 1.25244140625, 1.454833984375, 1.6572265625, 1.859619140625, 2.06201171875, 2.264404296875, 2.466796875, 2.669189453125, 2.87158203125, 3.073974609375, 3.2763671875, 3.478759765625, 3.68115234375, 3.883544921875, 4.0859375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 10.0, 14.0, 26.0, 101.0, 311.0, 360.0, 115.0, 34.0, 18.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-122.20375061035156, -119.07085418701172, -115.93795776367188, -112.80506134033203, -109.67216491699219, -106.53927612304688, -103.40637969970703, -100.27348327636719, -97.14058685302734, -94.0076904296875, -90.87479400634766, -87.74189758300781, -84.6090087890625, -81.47611236572266, -78.34321594238281, -75.21031951904297, -72.07742309570312, -68.94452667236328, -65.81163024902344, -62.67873764038086, -59.545841217041016, -56.41294479370117, -53.280052185058594, -50.14715576171875, -47.014259338378906, -43.88136291503906, -40.74846649169922, -37.61557388305664, -34.4826774597168, -31.349781036376953, -28.216886520385742, -25.08399200439453, -21.951095581054688, -18.818199157714844, -15.685304641723633, -12.552409172058105, -9.419513702392578, -6.286618232727051, -3.1537227630615234, -0.0208282470703125, 3.1120681762695312, 6.244963645935059, 9.377859115600586, 12.510754585266113, 15.64365005493164, 18.776546478271484, 21.909440994262695, 25.042335510253906, 28.17523193359375, 31.308128356933594, 34.44102478027344, 37.573917388916016, 40.70681381225586, 43.8397102355957, 46.97260284423828, 50.105499267578125, 53.23839569091797, 56.37129211425781, 59.504188537597656, 62.637081146240234, 65.76997375488281, 68.90287017822266, 72.0357666015625, 75.16866302490234, 78.30155944824219]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 8.0, 8.0, 10.0, 19.0, 19.0, 40.0, 44.0, 53.0, 86.0, 117.0, 143.0, 103.0, 93.0, 79.0, 62.0, 44.0, 31.0, 17.0, 13.0, 13.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.63609313964844, -49.99907302856445, -48.36205291748047, -46.725032806396484, -45.0880126953125, -43.45099639892578, -41.8139762878418, -40.17695617675781, -38.53993606567383, -36.902915954589844, -35.26589584350586, -33.628875732421875, -31.991857528686523, -30.35483741760254, -28.717819213867188, -27.080799102783203, -25.44377899169922, -23.806758880615234, -22.16973876953125, -20.5327205657959, -18.895700454711914, -17.25868034362793, -15.621661186218262, -13.984642028808594, -12.34762191772461, -10.710601806640625, -9.073582649230957, -7.436563014984131, -5.799543380737305, -4.16252326965332, -2.5255041122436523, -0.8884849548339844, 0.74853515625, 2.385554790496826, 4.022574424743652, 5.6595940589904785, 7.296613693237305, 8.933633804321289, 10.570652961730957, 12.207672119140625, 13.84469223022461, 15.481712341308594, 17.118732452392578, 18.75575065612793, 20.392770767211914, 22.0297908782959, 23.66680908203125, 25.303829193115234, 26.94084930419922, 28.577869415283203, 30.214889526367188, 31.85190773010254, 33.488929748535156, 35.125946044921875, 36.76296615600586, 38.399986267089844, 40.03700637817383, 41.67402648925781, 43.3110466003418, 44.94806671142578, 46.5850830078125, 48.22210693359375, 49.85912322998047, 51.49614334106445, 53.13316345214844]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 6.0, 12.0, 14.0, 15.0, 25.0, 43.0, 71.0, 104.0, 210.0, 461.0, 1012.0, 2404.0, 6492.0, 23714.0, 126200.0, 715054.0, 136233.0, 25221.0, 6852.0, 2358.0, 1046.0, 464.0, 237.0, 109.0, 65.0, 38.0, 21.0, 23.0, 10.0, 10.0, 7.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.984375, -3.85382080078125, -3.7232666015625, -3.59271240234375, -3.462158203125, -3.33160400390625, -3.2010498046875, -3.07049560546875, -2.93994140625, -2.80938720703125, -2.6788330078125, -2.54827880859375, -2.417724609375, -2.28717041015625, -2.1566162109375, -2.02606201171875, -1.8955078125, -1.76495361328125, -1.6343994140625, -1.50384521484375, -1.373291015625, -1.24273681640625, -1.1121826171875, -0.98162841796875, -0.85107421875, -0.72052001953125, -0.5899658203125, -0.45941162109375, -0.328857421875, -0.19830322265625, -0.0677490234375, 0.06280517578125, 0.193359375, 0.32391357421875, 0.4544677734375, 0.58502197265625, 0.715576171875, 0.84613037109375, 0.9766845703125, 1.10723876953125, 1.23779296875, 1.36834716796875, 1.4989013671875, 1.62945556640625, 1.760009765625, 1.89056396484375, 2.0211181640625, 2.15167236328125, 2.2822265625, 2.41278076171875, 2.5433349609375, 2.67388916015625, 2.804443359375, 2.93499755859375, 3.0655517578125, 3.19610595703125, 3.32666015625, 3.45721435546875, 3.5877685546875, 3.71832275390625, 3.848876953125, 3.97943115234375, 4.1099853515625, 4.24053955078125, 4.37109375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 8.0, 16.0, 20.0, 39.0, 46.0, 70.0, 110.0, 110.0, 106.0, 113.0, 102.0, 86.0, 72.0, 43.0, 21.0, 18.0, 13.0, 8.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.857421875, -3.739349365234375, -3.62127685546875, -3.503204345703125, -3.3851318359375, -3.267059326171875, -3.14898681640625, -3.030914306640625, -2.912841796875, -2.794769287109375, -2.67669677734375, -2.558624267578125, -2.4405517578125, -2.322479248046875, -2.20440673828125, -2.086334228515625, -1.96826171875, -1.850189208984375, -1.73211669921875, -1.614044189453125, -1.4959716796875, -1.377899169921875, -1.25982666015625, -1.141754150390625, -1.023681640625, -0.905609130859375, -0.78753662109375, -0.669464111328125, -0.5513916015625, -0.433319091796875, -0.31524658203125, -0.197174072265625, -0.0791015625, 0.038970947265625, 0.15704345703125, 0.275115966796875, 0.3931884765625, 0.511260986328125, 0.62933349609375, 0.747406005859375, 0.865478515625, 0.983551025390625, 1.10162353515625, 1.219696044921875, 1.3377685546875, 1.455841064453125, 1.57391357421875, 1.691986083984375, 1.81005859375, 1.928131103515625, 2.04620361328125, 2.164276123046875, 2.2823486328125, 2.400421142578125, 2.51849365234375, 2.636566162109375, 2.754638671875, 2.872711181640625, 2.99078369140625, 3.108856201171875, 3.2269287109375, 3.345001220703125, 3.46307373046875, 3.581146240234375, 3.69921875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 6.0, 9.0, 7.0, 7.0, 21.0, 18.0, 22.0, 25.0, 42.0, 58.0, 83.0, 107.0, 174.0, 288.0, 471.0, 876.0, 2139.0, 6834.0, 36585.0, 845297.0, 132921.0, 15751.0, 3729.0, 1435.0, 628.0, 352.0, 188.0, 145.0, 95.0, 56.0, 49.0, 25.0, 30.0, 17.0, 13.0, 15.0, 6.0, 7.0, 6.0, 3.0, 3.0, 3.0, 3.0, 0.0, 2.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.705078125, -3.580657958984375, -3.45623779296875, -3.331817626953125, -3.2073974609375, -3.082977294921875, -2.95855712890625, -2.834136962890625, -2.709716796875, -2.585296630859375, -2.46087646484375, -2.336456298828125, -2.2120361328125, -2.087615966796875, -1.96319580078125, -1.838775634765625, -1.71435546875, -1.589935302734375, -1.46551513671875, -1.341094970703125, -1.2166748046875, -1.092254638671875, -0.96783447265625, -0.843414306640625, -0.718994140625, -0.594573974609375, -0.47015380859375, -0.345733642578125, -0.2213134765625, -0.096893310546875, 0.02752685546875, 0.151947021484375, 0.2763671875, 0.400787353515625, 0.52520751953125, 0.649627685546875, 0.7740478515625, 0.898468017578125, 1.02288818359375, 1.147308349609375, 1.271728515625, 1.396148681640625, 1.52056884765625, 1.644989013671875, 1.7694091796875, 1.893829345703125, 2.01824951171875, 2.142669677734375, 2.26708984375, 2.391510009765625, 2.51593017578125, 2.640350341796875, 2.7647705078125, 2.889190673828125, 3.01361083984375, 3.138031005859375, 3.262451171875, 3.386871337890625, 3.51129150390625, 3.635711669921875, 3.7601318359375, 3.884552001953125, 4.00897216796875, 4.133392333984375, 4.2578125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 2.0, 5.0, 5.0, 3.0, 6.0, 12.0, 7.0, 12.0, 18.0, 18.0, 21.0, 23.0, 17.0, 38.0, 40.0, 43.0, 53.0, 71.0, 68.0, 81.0, 75.0, 66.0, 69.0, 40.0, 26.0, 25.0, 31.0, 23.0, 20.0, 14.0, 11.0, 9.0, 9.0, 9.0, 4.0, 8.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-6.57421875, -6.37762451171875, -6.1810302734375, -5.98443603515625, -5.787841796875, -5.59124755859375, -5.3946533203125, -5.19805908203125, -5.00146484375, -4.80487060546875, -4.6082763671875, -4.41168212890625, -4.215087890625, -4.01849365234375, -3.8218994140625, -3.62530517578125, -3.4287109375, -3.23211669921875, -3.0355224609375, -2.83892822265625, -2.642333984375, -2.44573974609375, -2.2491455078125, -2.05255126953125, -1.85595703125, -1.65936279296875, -1.4627685546875, -1.26617431640625, -1.069580078125, -0.87298583984375, -0.6763916015625, -0.47979736328125, -0.283203125, -0.08660888671875, 0.1099853515625, 0.30657958984375, 0.503173828125, 0.69976806640625, 0.8963623046875, 1.09295654296875, 1.28955078125, 1.48614501953125, 1.6827392578125, 1.87933349609375, 2.075927734375, 2.27252197265625, 2.4691162109375, 2.66571044921875, 2.8623046875, 3.05889892578125, 3.2554931640625, 3.45208740234375, 3.648681640625, 3.84527587890625, 4.0418701171875, 4.23846435546875, 4.43505859375, 4.63165283203125, 4.8282470703125, 5.02484130859375, 5.221435546875, 5.41802978515625, 5.6146240234375, 5.81121826171875, 6.0078125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 7.0, 7.0, 14.0, 11.0, 15.0, 21.0, 42.0, 35.0, 68.0, 112.0, 229.0, 509.0, 1237.0, 3977.0, 16976.0, 213844.0, 782966.0, 21086.0, 4735.0, 1453.0, 560.0, 268.0, 143.0, 70.0, 54.0, 32.0, 25.0, 20.0, 12.0, 4.0, 6.0, 5.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0361328125, -1.002777099609375, -0.96942138671875, -0.936065673828125, -0.9027099609375, -0.869354248046875, -0.83599853515625, -0.802642822265625, -0.769287109375, -0.735931396484375, -0.70257568359375, -0.669219970703125, -0.6358642578125, -0.602508544921875, -0.56915283203125, -0.535797119140625, -0.50244140625, -0.469085693359375, -0.43572998046875, -0.402374267578125, -0.3690185546875, -0.335662841796875, -0.30230712890625, -0.268951416015625, -0.235595703125, -0.202239990234375, -0.16888427734375, -0.135528564453125, -0.1021728515625, -0.068817138671875, -0.03546142578125, -0.002105712890625, 0.03125, 0.064605712890625, 0.09796142578125, 0.131317138671875, 0.1646728515625, 0.198028564453125, 0.23138427734375, 0.264739990234375, 0.298095703125, 0.331451416015625, 0.36480712890625, 0.398162841796875, 0.4315185546875, 0.464874267578125, 0.49822998046875, 0.531585693359375, 0.56494140625, 0.598297119140625, 0.63165283203125, 0.665008544921875, 0.6983642578125, 0.731719970703125, 0.76507568359375, 0.798431396484375, 0.831787109375, 0.865142822265625, 0.89849853515625, 0.931854248046875, 0.9652099609375, 0.998565673828125, 1.03192138671875, 1.065277099609375, 1.0986328125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 8.0, 2.0, 12.0, 10.0, 15.0, 19.0, 21.0, 18.0, 25.0, 33.0, 55.0, 51.0, 83.0, 113.0, 122.0, 107.0, 75.0, 53.0, 41.0, 39.0, 19.0, 20.0, 17.0, 13.0, 6.0, 8.0, 5.0, 6.0, 5.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020813941955566406, -0.00019996985793113708, -0.0001918002963066101, -0.00018363073468208313, -0.00017546117305755615, -0.00016729161143302917, -0.0001591220498085022, -0.00015095248818397522, -0.00014278292655944824, -0.00013461336493492126, -0.0001264438033103943, -0.00011827424168586731, -0.00011010468006134033, -0.00010193511843681335, -9.376555681228638e-05, -8.55959951877594e-05, -7.742643356323242e-05, -6.925687193870544e-05, -6.108731031417847e-05, -5.291774868965149e-05, -4.474818706512451e-05, -3.6578625440597534e-05, -2.8409063816070557e-05, -2.023950219154358e-05, -1.2069940567016602e-05, -3.900378942489624e-06, 4.2691826820373535e-06, 1.2438744306564331e-05, 2.060830593109131e-05, 2.8777867555618286e-05, 3.6947429180145264e-05, 4.511699080467224e-05, 5.328655242919922e-05, 6.14561140537262e-05, 6.962567567825317e-05, 7.779523730278015e-05, 8.596479892730713e-05, 9.41343605518341e-05, 0.00010230392217636108, 0.00011047348380088806, 0.00011864304542541504, 0.00012681260704994202, 0.000134982168674469, 0.00014315173029899597, 0.00015132129192352295, 0.00015949085354804993, 0.0001676604151725769, 0.00017582997679710388, 0.00018399953842163086, 0.00019216910004615784, 0.00020033866167068481, 0.0002085082232952118, 0.00021667778491973877, 0.00022484734654426575, 0.00023301690816879272, 0.0002411864697933197, 0.0002493560314178467, 0.00025752559304237366, 0.00026569515466690063, 0.0002738647162914276, 0.0002820342779159546, 0.00029020383954048157, 0.00029837340116500854, 0.0003065429627895355, 0.0003147125244140625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 9.0, 5.0, 6.0, 17.0, 12.0, 24.0, 25.0, 49.0, 53.0, 102.0, 136.0, 226.0, 409.0, 708.0, 1345.0, 2573.0, 5770.0, 14595.0, 47265.0, 720204.0, 197146.0, 36023.0, 11936.0, 4849.0, 2230.0, 1198.0, 626.0, 370.0, 231.0, 123.0, 85.0, 61.0, 48.0, 28.0, 17.0, 10.0, 16.0, 8.0, 8.0, 4.0, 2.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.5751953125, -0.559173583984375, -0.54315185546875, -0.527130126953125, -0.5111083984375, -0.495086669921875, -0.47906494140625, -0.463043212890625, -0.447021484375, -0.430999755859375, -0.41497802734375, -0.398956298828125, -0.3829345703125, -0.366912841796875, -0.35089111328125, -0.334869384765625, -0.31884765625, -0.302825927734375, -0.28680419921875, -0.270782470703125, -0.2547607421875, -0.238739013671875, -0.22271728515625, -0.206695556640625, -0.190673828125, -0.174652099609375, -0.15863037109375, -0.142608642578125, -0.1265869140625, -0.110565185546875, -0.09454345703125, -0.078521728515625, -0.0625, -0.046478271484375, -0.03045654296875, -0.014434814453125, 0.0015869140625, 0.017608642578125, 0.03363037109375, 0.049652099609375, 0.065673828125, 0.081695556640625, 0.09771728515625, 0.113739013671875, 0.1297607421875, 0.145782470703125, 0.16180419921875, 0.177825927734375, 0.19384765625, 0.209869384765625, 0.22589111328125, 0.241912841796875, 0.2579345703125, 0.273956298828125, 0.28997802734375, 0.305999755859375, 0.322021484375, 0.338043212890625, 0.35406494140625, 0.370086669921875, 0.3861083984375, 0.402130126953125, 0.41815185546875, 0.434173583984375, 0.4501953125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 5.0, 6.0, 4.0, 4.0, 13.0, 13.0, 6.0, 16.0, 18.0, 24.0, 27.0, 33.0, 46.0, 75.0, 79.0, 92.0, 120.0, 100.0, 80.0, 50.0, 41.0, 22.0, 32.0, 20.0, 11.0, 6.0, 11.0, 10.0, 6.0, 7.0, 6.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61474609375, -0.592041015625, -0.5693359375, -0.546630859375, -0.52392578125, -0.501220703125, -0.478515625, -0.455810546875, -0.43310546875, -0.410400390625, -0.3876953125, -0.364990234375, -0.34228515625, -0.319580078125, -0.296875, -0.274169921875, -0.25146484375, -0.228759765625, -0.2060546875, -0.183349609375, -0.16064453125, -0.137939453125, -0.115234375, -0.092529296875, -0.06982421875, -0.047119140625, -0.0244140625, -0.001708984375, 0.02099609375, 0.043701171875, 0.06640625, 0.089111328125, 0.11181640625, 0.134521484375, 0.1572265625, 0.179931640625, 0.20263671875, 0.225341796875, 0.248046875, 0.270751953125, 0.29345703125, 0.316162109375, 0.3388671875, 0.361572265625, 0.38427734375, 0.406982421875, 0.4296875, 0.452392578125, 0.47509765625, 0.497802734375, 0.5205078125, 0.543212890625, 0.56591796875, 0.588623046875, 0.611328125, 0.634033203125, 0.65673828125, 0.679443359375, 0.7021484375, 0.724853515625, 0.74755859375, 0.770263671875, 0.79296875, 0.815673828125, 0.83837890625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 11.0, 25.0, 62.0, 177.0, 559.0, 109.0, 30.0, 15.0, 4.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.57852172851562, -81.91183471679688, -80.24514770507812, -78.57846069335938, -76.91177368164062, -75.24508666992188, -73.57839965820312, -71.91171264648438, -70.24502563476562, -68.57833862304688, -66.91165161132812, -65.24496459960938, -63.578277587890625, -61.911590576171875, -60.244903564453125, -58.578216552734375, -56.911529541015625, -55.244842529296875, -53.578155517578125, -51.911468505859375, -50.244781494140625, -48.578094482421875, -46.911407470703125, -45.244720458984375, -43.578033447265625, -41.911346435546875, -40.244659423828125, -38.577972412109375, -36.911285400390625, -35.244598388671875, -33.577911376953125, -31.911224365234375, -30.24454116821289, -28.57785415649414, -26.91116714477539, -25.24448013305664, -23.57779312133789, -21.91110610961914, -20.24441909790039, -18.57773208618164, -16.91104507446289, -15.24435806274414, -13.57767105102539, -11.91098403930664, -10.24429702758789, -8.57761001586914, -6.910923004150391, -5.244235992431641, -3.5775489807128906, -1.9108619689941406, -0.24417495727539062, 1.4225120544433594, 3.0891990661621094, 4.755886077880859, 6.422573089599609, 8.08926010131836, 9.75594711303711, 11.42263412475586, 13.08932113647461, 14.75600814819336, 16.42269515991211, 18.08938217163086, 19.75606918334961, 21.42275619506836, 23.08944320678711]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 6.0, 7.0, 8.0, 12.0, 19.0, 25.0, 34.0, 31.0, 46.0, 55.0, 293.0, 246.0, 56.0, 31.0, 32.0, 27.0, 29.0, 9.0, 13.0, 7.0, 3.0, 7.0, 2.0, 3.0, 4.0, 1.0], "bins": [-45.40498733520508, -44.4771842956543, -43.549381256103516, -42.62157440185547, -41.69377136230469, -40.765968322753906, -39.838165283203125, -38.91035842895508, -37.9825553894043, -37.054752349853516, -36.126949310302734, -35.19914245605469, -34.271339416503906, -33.343536376953125, -32.415733337402344, -31.48792839050293, -30.560123443603516, -29.632320404052734, -28.70451545715332, -27.77671241760254, -26.848907470703125, -25.921104431152344, -24.99329948425293, -24.06549644470215, -23.137693405151367, -22.209890365600586, -21.282085418701172, -20.35428237915039, -19.426477432250977, -18.498674392700195, -17.57086944580078, -16.64306640625, -15.715262413024902, -14.787458419799805, -13.859654426574707, -12.93185043334961, -12.004046440124512, -11.076242446899414, -10.148439407348633, -9.220634460449219, -8.292831420898438, -7.36502742767334, -6.437223434448242, -5.5094194412231445, -4.581615447998047, -3.6538119316101074, -2.7260079383850098, -1.798203945159912, -0.8703994750976562, 0.05740445852279663, 0.9852083921432495, 1.9130122661590576, 2.8408162593841553, 3.768620014190674, 4.6964240074157715, 5.624228000640869, 6.552031993865967, 7.4798359870910645, 8.407639503479004, 9.335443496704102, 10.2632474899292, 11.191051483154297, 12.118855476379395, 13.046659469604492, 13.97446346282959]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 2.0, 3.0, 6.0, 15.0, 7.0, 24.0, 37.0, 24.0, 39.0, 61.0, 108.0, 268.0, 102.0, 56.0, 32.0, 41.0, 36.0, 30.0, 30.0, 25.0, 13.0, 8.0, 7.0, 9.0, 10.0, 3.0, 5.0, 2.0, 4.0], "bins": [-3.013671875, -2.948638916015625, -2.88360595703125, -2.818572998046875, -2.7535400390625, -2.688507080078125, -2.62347412109375, -2.558441162109375, -2.493408203125, -2.428375244140625, -2.36334228515625, -2.298309326171875, -2.2332763671875, -2.168243408203125, -2.10321044921875, -2.038177490234375, -1.97314453125, -1.908111572265625, -1.84307861328125, -1.778045654296875, -1.7130126953125, -1.647979736328125, -1.58294677734375, -1.517913818359375, -1.452880859375, -1.387847900390625, -1.32281494140625, -1.257781982421875, -1.1927490234375, -1.127716064453125, -1.06268310546875, -0.997650146484375, -0.9326171875, -0.867584228515625, -0.80255126953125, -0.737518310546875, -0.6724853515625, -0.607452392578125, -0.54241943359375, -0.477386474609375, -0.412353515625, -0.347320556640625, -0.28228759765625, -0.217254638671875, -0.1522216796875, -0.087188720703125, -0.02215576171875, 0.042877197265625, 0.10791015625, 0.172943115234375, 0.23797607421875, 0.303009033203125, 0.3680419921875, 0.433074951171875, 0.49810791015625, 0.563140869140625, 0.628173828125, 0.693206787109375, 0.75823974609375, 0.823272705078125, 0.8883056640625, 0.953338623046875, 1.01837158203125, 1.083404541015625, 1.1484375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 5.0, 6.0, 7.0, 8.0, 11.0, 23.0, 50.0, 68.0, 248.0, 2456.0, 8376211.0, 8791.0, 452.0, 109.0, 42.0, 16.0, 22.0, 6.0, 3.0, 9.0, 14.0, 10.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0], "bins": [-40.45846939086914, -39.047237396240234, -37.63600158691406, -36.224769592285156, -34.813533782958984, -33.40230178833008, -31.99106788635254, -30.579833984375, -29.16860008239746, -27.757366180419922, -26.346132278442383, -24.934898376464844, -23.523666381835938, -22.112430572509766, -20.70119857788086, -19.28996467590332, -17.87873077392578, -16.467496871948242, -15.056262969970703, -13.64503002166748, -12.233796119689941, -10.822562217712402, -9.41132926940918, -8.00009536743164, -6.588861465454102, -5.1776275634765625, -3.7663941383361816, -2.355160713195801, -0.9439268112182617, 0.46730709075927734, 1.8785400390625, 3.289773941040039, 4.701007843017578, 6.112241744995117, 7.523475170135498, 8.934708595275879, 10.345942497253418, 11.757176399230957, 13.16840934753418, 14.579643249511719, 15.990877151489258, 17.402111053466797, 18.813344955444336, 20.224578857421875, 21.63581085205078, 23.047046661376953, 24.45827865600586, 25.8695125579834, 27.280746459960938, 28.691980361938477, 30.103214263916016, 31.514446258544922, 32.925682067871094, 34.3369140625, 35.748146057128906, 37.15938186645508, 38.57061767578125, 39.981849670410156, 41.39308547973633, 42.804317474365234, 44.215553283691406, 45.62678527832031, 47.03801727294922, 48.44925308227539, 49.8604850769043]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 3.0, 1.0, 4.0, 3.0, 4.0, 5.0, 5.0, 4.0, 6.0, 6.0, 3.0, 5.0, 3.0, 2.0, 5.0, 6.0, 3.0, 6.0, 2.0, 2.0, 1.0, 5.0, 2.0, 3.0, 3.0, 2.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-12.431917190551758, -11.959487915039062, -11.487058639526367, -11.014630317687988, -10.542201042175293, -10.069771766662598, -9.597343444824219, -9.124914169311523, -8.652484893798828, -8.180055618286133, -7.707626819610596, -7.235198020935059, -6.762768745422363, -6.290339469909668, -5.817910671234131, -5.345481872558594, -4.873052597045898, -4.400623321533203, -3.928194522857666, -3.45576548576355, -2.9833364486694336, -2.5109074115753174, -2.038478374481201, -1.566049337387085, -1.0936203002929688, -0.6211912631988525, -0.14876222610473633, 0.3236668109893799, 0.7960958480834961, 1.2685248851776123, 1.7409539222717285, 2.2133829593658447, 2.685811996459961, 3.158241033554077, 3.6306700706481934, 4.1030988693237305, 4.575528144836426, 5.047957420349121, 5.520386219024658, 5.992815017700195, 6.465244293212891, 6.937673568725586, 7.410102367401123, 7.88253116607666, 8.354960441589355, 8.82738971710205, 9.29981803894043, 9.772247314453125, 10.24467658996582, 10.717105865478516, 11.189535140991211, 11.66196346282959, 12.134392738342285, 12.60682201385498, 13.07925033569336, 13.551679611206055, 14.02410888671875, 14.496538162231445, 14.96896743774414, 15.44139575958252, 15.913825035095215, 16.386253356933594, 16.85868263244629, 17.331111907958984, 17.80354118347168]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 5.0, 5.0, 9.0, 13.0, 18.0, 23.0, 36.0, 28.0, 54.0, 62.0, 89.0, 133.0, 220.0, 447.0, 840.0, 2266.0, 7084.0, 26956.0, 117617.0, 259832.0, 81846.0, 18758.0, 4956.0, 1514.0, 578.0, 308.0, 191.0, 102.0, 78.0, 54.0, 36.0, 26.0, 23.0, 10.0, 14.0, 10.0, 14.0, 5.0, 2.0, 0.0, 4.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.515625, -17.00634765625, -16.4970703125, -15.98779296875, -15.478515625, -14.96923828125, -14.4599609375, -13.95068359375, -13.44140625, -12.93212890625, -12.4228515625, -11.91357421875, -11.404296875, -10.89501953125, -10.3857421875, -9.87646484375, -9.3671875, -8.85791015625, -8.3486328125, -7.83935546875, -7.330078125, -6.82080078125, -6.3115234375, -5.80224609375, -5.29296875, -4.78369140625, -4.2744140625, -3.76513671875, -3.255859375, -2.74658203125, -2.2373046875, -1.72802734375, -1.21875, -0.70947265625, -0.2001953125, 0.30908203125, 0.818359375, 1.32763671875, 1.8369140625, 2.34619140625, 2.85546875, 3.36474609375, 3.8740234375, 4.38330078125, 4.892578125, 5.40185546875, 5.9111328125, 6.42041015625, 6.9296875, 7.43896484375, 7.9482421875, 8.45751953125, 8.966796875, 9.47607421875, 9.9853515625, 10.49462890625, 11.00390625, 11.51318359375, 12.0224609375, 12.53173828125, 13.041015625, 13.55029296875, 14.0595703125, 14.56884765625, 15.078125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 3.0, 4.0, 1.0, 5.0, 9.0, 15.0, 6.0, 21.0, 36.0, 67.0, 92.0, 131.0, 143.0, 128.0, 122.0, 90.0, 49.0, 33.0, 24.0, 18.0, 3.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.806640625, -3.680450439453125, -3.55426025390625, -3.428070068359375, -3.3018798828125, -3.175689697265625, -3.04949951171875, -2.923309326171875, -2.797119140625, -2.670928955078125, -2.54473876953125, -2.418548583984375, -2.2923583984375, -2.166168212890625, -2.03997802734375, -1.913787841796875, -1.78759765625, -1.661407470703125, -1.53521728515625, -1.409027099609375, -1.2828369140625, -1.156646728515625, -1.03045654296875, -0.904266357421875, -0.778076171875, -0.651885986328125, -0.52569580078125, -0.399505615234375, -0.2733154296875, -0.147125244140625, -0.02093505859375, 0.105255126953125, 0.2314453125, 0.357635498046875, 0.48382568359375, 0.610015869140625, 0.7362060546875, 0.862396240234375, 0.98858642578125, 1.114776611328125, 1.240966796875, 1.367156982421875, 1.49334716796875, 1.619537353515625, 1.7457275390625, 1.871917724609375, 1.99810791015625, 2.124298095703125, 2.25048828125, 2.376678466796875, 2.50286865234375, 2.629058837890625, 2.7552490234375, 2.881439208984375, 3.00762939453125, 3.133819580078125, 3.260009765625, 3.386199951171875, 3.51239013671875, 3.638580322265625, 3.7647705078125, 3.890960693359375, 4.01715087890625, 4.143341064453125, 4.26953125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 10.0, 21.0, 47.0, 124.0, 187.0, 44.0, 26.0, 12.0, 10.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.013225555419922, -10.16330623626709, -9.313387870788574, -8.463468551635742, -7.61354923248291, -6.763630390167236, -5.9137115478515625, -5.0637922286987305, -4.213873386383057, -3.3639543056488037, -2.514035224914551, -1.664116382598877, -0.814197301864624, 0.035721778869628906, 0.8856406211853027, 1.7355599403381348, 2.5854787826538086, 3.4353978633880615, 4.2853169441223145, 5.135235786437988, 5.98515510559082, 6.835073947906494, 7.684992790222168, 8.534912109375, 9.384830474853516, 10.234749794006348, 11.084668159484863, 11.934587478637695, 12.784506797790527, 13.63442611694336, 14.484344482421875, 15.334263801574707, 16.18418312072754, 17.034101486206055, 17.884021759033203, 18.73394012451172, 19.583858489990234, 20.433778762817383, 21.2836971282959, 22.133617401123047, 22.983535766601562, 23.833454132080078, 24.683374404907227, 25.533292770385742, 26.383211135864258, 27.233131408691406, 28.083049774169922, 28.932968139648438, 29.782886505126953, 30.63280487060547, 31.482725143432617, 32.3326416015625, 33.18256378173828, 34.0324821472168, 34.88240051269531, 35.73231887817383, 36.58224105834961, 37.432159423828125, 38.28207778930664, 39.131996154785156, 39.98191833496094, 40.83183670043945, 41.68175506591797, 42.531673431396484, 43.381591796875]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 0.0, 0.0, 3.0, 2.0, 7.0, 2.0, 16.0, 14.0, 25.0, 29.0, 56.0, 63.0, 72.0, 65.0, 42.0, 24.0, 16.0, 7.0, 5.0, 5.0, 7.0, 6.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.436331748962402, -9.130949020385742, -8.825565338134766, -8.520182609558105, -8.214799880981445, -7.909416675567627, -7.604033470153809, -7.298650741577148, -6.99326753616333, -6.687884330749512, -6.382501602172852, -6.077118396759033, -5.771735191345215, -5.466352462768555, -5.160969257354736, -4.855586051940918, -4.550203323364258, -4.2448201179504395, -3.9394373893737793, -3.634054183959961, -3.3286712169647217, -3.0232882499694824, -2.717905044555664, -2.412522077560425, -2.1071391105651855, -1.8017561435699463, -1.4963730573654175, -1.1909899711608887, -0.8856070041656494, -0.5802240371704102, -0.27484095096588135, 0.03054213523864746, 0.3359241485595703, 0.6413071751594543, 0.9466902017593384, 1.2520732879638672, 1.5574562549591064, 1.8628392219543457, 2.168222427368164, 2.4736053943634033, 2.7789883613586426, 3.084371328353882, 3.389754295349121, 3.6951375007629395, 4.000520706176758, 4.305903434753418, 4.611286640167236, 4.916669845581055, 5.222052574157715, 5.527435779571533, 5.832818508148193, 6.138201713562012, 6.443584442138672, 6.74896764755249, 7.054350852966309, 7.359733581542969, 7.665116786956787, 7.9704999923706055, 8.275882720947266, 8.581265449523926, 8.886649131774902, 9.192031860351562, 9.497414588928223, 9.8027982711792, 10.10818099975586]}, "eval/loss": 4.166304588317871, "eval/wer": 1.918524395081317, "eval/runtime": 982.6549, "eval/samples_per_second": 2.689, "eval/steps_per_second": 0.337} \ No newline at end of file +{"train/loss": 3.5732, "train/learning_rate": 3.1152647975077883e-08, "train/epoch": 1.0, "train/global_step": 1784, "_runtime": 8667, "_timestamp": 1646049692, "_step": 1787, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 9.0, 346.0, 631.0, 30.0, 2.0, 1.0], "bins": [-641.971923828125, -631.305908203125, -620.639892578125, -609.973876953125, -599.307861328125, -588.641845703125, -577.975830078125, -567.309814453125, -556.643798828125, -545.977783203125, -535.311767578125, -524.645751953125, -513.979736328125, -503.313720703125, -492.647705078125, -481.981689453125, -471.315673828125, -460.649658203125, -449.983642578125, -439.317626953125, -428.651611328125, -417.985595703125, -407.319580078125, -396.653564453125, -385.987548828125, -375.321533203125, -364.655517578125, -353.989501953125, -343.323486328125, -332.657470703125, -321.991455078125, -311.325439453125, -300.6593933105469, -289.9933776855469, -279.3273620605469, -268.6613464355469, -257.9953308105469, -247.32931518554688, -236.66329956054688, -225.99728393554688, -215.33126831054688, -204.66525268554688, -193.99923706054688, -183.33322143554688, -172.66720581054688, -162.00119018554688, -151.33517456054688, -140.66915893554688, -130.00314331054688, -119.33712768554688, -108.67111206054688, -98.00509643554688, -87.33908081054688, -76.67306518554688, -66.00704956054688, -55.341033935546875, -44.67502212524414, -34.00900650024414, -23.34299087524414, -12.67697525024414, -2.0109596252441406, 8.65505599975586, 19.32107162475586, 29.98708724975586, 40.65310287475586]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 10.0, 8.0, 10.0, 19.0, 21.0, 16.0, 27.0, 24.0, 29.0, 34.0, 38.0, 42.0, 38.0, 39.0, 44.0, 47.0, 51.0, 52.0, 45.0, 44.0, 38.0, 46.0, 33.0, 29.0, 45.0, 18.0, 31.0, 22.0, 13.0, 15.0, 10.0, 20.0, 11.0, 6.0, 4.0, 8.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-75.822509765625, -73.62486267089844, -71.4272232055664, -69.22957611083984, -67.03193664550781, -64.83428955078125, -62.63664627075195, -60.439002990722656, -58.24135971069336, -56.04371643066406, -53.846073150634766, -51.64842987060547, -49.450782775878906, -47.253143310546875, -45.05549621582031, -42.857852935791016, -40.66020965576172, -38.46256637573242, -36.264923095703125, -34.06727981567383, -31.8696346282959, -29.6719913482666, -27.474346160888672, -25.276702880859375, -23.079059600830078, -20.88141632080078, -18.683773040771484, -16.486127853393555, -14.288484573364258, -12.090841293334961, -9.893197059631348, -7.695552825927734, -5.4979095458984375, -3.3002657890319824, -1.1026220321655273, 1.0950217247009277, 3.292665481567383, 5.49030876159668, 7.687952995300293, 9.885597229003906, 12.083240509033203, 14.2808837890625, 16.478527069091797, 18.676172256469727, 20.873815536499023, 23.07145881652832, 25.26910400390625, 27.466747283935547, 29.664390563964844, 31.86203384399414, 34.05967712402344, 36.257320404052734, 38.45496368408203, 40.652610778808594, 42.85025405883789, 45.04789733886719, 47.245540618896484, 49.44318389892578, 51.64082717895508, 53.838470458984375, 56.03611755371094, 58.23375701904297, 60.43140411376953, 62.62904739379883, 64.82669067382812]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 4.0, 8.0, 11.0, 16.0, 21.0, 32.0, 31.0, 38.0, 38.0, 50.0, 49.0, 55.0, 53.0, 54.0, 61.0, 48.0, 71.0, 50.0, 42.0, 49.0, 33.0, 43.0, 48.0, 24.0, 18.0, 14.0, 15.0, 7.0, 8.0, 7.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.375, -8.1734619140625, -7.971923828125, -7.7703857421875, -7.56884765625, -7.3673095703125, -7.165771484375, -6.9642333984375, -6.7626953125, -6.5611572265625, -6.359619140625, -6.1580810546875, -5.95654296875, -5.7550048828125, -5.553466796875, -5.3519287109375, -5.150390625, -4.9488525390625, -4.747314453125, -4.5457763671875, -4.34423828125, -4.1427001953125, -3.941162109375, -3.7396240234375, -3.5380859375, -3.3365478515625, -3.135009765625, -2.9334716796875, -2.73193359375, -2.5303955078125, -2.328857421875, -2.1273193359375, -1.92578125, -1.7242431640625, -1.522705078125, -1.3211669921875, -1.11962890625, -0.9180908203125, -0.716552734375, -0.5150146484375, -0.3134765625, -0.1119384765625, 0.089599609375, 0.2911376953125, 0.49267578125, 0.6942138671875, 0.895751953125, 1.0972900390625, 1.298828125, 1.5003662109375, 1.701904296875, 1.9034423828125, 2.10498046875, 2.3065185546875, 2.508056640625, 2.7095947265625, 2.9111328125, 3.1126708984375, 3.314208984375, 3.5157470703125, 3.71728515625, 3.9188232421875, 4.120361328125, 4.3218994140625, 4.5234375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 2.0, 9.0, 6.0, 10.0, 12.0, 25.0, 27.0, 37.0, 68.0, 93.0, 165.0, 224.0, 442.0, 815.0, 1724.0, 4296.0, 14068.0, 99545.0, 2388338.0, 1594739.0, 70897.0, 11734.0, 3624.0, 1570.0, 781.0, 417.0, 250.0, 135.0, 84.0, 51.0, 38.0, 25.0, 10.0, 11.0, 3.0, 5.0, 3.0, 0.0, 2.0], "bins": [-27.78125, -27.148681640625, -26.51611328125, -25.883544921875, -25.2509765625, -24.618408203125, -23.98583984375, -23.353271484375, -22.720703125, -22.088134765625, -21.45556640625, -20.822998046875, -20.1904296875, -19.557861328125, -18.92529296875, -18.292724609375, -17.66015625, -17.027587890625, -16.39501953125, -15.762451171875, -15.1298828125, -14.497314453125, -13.86474609375, -13.232177734375, -12.599609375, -11.967041015625, -11.33447265625, -10.701904296875, -10.0693359375, -9.436767578125, -8.80419921875, -8.171630859375, -7.5390625, -6.906494140625, -6.27392578125, -5.641357421875, -5.0087890625, -4.376220703125, -3.74365234375, -3.111083984375, -2.478515625, -1.845947265625, -1.21337890625, -0.580810546875, 0.0517578125, 0.684326171875, 1.31689453125, 1.949462890625, 2.58203125, 3.214599609375, 3.84716796875, 4.479736328125, 5.1123046875, 5.744873046875, 6.37744140625, 7.010009765625, 7.642578125, 8.275146484375, 8.90771484375, 9.540283203125, 10.1728515625, 10.805419921875, 11.43798828125, 12.070556640625, 12.703125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 5.0, 7.0, 11.0, 23.0, 24.0, 57.0, 84.0, 139.0, 236.0, 372.0, 679.0, 886.0, 624.0, 364.0, 231.0, 126.0, 80.0, 38.0, 22.0, 20.0, 24.0, 10.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.734375, -22.9287109375, -22.123046875, -21.3173828125, -20.51171875, -19.7060546875, -18.900390625, -18.0947265625, -17.2890625, -16.4833984375, -15.677734375, -14.8720703125, -14.06640625, -13.2607421875, -12.455078125, -11.6494140625, -10.84375, -10.0380859375, -9.232421875, -8.4267578125, -7.62109375, -6.8154296875, -6.009765625, -5.2041015625, -4.3984375, -3.5927734375, -2.787109375, -1.9814453125, -1.17578125, -0.3701171875, 0.435546875, 1.2412109375, 2.046875, 2.8525390625, 3.658203125, 4.4638671875, 5.26953125, 6.0751953125, 6.880859375, 7.6865234375, 8.4921875, 9.2978515625, 10.103515625, 10.9091796875, 11.71484375, 12.5205078125, 13.326171875, 14.1318359375, 14.9375, 15.7431640625, 16.548828125, 17.3544921875, 18.16015625, 18.9658203125, 19.771484375, 20.5771484375, 21.3828125, 22.1884765625, 22.994140625, 23.7998046875, 24.60546875, 25.4111328125, 26.216796875, 27.0224609375, 27.828125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 6.0, 7.0, 16.0, 14.0, 22.0, 40.0, 66.0, 96.0, 225.0, 408.0, 869.0, 2223.0, 22720.0, 4086441.0, 76007.0, 2997.0, 1028.0, 486.0, 245.0, 123.0, 97.0, 56.0, 23.0, 17.0, 15.0, 8.0, 5.0, 5.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.0625, -71.3798828125, -68.697265625, -66.0146484375, -63.33203125, -60.6494140625, -57.966796875, -55.2841796875, -52.6015625, -49.9189453125, -47.236328125, -44.5537109375, -41.87109375, -39.1884765625, -36.505859375, -33.8232421875, -31.140625, -28.4580078125, -25.775390625, -23.0927734375, -20.41015625, -17.7275390625, -15.044921875, -12.3623046875, -9.6796875, -6.9970703125, -4.314453125, -1.6318359375, 1.05078125, 3.7333984375, 6.416015625, 9.0986328125, 11.78125, 14.4638671875, 17.146484375, 19.8291015625, 22.51171875, 25.1943359375, 27.876953125, 30.5595703125, 33.2421875, 35.9248046875, 38.607421875, 41.2900390625, 43.97265625, 46.6552734375, 49.337890625, 52.0205078125, 54.703125, 57.3857421875, 60.068359375, 62.7509765625, 65.43359375, 68.1162109375, 70.798828125, 73.4814453125, 76.1640625, 78.8466796875, 81.529296875, 84.2119140625, 86.89453125, 89.5771484375, 92.259765625, 94.9423828125, 97.625]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 81.0, 553.0, 353.0, 21.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-270.17755126953125, -262.1882629394531, -254.198974609375, -246.20968627929688, -238.22039794921875, -230.23110961914062, -222.2418212890625, -214.25253295898438, -206.26324462890625, -198.27395629882812, -190.28466796875, -182.29537963867188, -174.30609130859375, -166.31680297851562, -158.3275146484375, -150.33822631835938, -142.3489532470703, -134.3596649169922, -126.37037658691406, -118.38108825683594, -110.39179992675781, -102.40251159667969, -94.4132308959961, -86.42394256591797, -78.43465423583984, -70.44536590576172, -62.456077575683594, -54.466793060302734, -46.47750473022461, -38.488216400146484, -30.498931884765625, -22.5096435546875, -14.520339965820312, -6.531052589416504, 1.4582347869873047, 9.447521209716797, 17.436809539794922, 25.426097869873047, 33.415382385253906, 41.40467071533203, 49.393959045410156, 57.38324737548828, 65.3725357055664, 73.36181640625, 81.35110473632812, 89.34039306640625, 97.32968139648438, 105.3189697265625, 113.30825805664062, 121.29754638671875, 129.28683471679688, 137.276123046875, 145.26541137695312, 153.25469970703125, 161.24398803710938, 169.2332763671875, 177.22256469726562, 185.21185302734375, 193.20114135742188, 201.1904296875, 209.17971801757812, 217.16900634765625, 225.15829467773438, 233.1475830078125, 241.13685607910156]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 0.0, 4.0, 3.0, 2.0, 10.0, 9.0, 4.0, 8.0, 8.0, 9.0, 15.0, 16.0, 7.0, 27.0, 25.0, 17.0, 24.0, 28.0, 22.0, 29.0, 36.0, 44.0, 38.0, 38.0, 34.0, 32.0, 49.0, 38.0, 45.0, 48.0, 40.0, 34.0, 32.0, 24.0, 24.0, 18.0, 21.0, 26.0, 16.0, 12.0, 20.0, 11.0, 14.0, 9.0, 8.0, 5.0, 4.0, 9.0, 6.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0], "bins": [-49.61613464355469, -48.13227462768555, -46.64841842651367, -45.16455841064453, -43.68069839477539, -42.19683837890625, -40.712982177734375, -39.229122161865234, -37.745262145996094, -36.26140213012695, -34.77754592895508, -33.29368591308594, -31.809825897216797, -30.32596778869629, -28.84210968017578, -27.35824966430664, -25.874391555786133, -24.390533447265625, -22.906673431396484, -21.422815322875977, -19.938955307006836, -18.455097198486328, -16.971237182617188, -15.48737907409668, -14.003520011901855, -12.519660949707031, -11.035801887512207, -9.551942825317383, -8.068084716796875, -6.584225177764893, -5.100366592407227, -3.6165075302124023, -2.132648468017578, -0.6487895250320435, 0.8350694179534912, 2.3189282417297363, 3.8027873039245605, 5.286646366119385, 6.770504951477051, 8.254364013671875, 9.7382230758667, 11.222082138061523, 12.705941200256348, 14.189800262451172, 15.67365837097168, 17.15751838684082, 18.641376495361328, 20.12523651123047, 21.609094619750977, 23.092952728271484, 24.576812744140625, 26.060670852661133, 27.544530868530273, 29.02838897705078, 30.512248992919922, 31.99610710144043, 33.47996520996094, 34.96382522583008, 36.44768142700195, 37.931541442871094, 39.415401458740234, 40.899261474609375, 42.38311767578125, 43.86697769165039, 45.35083770751953]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 7.0, 5.0, 10.0, 12.0, 17.0, 25.0, 24.0, 32.0, 29.0, 34.0, 53.0, 54.0, 40.0, 52.0, 48.0, 64.0, 45.0, 62.0, 44.0, 41.0, 58.0, 35.0, 41.0, 39.0, 40.0, 27.0, 13.0, 16.0, 17.0, 12.0, 6.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.44921875, -7.24139404296875, -7.0335693359375, -6.82574462890625, -6.617919921875, -6.41009521484375, -6.2022705078125, -5.99444580078125, -5.78662109375, -5.57879638671875, -5.3709716796875, -5.16314697265625, -4.955322265625, -4.74749755859375, -4.5396728515625, -4.33184814453125, -4.1240234375, -3.91619873046875, -3.7083740234375, -3.50054931640625, -3.292724609375, -3.08489990234375, -2.8770751953125, -2.66925048828125, -2.46142578125, -2.25360107421875, -2.0457763671875, -1.83795166015625, -1.630126953125, -1.42230224609375, -1.2144775390625, -1.00665283203125, -0.798828125, -0.59100341796875, -0.3831787109375, -0.17535400390625, 0.032470703125, 0.24029541015625, 0.4481201171875, 0.65594482421875, 0.86376953125, 1.07159423828125, 1.2794189453125, 1.48724365234375, 1.695068359375, 1.90289306640625, 2.1107177734375, 2.31854248046875, 2.5263671875, 2.73419189453125, 2.9420166015625, 3.14984130859375, 3.357666015625, 3.56549072265625, 3.7733154296875, 3.98114013671875, 4.18896484375, 4.39678955078125, 4.6046142578125, 4.81243896484375, 5.020263671875, 5.22808837890625, 5.4359130859375, 5.64373779296875, 5.8515625]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 9.0, 10.0, 16.0, 22.0, 27.0, 41.0, 78.0, 98.0, 160.0, 212.0, 344.0, 494.0, 814.0, 1440.0, 2241.0, 3882.0, 6698.0, 11812.0, 20901.0, 36784.0, 65891.0, 114348.0, 199263.0, 246334.0, 144137.0, 82930.0, 47360.0, 26393.0, 14927.0, 8406.0, 5019.0, 2796.0, 1710.0, 1104.0, 640.0, 434.0, 259.0, 164.0, 142.0, 81.0, 39.0, 29.0, 21.0, 17.0, 14.0, 13.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.85986328125, -0.8323135375976562, -0.8047637939453125, -0.7772140502929688, -0.749664306640625, -0.7221145629882812, -0.6945648193359375, -0.6670150756835938, -0.63946533203125, -0.6119155883789062, -0.5843658447265625, -0.5568161010742188, -0.529266357421875, -0.5017166137695312, -0.4741668701171875, -0.44661712646484375, -0.4190673828125, -0.39151763916015625, -0.3639678955078125, -0.33641815185546875, -0.308868408203125, -0.28131866455078125, -0.2537689208984375, -0.22621917724609375, -0.19866943359375, -0.17111968994140625, -0.1435699462890625, -0.11602020263671875, -0.088470458984375, -0.06092071533203125, -0.0333709716796875, -0.00582122802734375, 0.021728515625, 0.04927825927734375, 0.0768280029296875, 0.10437774658203125, 0.131927490234375, 0.15947723388671875, 0.1870269775390625, 0.21457672119140625, 0.24212646484375, 0.26967620849609375, 0.2972259521484375, 0.32477569580078125, 0.352325439453125, 0.37987518310546875, 0.4074249267578125, 0.43497467041015625, 0.4625244140625, 0.49007415771484375, 0.5176239013671875, 0.5451736450195312, 0.572723388671875, 0.6002731323242188, 0.6278228759765625, 0.6553726196289062, 0.68292236328125, 0.7104721069335938, 0.7380218505859375, 0.7655715942382812, 0.793121337890625, 0.8206710815429688, 0.8482208251953125, 0.8757705688476562, 0.9033203125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 5.0, 5.0, 4.0, 7.0, 5.0, 2.0, 11.0, 7.0, 16.0, 15.0, 13.0, 7.0, 16.0, 20.0, 19.0, 31.0, 23.0, 25.0, 29.0, 27.0, 39.0, 34.0, 46.0, 43.0, 34.0, 1062.0, 40.0, 44.0, 37.0, 30.0, 31.0, 32.0, 26.0, 35.0, 26.0, 21.0, 25.0, 16.0, 18.0, 23.0, 15.0, 14.0, 5.0, 10.0, 7.0, 5.0, 5.0, 7.0, 8.0, 3.0, 1.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-2.92578125, -2.833282470703125, -2.74078369140625, -2.648284912109375, -2.5557861328125, -2.463287353515625, -2.37078857421875, -2.278289794921875, -2.185791015625, -2.093292236328125, -2.00079345703125, -1.908294677734375, -1.8157958984375, -1.723297119140625, -1.63079833984375, -1.538299560546875, -1.44580078125, -1.353302001953125, -1.26080322265625, -1.168304443359375, -1.0758056640625, -0.983306884765625, -0.89080810546875, -0.798309326171875, -0.705810546875, -0.613311767578125, -0.52081298828125, -0.428314208984375, -0.3358154296875, -0.243316650390625, -0.15081787109375, -0.058319091796875, 0.0341796875, 0.126678466796875, 0.21917724609375, 0.311676025390625, 0.4041748046875, 0.496673583984375, 0.58917236328125, 0.681671142578125, 0.774169921875, 0.866668701171875, 0.95916748046875, 1.051666259765625, 1.1441650390625, 1.236663818359375, 1.32916259765625, 1.421661376953125, 1.51416015625, 1.606658935546875, 1.69915771484375, 1.791656494140625, 1.8841552734375, 1.976654052734375, 2.06915283203125, 2.161651611328125, 2.254150390625, 2.346649169921875, 2.43914794921875, 2.531646728515625, 2.6241455078125, 2.716644287109375, 2.80914306640625, 2.901641845703125, 2.994140625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 8.0, 11.0, 12.0, 26.0, 32.0, 55.0, 75.0, 105.0, 198.0, 248.0, 379.0, 566.0, 840.0, 1308.0, 1928.0, 2883.0, 4379.0, 7044.0, 10684.0, 16859.0, 26844.0, 42249.0, 67583.0, 108797.0, 176921.0, 1259102.0, 137087.0, 85135.0, 53181.0, 33406.0, 21081.0, 13297.0, 8725.0, 5455.0, 3610.0, 2356.0, 1571.0, 1032.0, 685.0, 476.0, 294.0, 196.0, 142.0, 101.0, 58.0, 40.0, 23.0, 15.0, 9.0, 16.0, 4.0, 4.0, 2.0, 0.0, 3.0, 1.0], "bins": [-0.66650390625, -0.646453857421875, -0.62640380859375, -0.606353759765625, -0.5863037109375, -0.566253662109375, -0.54620361328125, -0.526153564453125, -0.506103515625, -0.486053466796875, -0.46600341796875, -0.445953369140625, -0.4259033203125, -0.405853271484375, -0.38580322265625, -0.365753173828125, -0.345703125, -0.325653076171875, -0.30560302734375, -0.285552978515625, -0.2655029296875, -0.245452880859375, -0.22540283203125, -0.205352783203125, -0.185302734375, -0.165252685546875, -0.14520263671875, -0.125152587890625, -0.1051025390625, -0.085052490234375, -0.06500244140625, -0.044952392578125, -0.02490234375, -0.004852294921875, 0.01519775390625, 0.035247802734375, 0.0552978515625, 0.075347900390625, 0.09539794921875, 0.115447998046875, 0.135498046875, 0.155548095703125, 0.17559814453125, 0.195648193359375, 0.2156982421875, 0.235748291015625, 0.25579833984375, 0.275848388671875, 0.2958984375, 0.315948486328125, 0.33599853515625, 0.356048583984375, 0.3760986328125, 0.396148681640625, 0.41619873046875, 0.436248779296875, 0.456298828125, 0.476348876953125, 0.49639892578125, 0.516448974609375, 0.5364990234375, 0.556549072265625, 0.57659912109375, 0.596649169921875, 0.61669921875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 5.0, 4.0, 2.0, 4.0, 4.0, 5.0, 12.0, 8.0, 8.0, 16.0, 23.0, 19.0, 27.0, 33.0, 36.0, 41.0, 54.0, 46.0, 49.0, 63.0, 69.0, 63.0, 51.0, 59.0, 31.0, 43.0, 31.0, 39.0, 18.0, 27.0, 21.0, 31.0, 12.0, 10.0, 9.0, 8.0, 8.0, 8.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001129150390625, -0.0010925531387329102, -0.0010559558868408203, -0.0010193586349487305, -0.0009827613830566406, -0.0009461641311645508, -0.0009095668792724609, -0.0008729696273803711, -0.0008363723754882812, -0.0007997751235961914, -0.0007631778717041016, -0.0007265806198120117, -0.0006899833679199219, -0.000653386116027832, -0.0006167888641357422, -0.0005801916122436523, -0.0005435943603515625, -0.0005069971084594727, -0.0004703998565673828, -0.00043380260467529297, -0.0003972053527832031, -0.0003606081008911133, -0.00032401084899902344, -0.0002874135971069336, -0.00025081634521484375, -0.0002142190933227539, -0.00017762184143066406, -0.00014102458953857422, -0.00010442733764648438, -6.783008575439453e-05, -3.123283386230469e-05, 5.364418029785156e-06, 4.1961669921875e-05, 7.855892181396484e-05, 0.00011515617370605469, 0.00015175342559814453, 0.00018835067749023438, 0.00022494792938232422, 0.00026154518127441406, 0.0002981424331665039, 0.00033473968505859375, 0.0003713369369506836, 0.00040793418884277344, 0.0004445314407348633, 0.0004811286926269531, 0.000517725944519043, 0.0005543231964111328, 0.0005909204483032227, 0.0006275177001953125, 0.0006641149520874023, 0.0007007122039794922, 0.000737309455871582, 0.0007739067077636719, 0.0008105039596557617, 0.0008471012115478516, 0.0008836984634399414, 0.0009202957153320312, 0.0009568929672241211, 0.000993490219116211, 0.0010300874710083008, 0.0010666847229003906, 0.0011032819747924805, 0.0011398792266845703, 0.0011764764785766602, 0.00121307373046875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 4.0, 7.0, 11.0, 7.0, 18.0, 20.0, 14.0, 23.0, 27.0, 41.0, 48.0, 68.0, 75.0, 117.0, 129.0, 200.0, 225.0, 287.0, 558.0, 1094.0, 968621.0, 74439.0, 819.0, 463.0, 256.0, 220.0, 149.0, 134.0, 119.0, 85.0, 66.0, 50.0, 35.0, 19.0, 24.0, 19.0, 13.0, 14.0, 4.0, 7.0, 11.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.02197265625, -0.02128291130065918, -0.02059316635131836, -0.01990342140197754, -0.01921367645263672, -0.0185239315032959, -0.017834186553955078, -0.017144441604614258, -0.016454696655273438, -0.015764951705932617, -0.015075206756591797, -0.014385461807250977, -0.013695716857910156, -0.013005971908569336, -0.012316226959228516, -0.011626482009887695, -0.010936737060546875, -0.010246992111206055, -0.009557247161865234, -0.008867502212524414, -0.008177757263183594, -0.0074880123138427734, -0.006798267364501953, -0.006108522415161133, -0.0054187774658203125, -0.004729032516479492, -0.004039287567138672, -0.0033495426177978516, -0.0026597976684570312, -0.001970052719116211, -0.0012803077697753906, -0.0005905628204345703, 9.918212890625e-05, 0.0007889270782470703, 0.0014786720275878906, 0.002168416976928711, 0.0028581619262695312, 0.0035479068756103516, 0.004237651824951172, 0.004927396774291992, 0.0056171417236328125, 0.006306886672973633, 0.006996631622314453, 0.0076863765716552734, 0.008376121520996094, 0.009065866470336914, 0.009755611419677734, 0.010445356369018555, 0.011135101318359375, 0.011824846267700195, 0.012514591217041016, 0.013204336166381836, 0.013894081115722656, 0.014583826065063477, 0.015273571014404297, 0.015963315963745117, 0.016653060913085938, 0.017342805862426758, 0.018032550811767578, 0.0187222957611084, 0.01941204071044922, 0.02010178565979004, 0.02079153060913086, 0.02148127555847168, 0.0221710205078125]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 8.0, 160.0, 786.0, 61.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006038642022758722, -0.0004914011806249619, -0.000378938129870221, -0.0002664750791154802, -0.0001540120574645698, -4.154903581365943e-05, 7.091404404491186e-05, 0.00018337706569582224, 0.0002958400873467326, 0.000408303108997643, 0.0005207661306485534, 0.0006332292105071247, 0.000745692232158035, 0.0008581552538089454, 0.0009706183336675167, 0.001083081355318427, 0.0011955443769693375, 0.0013080073986202478, 0.0014204704202711582, 0.0015329334419220686, 0.001645396463572979, 0.0017578594852238894, 0.0018703226232901216, 0.0019827857613563538, 0.0020952485501766205, 0.002207711571827531, 0.0023201745934784412, 0.0024326376151293516, 0.002545100636780262, 0.0026575636584311724, 0.0027700266800820827, 0.0028824899345636368, 0.0029949527233839035, 0.003107415745034814, 0.0032198787666857243, 0.0033323417883366346, 0.003444804809987545, 0.0035572678316384554, 0.0036697308532893658, 0.00378219410777092, 0.0038946568965911865, 0.0040071201510727406, 0.004119582939893007, 0.004232046194374561, 0.004344508983194828, 0.004456972237676382, 0.004569435026496649, 0.004681898280978203, 0.0047943610697984695, 0.004906824324280024, 0.00501928711310029, 0.005131750367581844, 0.005244213156402111, 0.005356676410883665, 0.005469139199703932, 0.005581602454185486, 0.00569406570866704, 0.005806528963148594, 0.005918991751968861, 0.006031455006450415, 0.006143917795270681, 0.006256381049752235, 0.006368843838572502, 0.006481307093054056, 0.006593769881874323]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 3.0, 5.0, 7.0, 2.0, 5.0, 6.0, 10.0, 19.0, 15.0, 19.0, 20.0, 24.0, 24.0, 33.0, 40.0, 43.0, 44.0, 39.0, 44.0, 46.0, 53.0, 55.0, 47.0, 53.0, 53.0, 34.0, 32.0, 35.0, 23.0, 32.0, 24.0, 19.0, 23.0, 19.0, 19.0, 10.0, 9.0, 8.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005924105644226074, -0.0005711764097213745, -0.0005499422550201416, -0.0005287081003189087, -0.0005074739456176758, -0.00048623979091644287, -0.00046500563621520996, -0.00044377148151397705, -0.00042253732681274414, -0.00040130317211151123, -0.0003800690174102783, -0.0003588348627090454, -0.0003376007080078125, -0.0003163665533065796, -0.0002951323986053467, -0.00027389824390411377, -0.00025266408920288086, -0.00023142993450164795, -0.00021019577980041504, -0.00018896162509918213, -0.00016772747039794922, -0.0001464933156967163, -0.0001252591609954834, -0.00010402500629425049, -8.279085159301758e-05, -6.155669689178467e-05, -4.032254219055176e-05, -1.9088387489318848e-05, 2.1457672119140625e-06, 2.3379921913146973e-05, 4.461407661437988e-05, 6.584823131561279e-05, 8.70823860168457e-05, 0.00010831654071807861, 0.00012955069541931152, 0.00015078485012054443, 0.00017201900482177734, 0.00019325315952301025, 0.00021448731422424316, 0.00023572146892547607, 0.000256955623626709, 0.0002781897783279419, 0.0002994239330291748, 0.0003206580877304077, 0.0003418922424316406, 0.00036312639713287354, 0.00038436055183410645, 0.00040559470653533936, 0.00042682886123657227, 0.0004480630159378052, 0.0004692971706390381, 0.000490531325340271, 0.0005117654800415039, 0.0005329996347427368, 0.0005542337894439697, 0.0005754679441452026, 0.0005967020988464355, 0.0006179362535476685, 0.0006391704082489014, 0.0006604045629501343, 0.0006816387176513672, 0.0007028728723526001, 0.000724107027053833, 0.0007453411817550659, 0.0007665753364562988]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 7.0, 5.0, 10.0, 12.0, 17.0, 25.0, 24.0, 32.0, 29.0, 34.0, 53.0, 54.0, 40.0, 52.0, 48.0, 64.0, 45.0, 62.0, 44.0, 41.0, 58.0, 35.0, 41.0, 39.0, 40.0, 27.0, 13.0, 16.0, 17.0, 12.0, 6.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.44921875, -7.24139404296875, -7.0335693359375, -6.82574462890625, -6.617919921875, -6.41009521484375, -6.2022705078125, -5.99444580078125, -5.78662109375, -5.57879638671875, -5.3709716796875, -5.16314697265625, -4.955322265625, -4.74749755859375, -4.5396728515625, -4.33184814453125, -4.1240234375, -3.91619873046875, -3.7083740234375, -3.50054931640625, -3.292724609375, -3.08489990234375, -2.8770751953125, -2.66925048828125, -2.46142578125, -2.25360107421875, -2.0457763671875, -1.83795166015625, -1.630126953125, -1.42230224609375, -1.2144775390625, -1.00665283203125, -0.798828125, -0.59100341796875, -0.3831787109375, -0.17535400390625, 0.032470703125, 0.24029541015625, 0.4481201171875, 0.65594482421875, 0.86376953125, 1.07159423828125, 1.2794189453125, 1.48724365234375, 1.695068359375, 1.90289306640625, 2.1107177734375, 2.31854248046875, 2.5263671875, 2.73419189453125, 2.9420166015625, 3.14984130859375, 3.357666015625, 3.56549072265625, 3.7733154296875, 3.98114013671875, 4.18896484375, 4.39678955078125, 4.6046142578125, 4.81243896484375, 5.020263671875, 5.22808837890625, 5.4359130859375, 5.64373779296875, 5.8515625]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 3.0, 5.0, 9.0, 9.0, 10.0, 24.0, 35.0, 36.0, 50.0, 85.0, 115.0, 160.0, 244.0, 363.0, 486.0, 791.0, 1204.0, 2002.0, 3282.0, 5929.0, 13351.0, 58343.0, 879129.0, 55084.0, 13095.0, 5950.0, 3223.0, 1927.0, 1235.0, 733.0, 528.0, 341.0, 224.0, 173.0, 114.0, 72.0, 60.0, 33.0, 34.0, 21.0, 16.0, 12.0, 7.0, 8.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.34375, -35.22509765625, -34.1064453125, -32.98779296875, -31.869140625, -30.75048828125, -29.6318359375, -28.51318359375, -27.39453125, -26.27587890625, -25.1572265625, -24.03857421875, -22.919921875, -21.80126953125, -20.6826171875, -19.56396484375, -18.4453125, -17.32666015625, -16.2080078125, -15.08935546875, -13.970703125, -12.85205078125, -11.7333984375, -10.61474609375, -9.49609375, -8.37744140625, -7.2587890625, -6.14013671875, -5.021484375, -3.90283203125, -2.7841796875, -1.66552734375, -0.546875, 0.57177734375, 1.6904296875, 2.80908203125, 3.927734375, 5.04638671875, 6.1650390625, 7.28369140625, 8.40234375, 9.52099609375, 10.6396484375, 11.75830078125, 12.876953125, 13.99560546875, 15.1142578125, 16.23291015625, 17.3515625, 18.47021484375, 19.5888671875, 20.70751953125, 21.826171875, 22.94482421875, 24.0634765625, 25.18212890625, 26.30078125, 27.41943359375, 28.5380859375, 29.65673828125, 30.775390625, 31.89404296875, 33.0126953125, 34.13134765625, 35.25]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 5.0, 5.0, 2.0, 5.0, 8.0, 15.0, 17.0, 14.0, 13.0, 26.0, 26.0, 33.0, 24.0, 41.0, 38.0, 59.0, 50.0, 43.0, 103.0, 299.0, 1620.0, 179.0, 62.0, 51.0, 40.0, 44.0, 39.0, 29.0, 32.0, 20.0, 18.0, 17.0, 22.0, 10.0, 7.0, 14.0, 7.0, 5.0, 0.0, 4.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-20.0625, -19.524169921875, -18.98583984375, -18.447509765625, -17.9091796875, -17.370849609375, -16.83251953125, -16.294189453125, -15.755859375, -15.217529296875, -14.67919921875, -14.140869140625, -13.6025390625, -13.064208984375, -12.52587890625, -11.987548828125, -11.44921875, -10.910888671875, -10.37255859375, -9.834228515625, -9.2958984375, -8.757568359375, -8.21923828125, -7.680908203125, -7.142578125, -6.604248046875, -6.06591796875, -5.527587890625, -4.9892578125, -4.450927734375, -3.91259765625, -3.374267578125, -2.8359375, -2.297607421875, -1.75927734375, -1.220947265625, -0.6826171875, -0.144287109375, 0.39404296875, 0.932373046875, 1.470703125, 2.009033203125, 2.54736328125, 3.085693359375, 3.6240234375, 4.162353515625, 4.70068359375, 5.239013671875, 5.77734375, 6.315673828125, 6.85400390625, 7.392333984375, 7.9306640625, 8.468994140625, 9.00732421875, 9.545654296875, 10.083984375, 10.622314453125, 11.16064453125, 11.698974609375, 12.2373046875, 12.775634765625, 13.31396484375, 13.852294921875, 14.390625]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 9.0, 11.0, 9.0, 12.0, 14.0, 16.0, 18.0, 28.0, 31.0, 27.0, 42.0, 55.0, 59.0, 140.0, 396.0, 2664.0, 3119780.0, 20947.0, 750.0, 229.0, 101.0, 79.0, 56.0, 35.0, 29.0, 29.0, 19.0, 18.0, 21.0, 14.0, 16.0, 15.0, 7.0, 7.0, 3.0, 5.0, 2.0, 4.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.9375, -63.556640625, -61.17578125, -58.794921875, -56.4140625, -54.033203125, -51.65234375, -49.271484375, -46.890625, -44.509765625, -42.12890625, -39.748046875, -37.3671875, -34.986328125, -32.60546875, -30.224609375, -27.84375, -25.462890625, -23.08203125, -20.701171875, -18.3203125, -15.939453125, -13.55859375, -11.177734375, -8.796875, -6.416015625, -4.03515625, -1.654296875, 0.7265625, 3.107421875, 5.48828125, 7.869140625, 10.25, 12.630859375, 15.01171875, 17.392578125, 19.7734375, 22.154296875, 24.53515625, 26.916015625, 29.296875, 31.677734375, 34.05859375, 36.439453125, 38.8203125, 41.201171875, 43.58203125, 45.962890625, 48.34375, 50.724609375, 53.10546875, 55.486328125, 57.8671875, 60.248046875, 62.62890625, 65.009765625, 67.390625, 69.771484375, 72.15234375, 74.533203125, 76.9140625, 79.294921875, 81.67578125, 84.056640625, 86.4375]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 134.0, 874.0, 7.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-236.75433349609375, -229.62741088867188, -222.50048828125, -215.37355041503906, -208.2466278076172, -201.1197052001953, -193.99276733398438, -186.8658447265625, -179.73892211914062, -172.61199951171875, -165.48507690429688, -158.35813903808594, -151.23121643066406, -144.1042938232422, -136.97735595703125, -129.85043334960938, -122.7235107421875, -115.59658813476562, -108.46965789794922, -101.34272766113281, -94.21580505371094, -87.08888244628906, -79.96195220947266, -72.83502197265625, -65.70809936523438, -58.581172943115234, -51.454246520996094, -44.32732009887695, -37.20039367675781, -30.073467254638672, -22.94654083251953, -15.81961441040039, -8.692672729492188, -1.5657463073730469, 5.561180114746094, 12.688106536865234, 19.815032958984375, 26.941959381103516, 34.068885803222656, 41.1958122253418, 48.32273864746094, 55.44966506958008, 62.57659149169922, 69.70352172851562, 76.8304443359375, 83.95736694335938, 91.08429718017578, 98.21122741699219, 105.33815002441406, 112.46507263183594, 119.59200286865234, 126.71893310546875, 133.84585571289062, 140.9727783203125, 148.09970092773438, 155.2266387939453, 162.3535614013672, 169.48048400878906, 176.607421875, 183.73434448242188, 190.86126708984375, 197.98818969726562, 205.1151123046875, 212.24205017089844, 219.3689727783203]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 3.0, 6.0, 17.0, 5.0, 16.0, 10.0, 17.0, 21.0, 20.0, 31.0, 32.0, 16.0, 27.0, 25.0, 26.0, 54.0, 40.0, 53.0, 33.0, 51.0, 33.0, 35.0, 42.0, 40.0, 33.0, 29.0, 52.0, 38.0, 28.0, 26.0, 22.0, 17.0, 19.0, 13.0, 12.0, 9.0, 13.0, 6.0, 5.0, 6.0, 5.0, 8.0, 3.0, 3.0, 2.0, 0.0, 3.0], "bins": [-66.52519226074219, -64.83065032958984, -63.13611602783203, -61.44157409667969, -59.74703598022461, -58.05249786376953, -56.35795593261719, -54.66341781616211, -52.96887969970703, -51.27434158325195, -49.579803466796875, -47.88526153564453, -46.19072341918945, -44.496185302734375, -42.80164337158203, -41.10710525512695, -39.412567138671875, -37.7180290222168, -36.02349090576172, -34.328948974609375, -32.6344108581543, -30.93987274169922, -29.245332717895508, -27.550792694091797, -25.85625457763672, -24.16171646118164, -22.46717643737793, -20.77263641357422, -19.07809829711914, -17.383560180664062, -15.689020156860352, -13.994481086730957, -12.299945831298828, -10.605406761169434, -8.910867691040039, -7.2163286209106445, -5.52178955078125, -3.8272504806518555, -2.132711410522461, -0.4381723403930664, 1.2563667297363281, 2.9509057998657227, 4.645444869995117, 6.339983940124512, 8.034523010253906, 9.7290620803833, 11.423601150512695, 13.11814022064209, 14.812679290771484, 16.507217407226562, 18.201757431030273, 19.896297454833984, 21.590835571289062, 23.28537368774414, 24.97991371154785, 26.674453735351562, 28.36899185180664, 30.06352996826172, 31.75806999206543, 33.45261001586914, 35.14714813232422, 36.8416862487793, 38.536224365234375, 40.23076629638672, 41.9253044128418]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 10.0, 15.0, 11.0, 13.0, 26.0, 20.0, 37.0, 27.0, 41.0, 45.0, 32.0, 55.0, 52.0, 40.0, 45.0, 57.0, 61.0, 49.0, 36.0, 53.0, 35.0, 51.0, 37.0, 27.0, 33.0, 25.0, 19.0, 11.0, 16.0, 11.0, 5.0, 2.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.22265625, -7.01123046875, -6.7998046875, -6.58837890625, -6.376953125, -6.16552734375, -5.9541015625, -5.74267578125, -5.53125, -5.31982421875, -5.1083984375, -4.89697265625, -4.685546875, -4.47412109375, -4.2626953125, -4.05126953125, -3.83984375, -3.62841796875, -3.4169921875, -3.20556640625, -2.994140625, -2.78271484375, -2.5712890625, -2.35986328125, -2.1484375, -1.93701171875, -1.7255859375, -1.51416015625, -1.302734375, -1.09130859375, -0.8798828125, -0.66845703125, -0.45703125, -0.24560546875, -0.0341796875, 0.17724609375, 0.388671875, 0.60009765625, 0.8115234375, 1.02294921875, 1.234375, 1.44580078125, 1.6572265625, 1.86865234375, 2.080078125, 2.29150390625, 2.5029296875, 2.71435546875, 2.92578125, 3.13720703125, 3.3486328125, 3.56005859375, 3.771484375, 3.98291015625, 4.1943359375, 4.40576171875, 4.6171875, 4.82861328125, 5.0400390625, 5.25146484375, 5.462890625, 5.67431640625, 5.8857421875, 6.09716796875, 6.30859375]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 9.0, 11.0, 15.0, 22.0, 32.0, 45.0, 81.0, 132.0, 239.0, 383.0, 819.0, 1857.0, 4844.0, 15047.0, 81848.0, 3400880.0, 640020.0, 33620.0, 8549.0, 3156.0, 1293.0, 598.0, 309.0, 175.0, 107.0, 64.0, 41.0, 27.0, 17.0, 18.0, 5.0, 8.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.3125, -41.095703125, -39.87890625, -38.662109375, -37.4453125, -36.228515625, -35.01171875, -33.794921875, -32.578125, -31.361328125, -30.14453125, -28.927734375, -27.7109375, -26.494140625, -25.27734375, -24.060546875, -22.84375, -21.626953125, -20.41015625, -19.193359375, -17.9765625, -16.759765625, -15.54296875, -14.326171875, -13.109375, -11.892578125, -10.67578125, -9.458984375, -8.2421875, -7.025390625, -5.80859375, -4.591796875, -3.375, -2.158203125, -0.94140625, 0.275390625, 1.4921875, 2.708984375, 3.92578125, 5.142578125, 6.359375, 7.576171875, 8.79296875, 10.009765625, 11.2265625, 12.443359375, 13.66015625, 14.876953125, 16.09375, 17.310546875, 18.52734375, 19.744140625, 20.9609375, 22.177734375, 23.39453125, 24.611328125, 25.828125, 27.044921875, 28.26171875, 29.478515625, 30.6953125, 31.912109375, 33.12890625, 34.345703125, 35.5625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 3.0, 10.0, 11.0, 21.0, 19.0, 40.0, 55.0, 101.0, 160.0, 253.0, 427.0, 704.0, 828.0, 590.0, 332.0, 201.0, 121.0, 64.0, 40.0, 30.0, 29.0, 15.0, 8.0, 4.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-34.25, -33.221435546875, -32.19287109375, -31.164306640625, -30.1357421875, -29.107177734375, -28.07861328125, -27.050048828125, -26.021484375, -24.992919921875, -23.96435546875, -22.935791015625, -21.9072265625, -20.878662109375, -19.85009765625, -18.821533203125, -17.79296875, -16.764404296875, -15.73583984375, -14.707275390625, -13.6787109375, -12.650146484375, -11.62158203125, -10.593017578125, -9.564453125, -8.535888671875, -7.50732421875, -6.478759765625, -5.4501953125, -4.421630859375, -3.39306640625, -2.364501953125, -1.3359375, -0.307373046875, 0.72119140625, 1.749755859375, 2.7783203125, 3.806884765625, 4.83544921875, 5.864013671875, 6.892578125, 7.921142578125, 8.94970703125, 9.978271484375, 11.0068359375, 12.035400390625, 13.06396484375, 14.092529296875, 15.12109375, 16.149658203125, 17.17822265625, 18.206787109375, 19.2353515625, 20.263916015625, 21.29248046875, 22.321044921875, 23.349609375, 24.378173828125, 25.40673828125, 26.435302734375, 27.4638671875, 28.492431640625, 29.52099609375, 30.549560546875, 31.578125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 0.0, 4.0, 8.0, 5.0, 11.0, 18.0, 19.0, 25.0, 51.0, 85.0, 118.0, 208.0, 425.0, 1958.0, 3494723.0, 694082.0, 1523.0, 433.0, 216.0, 133.0, 71.0, 59.0, 23.0, 31.0, 17.0, 15.0, 5.0, 5.0, 2.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.125, -93.845703125, -89.56640625, -85.287109375, -81.0078125, -76.728515625, -72.44921875, -68.169921875, -63.890625, -59.611328125, -55.33203125, -51.052734375, -46.7734375, -42.494140625, -38.21484375, -33.935546875, -29.65625, -25.376953125, -21.09765625, -16.818359375, -12.5390625, -8.259765625, -3.98046875, 0.298828125, 4.578125, 8.857421875, 13.13671875, 17.416015625, 21.6953125, 25.974609375, 30.25390625, 34.533203125, 38.8125, 43.091796875, 47.37109375, 51.650390625, 55.9296875, 60.208984375, 64.48828125, 68.767578125, 73.046875, 77.326171875, 81.60546875, 85.884765625, 90.1640625, 94.443359375, 98.72265625, 103.001953125, 107.28125, 111.560546875, 115.83984375, 120.119140625, 124.3984375, 128.677734375, 132.95703125, 137.236328125, 141.515625, 145.794921875, 150.07421875, 154.353515625, 158.6328125, 162.912109375, 167.19140625, 171.470703125, 175.75]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 82.0, 619.0, 298.0, 12.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-526.989501953125, -517.1840209960938, -507.37847900390625, -497.5729675292969, -487.7674560546875, -477.9619445800781, -468.15643310546875, -458.3509521484375, -448.54541015625, -438.7398986816406, -428.93438720703125, -419.1288757324219, -409.3233642578125, -399.5178527832031, -389.71234130859375, -379.9068603515625, -370.1013488769531, -360.29583740234375, -350.4903259277344, -340.684814453125, -330.8793029785156, -321.07379150390625, -311.2682800292969, -301.4627685546875, -291.65728759765625, -281.8517761230469, -272.0462646484375, -262.2407531738281, -252.43524169921875, -242.62973022460938, -232.82423400878906, -223.0187225341797, -213.2132110595703, -203.40769958496094, -193.60218811035156, -183.7966766357422, -173.99118041992188, -164.1856689453125, -154.38015747070312, -144.57464599609375, -134.76913452148438, -124.963623046875, -115.15811157226562, -105.35260772705078, -95.5470962524414, -85.74158477783203, -75.93608093261719, -66.13056945800781, -56.32505798339844, -46.51954650878906, -36.71403884887695, -26.90852928161621, -17.10301971435547, -7.297508239746094, 2.5079994201660156, 12.313507080078125, 22.1190185546875, 31.924528121948242, 41.730037689208984, 51.535545349121094, 61.34105682373047, 71.14656829833984, 80.95207214355469, 90.75758361816406, 100.56309509277344]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 4.0, 2.0, 5.0, 5.0, 4.0, 5.0, 7.0, 11.0, 22.0, 24.0, 18.0, 30.0, 25.0, 38.0, 40.0, 42.0, 41.0, 45.0, 55.0, 54.0, 46.0, 43.0, 50.0, 53.0, 42.0, 34.0, 43.0, 25.0, 32.0, 20.0, 31.0, 24.0, 21.0, 22.0, 12.0, 7.0, 7.0, 4.0, 10.0, 3.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.2261962890625, -72.79197692871094, -70.35775756835938, -67.92353057861328, -65.48931121826172, -63.055091857910156, -60.620872497558594, -58.18665313720703, -55.7524299621582, -53.31821060180664, -50.88398742675781, -48.44976806640625, -46.01554870605469, -43.58132553100586, -41.1471061706543, -38.71288299560547, -36.278663635253906, -33.844444274902344, -31.410221099853516, -28.976001739501953, -26.541780471801758, -24.107559204101562, -21.67333984375, -19.239118576049805, -16.80489730834961, -14.370676040649414, -11.936455726623535, -9.502235412597656, -7.068014144897461, -4.633792877197266, -2.1995725631713867, 0.2346477508544922, 2.6688613891601562, 5.103082180023193, 7.5373029708862305, 9.97152328491211, 12.405744552612305, 14.8399658203125, 17.274185180664062, 19.708406448364258, 22.142627716064453, 24.57684898376465, 27.011070251464844, 29.445289611816406, 31.8795108795166, 34.3137321472168, 36.74795150756836, 39.18217468261719, 41.61639404296875, 44.05061340332031, 46.48483657836914, 48.9190559387207, 51.35327911376953, 53.787498474121094, 56.221717834472656, 58.65593719482422, 61.09016036987305, 63.52437973022461, 65.95860290527344, 68.392822265625, 70.82704162597656, 73.26126098632812, 75.69548797607422, 78.12970733642578, 80.56392669677734]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 4.0, 16.0, 17.0, 17.0, 23.0, 19.0, 19.0, 27.0, 38.0, 34.0, 41.0, 47.0, 43.0, 43.0, 36.0, 49.0, 52.0, 64.0, 41.0, 48.0, 41.0, 42.0, 36.0, 36.0, 25.0, 34.0, 22.0, 16.0, 16.0, 19.0, 9.0, 7.0, 9.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.21875, -6.01800537109375, -5.8172607421875, -5.61651611328125, -5.415771484375, -5.21502685546875, -5.0142822265625, -4.81353759765625, -4.61279296875, -4.41204833984375, -4.2113037109375, -4.01055908203125, -3.809814453125, -3.60906982421875, -3.4083251953125, -3.20758056640625, -3.0068359375, -2.80609130859375, -2.6053466796875, -2.40460205078125, -2.203857421875, -2.00311279296875, -1.8023681640625, -1.60162353515625, -1.40087890625, -1.20013427734375, -0.9993896484375, -0.79864501953125, -0.597900390625, -0.39715576171875, -0.1964111328125, 0.00433349609375, 0.205078125, 0.40582275390625, 0.6065673828125, 0.80731201171875, 1.008056640625, 1.20880126953125, 1.4095458984375, 1.61029052734375, 1.81103515625, 2.01177978515625, 2.2125244140625, 2.41326904296875, 2.614013671875, 2.81475830078125, 3.0155029296875, 3.21624755859375, 3.4169921875, 3.61773681640625, 3.8184814453125, 4.01922607421875, 4.219970703125, 4.42071533203125, 4.6214599609375, 4.82220458984375, 5.02294921875, 5.22369384765625, 5.4244384765625, 5.62518310546875, 5.825927734375, 6.02667236328125, 6.2274169921875, 6.42816162109375, 6.62890625]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 6.0, 14.0, 11.0, 26.0, 49.0, 61.0, 105.0, 136.0, 232.0, 335.0, 551.0, 846.0, 1300.0, 2074.0, 3348.0, 5380.0, 8925.0, 14475.0, 24006.0, 39963.0, 66798.0, 109409.0, 176064.0, 225560.0, 144446.0, 88432.0, 53493.0, 32439.0, 19450.0, 11754.0, 7115.0, 4385.0, 2761.0, 1677.0, 1039.0, 665.0, 408.0, 253.0, 196.0, 111.0, 67.0, 54.0, 48.0, 24.0, 20.0, 18.0, 10.0, 8.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.85546875, -0.8289718627929688, -0.8024749755859375, -0.7759780883789062, -0.749481201171875, -0.7229843139648438, -0.6964874267578125, -0.6699905395507812, -0.64349365234375, -0.6169967651367188, -0.5904998779296875, -0.5640029907226562, -0.537506103515625, -0.5110092163085938, -0.4845123291015625, -0.45801544189453125, -0.4315185546875, -0.40502166748046875, -0.3785247802734375, -0.35202789306640625, -0.325531005859375, -0.29903411865234375, -0.2725372314453125, -0.24604034423828125, -0.21954345703125, -0.19304656982421875, -0.1665496826171875, -0.14005279541015625, -0.113555908203125, -0.08705902099609375, -0.0605621337890625, -0.03406524658203125, -0.007568359375, 0.01892852783203125, 0.0454254150390625, 0.07192230224609375, 0.098419189453125, 0.12491607666015625, 0.1514129638671875, 0.17790985107421875, 0.20440673828125, 0.23090362548828125, 0.2574005126953125, 0.28389739990234375, 0.310394287109375, 0.33689117431640625, 0.3633880615234375, 0.38988494873046875, 0.4163818359375, 0.44287872314453125, 0.4693756103515625, 0.49587249755859375, 0.522369384765625, 0.5488662719726562, 0.5753631591796875, 0.6018600463867188, 0.62835693359375, 0.6548538208007812, 0.6813507080078125, 0.7078475952148438, 0.734344482421875, 0.7608413696289062, 0.7873382568359375, 0.8138351440429688, 0.84033203125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 7.0, 1.0, 6.0, 3.0, 8.0, 15.0, 7.0, 17.0, 10.0, 14.0, 25.0, 33.0, 34.0, 19.0, 26.0, 34.0, 40.0, 35.0, 39.0, 47.0, 36.0, 1061.0, 51.0, 46.0, 40.0, 45.0, 42.0, 42.0, 32.0, 29.0, 29.0, 18.0, 20.0, 19.0, 23.0, 16.0, 10.0, 15.0, 7.0, 5.0, 6.0, 8.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.576171875, -3.466796875, -3.357421875, -3.248046875, -3.138671875, -3.029296875, -2.919921875, -2.810546875, -2.701171875, -2.591796875, -2.482421875, -2.373046875, -2.263671875, -2.154296875, -2.044921875, -1.935546875, -1.826171875, -1.716796875, -1.607421875, -1.498046875, -1.388671875, -1.279296875, -1.169921875, -1.060546875, -0.951171875, -0.841796875, -0.732421875, -0.623046875, -0.513671875, -0.404296875, -0.294921875, -0.185546875, -0.076171875, 0.033203125, 0.142578125, 0.251953125, 0.361328125, 0.470703125, 0.580078125, 0.689453125, 0.798828125, 0.908203125, 1.017578125, 1.126953125, 1.236328125, 1.345703125, 1.455078125, 1.564453125, 1.673828125, 1.783203125, 1.892578125, 2.001953125, 2.111328125, 2.220703125, 2.330078125, 2.439453125, 2.548828125, 2.658203125, 2.767578125, 2.876953125, 2.986328125, 3.095703125, 3.205078125, 3.314453125, 3.423828125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 1.0, 2.0, 8.0, 6.0, 14.0, 21.0, 32.0, 40.0, 60.0, 104.0, 150.0, 224.0, 330.0, 512.0, 776.0, 1231.0, 1898.0, 2983.0, 4656.0, 7609.0, 11910.0, 19415.0, 31709.0, 51009.0, 83708.0, 133248.0, 1253794.0, 185341.0, 116215.0, 72561.0, 44711.0, 27564.0, 16985.0, 10397.0, 6547.0, 4056.0, 2569.0, 1624.0, 1060.0, 692.0, 474.0, 299.0, 212.0, 136.0, 87.0, 47.0, 40.0, 24.0, 17.0, 18.0, 9.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65576171875, -0.6337966918945312, -0.6118316650390625, -0.5898666381835938, -0.567901611328125, -0.5459365844726562, -0.5239715576171875, -0.5020065307617188, -0.48004150390625, -0.45807647705078125, -0.4361114501953125, -0.41414642333984375, -0.392181396484375, -0.37021636962890625, -0.3482513427734375, -0.32628631591796875, -0.3043212890625, -0.28235626220703125, -0.2603912353515625, -0.23842620849609375, -0.216461181640625, -0.19449615478515625, -0.1725311279296875, -0.15056610107421875, -0.12860107421875, -0.10663604736328125, -0.0846710205078125, -0.06270599365234375, -0.040740966796875, -0.01877593994140625, 0.0031890869140625, 0.02515411376953125, 0.047119140625, 0.06908416748046875, 0.0910491943359375, 0.11301422119140625, 0.134979248046875, 0.15694427490234375, 0.1789093017578125, 0.20087432861328125, 0.22283935546875, 0.24480438232421875, 0.2667694091796875, 0.28873443603515625, 0.310699462890625, 0.33266448974609375, 0.3546295166015625, 0.37659454345703125, 0.3985595703125, 0.42052459716796875, 0.4424896240234375, 0.46445465087890625, 0.486419677734375, 0.5083847045898438, 0.5303497314453125, 0.5523147583007812, 0.57427978515625, 0.5962448120117188, 0.6182098388671875, 0.6401748657226562, 0.662139892578125, 0.6841049194335938, 0.7060699462890625, 0.7280349731445312, 0.75]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 2.0, 8.0, 8.0, 9.0, 17.0, 14.0, 25.0, 18.0, 33.0, 46.0, 50.0, 73.0, 59.0, 70.0, 85.0, 88.0, 79.0, 60.0, 51.0, 45.0, 36.0, 27.0, 17.0, 11.0, 19.0, 11.0, 11.0, 6.0, 6.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0014743804931640625, -0.001429229974746704, -0.0013840794563293457, -0.0013389289379119873, -0.001293778419494629, -0.0012486279010772705, -0.0012034773826599121, -0.0011583268642425537, -0.0011131763458251953, -0.001068025827407837, -0.0010228753089904785, -0.0009777247905731201, -0.0009325742721557617, -0.0008874237537384033, -0.0008422732353210449, -0.0007971227169036865, -0.0007519721984863281, -0.0007068216800689697, -0.0006616711616516113, -0.0006165206432342529, -0.0005713701248168945, -0.0005262196063995361, -0.00048106908798217773, -0.00043591856956481934, -0.00039076805114746094, -0.00034561753273010254, -0.00030046701431274414, -0.00025531649589538574, -0.00021016597747802734, -0.00016501545906066895, -0.00011986494064331055, -7.471442222595215e-05, -2.956390380859375e-05, 1.558661460876465e-05, 6.073713302612305e-05, 0.00010588765144348145, 0.00015103816986083984, 0.00019618868827819824, 0.00024133920669555664, 0.00028648972511291504, 0.00033164024353027344, 0.00037679076194763184, 0.00042194128036499023, 0.00046709179878234863, 0.000512242317199707, 0.0005573928356170654, 0.0006025433540344238, 0.0006476938724517822, 0.0006928443908691406, 0.000737994909286499, 0.0007831454277038574, 0.0008282959461212158, 0.0008734464645385742, 0.0009185969829559326, 0.000963747501373291, 0.0010088980197906494, 0.0010540485382080078, 0.0010991990566253662, 0.0011443495750427246, 0.001189500093460083, 0.0012346506118774414, 0.0012798011302947998, 0.0013249516487121582, 0.0013701021671295166, 0.001415252685546875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 6.0, 7.0, 12.0, 20.0, 14.0, 19.0, 22.0, 34.0, 43.0, 48.0, 69.0, 123.0, 164.0, 181.0, 264.0, 642.0, 8181.0, 1034501.0, 2754.0, 499.0, 268.0, 199.0, 116.0, 86.0, 74.0, 47.0, 35.0, 23.0, 14.0, 17.0, 12.0, 12.0, 18.0, 7.0, 6.0, 1.0, 6.0, 3.0, 5.0, 4.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.025634765625, -0.024762630462646484, -0.02389049530029297, -0.023018360137939453, -0.022146224975585938, -0.021274089813232422, -0.020401954650878906, -0.01952981948852539, -0.018657684326171875, -0.01778554916381836, -0.016913414001464844, -0.016041278839111328, -0.015169143676757812, -0.014297008514404297, -0.013424873352050781, -0.012552738189697266, -0.01168060302734375, -0.010808467864990234, -0.009936332702636719, -0.009064197540283203, -0.008192062377929688, -0.007319927215576172, -0.006447792053222656, -0.005575656890869141, -0.004703521728515625, -0.0038313865661621094, -0.0029592514038085938, -0.002087116241455078, -0.0012149810791015625, -0.0003428459167480469, 0.0005292892456054688, 0.0014014244079589844, 0.0022735595703125, 0.0031456947326660156, 0.004017829895019531, 0.004889965057373047, 0.0057621002197265625, 0.006634235382080078, 0.007506370544433594, 0.00837850570678711, 0.009250640869140625, 0.01012277603149414, 0.010994911193847656, 0.011867046356201172, 0.012739181518554688, 0.013611316680908203, 0.014483451843261719, 0.015355587005615234, 0.01622772216796875, 0.017099857330322266, 0.01797199249267578, 0.018844127655029297, 0.019716262817382812, 0.020588397979736328, 0.021460533142089844, 0.02233266830444336, 0.023204803466796875, 0.02407693862915039, 0.024949073791503906, 0.025821208953857422, 0.026693344116210938, 0.027565479278564453, 0.02843761444091797, 0.029309749603271484, 0.030181884765625]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 47.0, 370.0, 497.0, 81.0, 15.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0035810621920973063, -0.0034896391443908215, -0.0033982160966843367, -0.003306793048977852, -0.0032153702341020107, -0.003123947186395526, -0.003032524138689041, -0.0029411010909825563, -0.0028496780432760715, -0.0027582549955695868, -0.002666831947863102, -0.002575408900156617, -0.0024839858524501324, -0.0023925630375742912, -0.0023011399898678064, -0.0022097169421613216, -0.002118293894454837, -0.002026870846748352, -0.0019354477990418673, -0.0018440248677507043, -0.0017526018200442195, -0.0016611787723377347, -0.0015697558410465717, -0.001478332793340087, -0.0013869097456336021, -0.0012954866979271173, -0.0012040636502206326, -0.0011126407189294696, -0.0010212176712229848, -0.0009297946235165, -0.0008383716340176761, -0.0007469486445188522, -0.0006555255968123674, -0.0005641025491058826, -0.00047267955960705876, -0.0003812565410044044, -0.0002898335224017501, -0.00019841050379909575, -0.00010698748519644141, -1.556449569761753e-05, 7.585855200886726e-05, 0.0001672815706115216, 0.00025870458921417594, 0.0003501276078168303, 0.0004415506264194846, 0.0005329736741259694, 0.0006243966636247933, 0.0007158196531236172, 0.000807242700830102, 0.0008986657485365868, 0.0009900887962430716, 0.0010815117275342345, 0.0011729347752407193, 0.0012643578229472041, 0.001355780754238367, 0.0014472038019448519, 0.0015386268496513367, 0.0016300498973578215, 0.0017214729450643063, 0.0018128958763554692, 0.001904318924061954, 0.001995741855353117, 0.002087164903059602, 0.0021785879507660866, 0.0022700109984725714]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 2.0, 5.0, 6.0, 4.0, 12.0, 9.0, 11.0, 17.0, 18.0, 22.0, 22.0, 41.0, 27.0, 26.0, 21.0, 39.0, 29.0, 40.0, 38.0, 45.0, 46.0, 47.0, 53.0, 49.0, 40.0, 29.0, 37.0, 24.0, 34.0, 37.0, 24.0, 22.0, 21.0, 15.0, 21.0, 10.0, 12.0, 9.0, 9.0, 6.0, 11.0, 5.0, 3.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0005835890769958496, -0.0005641374737024307, -0.0005446858704090118, -0.000525234267115593, -0.0005057826638221741, -0.0004863310605287552, -0.0004668794572353363, -0.0004474278539419174, -0.00042797625064849854, -0.00040852464735507965, -0.00038907304406166077, -0.0003696214407682419, -0.000350169837474823, -0.0003307182341814041, -0.00031126663088798523, -0.00029181502759456635, -0.00027236342430114746, -0.0002529118210077286, -0.0002334602177143097, -0.0002140086144208908, -0.00019455701112747192, -0.00017510540783405304, -0.00015565380454063416, -0.00013620220124721527, -0.00011675059795379639, -9.72989946603775e-05, -7.784739136695862e-05, -5.8395788073539734e-05, -3.894418478012085e-05, -1.9492581486701965e-05, -4.0978193283081055e-08, 1.9410625100135803e-05, 3.886222839355469e-05, 5.831383168697357e-05, 7.776543498039246e-05, 9.721703827381134e-05, 0.00011666864156723022, 0.0001361202448606491, 0.000155571848154068, 0.00017502345144748688, 0.00019447505474090576, 0.00021392665803432465, 0.00023337826132774353, 0.0002528298646211624, 0.0002722814679145813, 0.0002917330712080002, 0.00031118467450141907, 0.00033063627779483795, 0.00035008788108825684, 0.0003695394843816757, 0.0003889910876750946, 0.0004084426909685135, 0.0004278942942619324, 0.00044734589755535126, 0.00046679750084877014, 0.000486249104142189, 0.0005057007074356079, 0.0005251523107290268, 0.0005446039140224457, 0.0005640555173158646, 0.0005835071206092834, 0.0006029587239027023, 0.0006224103271961212, 0.0006418619304895401, 0.000661313533782959]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 4.0, 16.0, 17.0, 17.0, 23.0, 19.0, 19.0, 27.0, 38.0, 34.0, 41.0, 47.0, 43.0, 43.0, 36.0, 49.0, 52.0, 64.0, 41.0, 48.0, 41.0, 42.0, 36.0, 36.0, 25.0, 34.0, 22.0, 16.0, 16.0, 19.0, 9.0, 7.0, 9.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.21875, -6.01800537109375, -5.8172607421875, -5.61651611328125, -5.415771484375, -5.21502685546875, -5.0142822265625, -4.81353759765625, -4.61279296875, -4.41204833984375, -4.2113037109375, -4.01055908203125, -3.809814453125, -3.60906982421875, -3.4083251953125, -3.20758056640625, -3.0068359375, -2.80609130859375, -2.6053466796875, -2.40460205078125, -2.203857421875, -2.00311279296875, -1.8023681640625, -1.60162353515625, -1.40087890625, -1.20013427734375, -0.9993896484375, -0.79864501953125, -0.597900390625, -0.39715576171875, -0.1964111328125, 0.00433349609375, 0.205078125, 0.40582275390625, 0.6065673828125, 0.80731201171875, 1.008056640625, 1.20880126953125, 1.4095458984375, 1.61029052734375, 1.81103515625, 2.01177978515625, 2.2125244140625, 2.41326904296875, 2.614013671875, 2.81475830078125, 3.0155029296875, 3.21624755859375, 3.4169921875, 3.61773681640625, 3.8184814453125, 4.01922607421875, 4.219970703125, 4.42071533203125, 4.6214599609375, 4.82220458984375, 5.02294921875, 5.22369384765625, 5.4244384765625, 5.62518310546875, 5.825927734375, 6.02667236328125, 6.2274169921875, 6.42816162109375, 6.62890625]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 3.0, 8.0, 13.0, 10.0, 22.0, 32.0, 47.0, 61.0, 85.0, 132.0, 197.0, 293.0, 442.0, 809.0, 1523.0, 3349.0, 9449.0, 33706.0, 160917.0, 589902.0, 190129.0, 39143.0, 10620.0, 3719.0, 1649.0, 835.0, 518.0, 293.0, 203.0, 138.0, 101.0, 70.0, 46.0, 24.0, 20.0, 19.0, 8.0, 8.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.28515625, -6.0859375, -5.88671875, -5.6875, -5.48828125, -5.2890625, -5.08984375, -4.890625, -4.69140625, -4.4921875, -4.29296875, -4.09375, -3.89453125, -3.6953125, -3.49609375, -3.296875, -3.09765625, -2.8984375, -2.69921875, -2.5, -2.30078125, -2.1015625, -1.90234375, -1.703125, -1.50390625, -1.3046875, -1.10546875, -0.90625, -0.70703125, -0.5078125, -0.30859375, -0.109375, 0.08984375, 0.2890625, 0.48828125, 0.6875, 0.88671875, 1.0859375, 1.28515625, 1.484375, 1.68359375, 1.8828125, 2.08203125, 2.28125, 2.48046875, 2.6796875, 2.87890625, 3.078125, 3.27734375, 3.4765625, 3.67578125, 3.875, 4.07421875, 4.2734375, 4.47265625, 4.671875, 4.87109375, 5.0703125, 5.26953125, 5.46875, 5.66796875, 5.8671875, 6.06640625, 6.265625, 6.46484375]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 5.0, 5.0, 2.0, 9.0, 9.0, 4.0, 14.0, 13.0, 21.0, 18.0, 18.0, 26.0, 40.0, 29.0, 45.0, 48.0, 47.0, 51.0, 64.0, 354.0, 1728.0, 91.0, 63.0, 40.0, 23.0, 52.0, 41.0, 34.0, 25.0, 26.0, 18.0, 16.0, 18.0, 16.0, 9.0, 6.0, 7.0, 8.0, 3.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.890625, -22.219970703125, -21.54931640625, -20.878662109375, -20.2080078125, -19.537353515625, -18.86669921875, -18.196044921875, -17.525390625, -16.854736328125, -16.18408203125, -15.513427734375, -14.8427734375, -14.172119140625, -13.50146484375, -12.830810546875, -12.16015625, -11.489501953125, -10.81884765625, -10.148193359375, -9.4775390625, -8.806884765625, -8.13623046875, -7.465576171875, -6.794921875, -6.124267578125, -5.45361328125, -4.782958984375, -4.1123046875, -3.441650390625, -2.77099609375, -2.100341796875, -1.4296875, -0.759033203125, -0.08837890625, 0.582275390625, 1.2529296875, 1.923583984375, 2.59423828125, 3.264892578125, 3.935546875, 4.606201171875, 5.27685546875, 5.947509765625, 6.6181640625, 7.288818359375, 7.95947265625, 8.630126953125, 9.30078125, 9.971435546875, 10.64208984375, 11.312744140625, 11.9833984375, 12.654052734375, 13.32470703125, 13.995361328125, 14.666015625, 15.336669921875, 16.00732421875, 16.677978515625, 17.3486328125, 18.019287109375, 18.68994140625, 19.360595703125, 20.03125]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 9.0, 5.0, 8.0, 7.0, 13.0, 14.0, 15.0, 12.0, 20.0, 24.0, 22.0, 48.0, 50.0, 74.0, 68.0, 127.0, 356.0, 1040.0, 47212.0, 3092069.0, 3242.0, 563.0, 218.0, 108.0, 81.0, 64.0, 40.0, 40.0, 28.0, 23.0, 20.0, 16.0, 12.0, 17.0, 8.0, 5.0, 6.0, 6.0, 5.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-43.6875, -42.24365234375, -40.7998046875, -39.35595703125, -37.912109375, -36.46826171875, -35.0244140625, -33.58056640625, -32.13671875, -30.69287109375, -29.2490234375, -27.80517578125, -26.361328125, -24.91748046875, -23.4736328125, -22.02978515625, -20.5859375, -19.14208984375, -17.6982421875, -16.25439453125, -14.810546875, -13.36669921875, -11.9228515625, -10.47900390625, -9.03515625, -7.59130859375, -6.1474609375, -4.70361328125, -3.259765625, -1.81591796875, -0.3720703125, 1.07177734375, 2.515625, 3.95947265625, 5.4033203125, 6.84716796875, 8.291015625, 9.73486328125, 11.1787109375, 12.62255859375, 14.06640625, 15.51025390625, 16.9541015625, 18.39794921875, 19.841796875, 21.28564453125, 22.7294921875, 24.17333984375, 25.6171875, 27.06103515625, 28.5048828125, 29.94873046875, 31.392578125, 32.83642578125, 34.2802734375, 35.72412109375, 37.16796875, 38.61181640625, 40.0556640625, 41.49951171875, 42.943359375, 44.38720703125, 45.8310546875, 47.27490234375, 48.71875]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 27.0, 778.0, 207.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.676727294921875, -34.175716400146484, -30.674705505371094, -27.17369270324707, -23.67268180847168, -20.17167091369629, -16.670658111572266, -13.169647216796875, -9.668636322021484, -6.1676249504089355, -2.6666135787963867, 0.8343982696533203, 4.335409164428711, 7.836420059204102, 11.337432861328125, 14.838443756103516, 18.339454650878906, 21.840465545654297, 25.341476440429688, 28.84248924255371, 32.34349822998047, 35.844512939453125, 39.345523834228516, 42.846534729003906, 46.3475456237793, 49.84855651855469, 53.34956741333008, 56.85057830810547, 60.351593017578125, 63.85260009765625, 67.3536148071289, 70.85462951660156, 74.35563659667969, 77.85665130615234, 81.35765838623047, 84.85867309570312, 88.35968017578125, 91.8606948852539, 95.36170959472656, 98.86271667480469, 102.36372375488281, 105.86473846435547, 109.3657455444336, 112.86676025390625, 116.36776733398438, 119.86878204345703, 123.36979675292969, 126.87080383300781, 130.371826171875, 133.87283325195312, 137.3738555908203, 140.87486267089844, 144.37586975097656, 147.8768768310547, 151.37789916992188, 154.87890625, 158.37991333007812, 161.88092041015625, 165.38194274902344, 168.88294982910156, 172.3839569091797, 175.8849639892578, 179.385986328125, 182.88699340820312, 186.38800048828125]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 6.0, 8.0, 9.0, 7.0, 16.0, 19.0, 18.0, 19.0, 27.0, 25.0, 38.0, 44.0, 38.0, 41.0, 46.0, 54.0, 30.0, 51.0, 53.0, 47.0, 39.0, 52.0, 50.0, 28.0, 40.0, 36.0, 37.0, 21.0, 18.0, 16.0, 12.0, 18.0, 9.0, 3.0, 8.0, 5.0, 5.0, 5.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.67066955566406, -55.525943756103516, -53.38121795654297, -51.23649215698242, -49.091766357421875, -46.94703674316406, -44.802310943603516, -42.65758514404297, -40.51285934448242, -38.368133544921875, -36.22340774536133, -34.07868194580078, -31.9339542388916, -29.789228439331055, -27.644500732421875, -25.499774932861328, -23.35504913330078, -21.210323333740234, -19.065597534179688, -16.920869827270508, -14.776144027709961, -12.631418228149414, -10.48669147491455, -8.341964721679688, -6.197238922119141, -4.0525126457214355, -1.9077863693237305, 0.2369399070739746, 2.3816661834716797, 4.526391983032227, 6.67111873626709, 8.815845489501953, 10.9605712890625, 13.105297088623047, 15.25002384185791, 17.394750595092773, 19.53947639465332, 21.684202194213867, 23.828929901123047, 25.973655700683594, 28.11838150024414, 30.263107299804688, 32.407833099365234, 34.55255889892578, 36.697288513183594, 38.842010498046875, 40.98674011230469, 43.131465911865234, 45.27619171142578, 47.42091751098633, 49.565643310546875, 51.71036911010742, 53.85509490966797, 55.99982452392578, 58.14455032348633, 60.289276123046875, 62.43400192260742, 64.57872772216797, 66.72345733642578, 68.86817932128906, 71.01290893554688, 73.15763092041016, 75.30236053466797, 77.44708251953125, 79.59181213378906]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 4.0, 8.0, 18.0, 13.0, 17.0, 22.0, 21.0, 20.0, 25.0, 33.0, 48.0, 30.0, 49.0, 45.0, 40.0, 38.0, 52.0, 62.0, 44.0, 46.0, 43.0, 55.0, 34.0, 42.0, 31.0, 29.0, 27.0, 27.0, 13.0, 13.0, 17.0, 9.0, 11.0, 8.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.11328125, -5.90863037109375, -5.7039794921875, -5.49932861328125, -5.294677734375, -5.09002685546875, -4.8853759765625, -4.68072509765625, -4.47607421875, -4.27142333984375, -4.0667724609375, -3.86212158203125, -3.657470703125, -3.45281982421875, -3.2481689453125, -3.04351806640625, -2.8388671875, -2.63421630859375, -2.4295654296875, -2.22491455078125, -2.020263671875, -1.81561279296875, -1.6109619140625, -1.40631103515625, -1.20166015625, -0.99700927734375, -0.7923583984375, -0.58770751953125, -0.383056640625, -0.17840576171875, 0.0262451171875, 0.23089599609375, 0.435546875, 0.64019775390625, 0.8448486328125, 1.04949951171875, 1.254150390625, 1.45880126953125, 1.6634521484375, 1.86810302734375, 2.07275390625, 2.27740478515625, 2.4820556640625, 2.68670654296875, 2.891357421875, 3.09600830078125, 3.3006591796875, 3.50531005859375, 3.7099609375, 3.91461181640625, 4.1192626953125, 4.32391357421875, 4.528564453125, 4.73321533203125, 4.9378662109375, 5.14251708984375, 5.34716796875, 5.55181884765625, 5.7564697265625, 5.96112060546875, 6.165771484375, 6.37042236328125, 6.5750732421875, 6.77972412109375, 6.984375]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 3.0, 8.0, 13.0, 5.0, 15.0, 22.0, 25.0, 37.0, 41.0, 65.0, 100.0, 141.0, 274.0, 667.0, 2686.0, 21747.0, 643685.0, 3342953.0, 169786.0, 9406.0, 1518.0, 476.0, 212.0, 121.0, 73.0, 47.0, 30.0, 35.0, 27.0, 19.0, 10.0, 9.0, 7.0, 6.0, 4.0, 5.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.4375, -24.696533203125, -23.95556640625, -23.214599609375, -22.4736328125, -21.732666015625, -20.99169921875, -20.250732421875, -19.509765625, -18.768798828125, -18.02783203125, -17.286865234375, -16.5458984375, -15.804931640625, -15.06396484375, -14.322998046875, -13.58203125, -12.841064453125, -12.10009765625, -11.359130859375, -10.6181640625, -9.877197265625, -9.13623046875, -8.395263671875, -7.654296875, -6.913330078125, -6.17236328125, -5.431396484375, -4.6904296875, -3.949462890625, -3.20849609375, -2.467529296875, -1.7265625, -0.985595703125, -0.24462890625, 0.496337890625, 1.2373046875, 1.978271484375, 2.71923828125, 3.460205078125, 4.201171875, 4.942138671875, 5.68310546875, 6.424072265625, 7.1650390625, 7.906005859375, 8.64697265625, 9.387939453125, 10.12890625, 10.869873046875, 11.61083984375, 12.351806640625, 13.0927734375, 13.833740234375, 14.57470703125, 15.315673828125, 16.056640625, 16.797607421875, 17.53857421875, 18.279541015625, 19.0205078125, 19.761474609375, 20.50244140625, 21.243408203125, 21.984375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 10.0, 7.0, 14.0, 25.0, 32.0, 53.0, 89.0, 115.0, 180.0, 268.0, 407.0, 607.0, 660.0, 523.0, 354.0, 265.0, 156.0, 95.0, 75.0, 47.0, 32.0, 17.0, 15.0, 12.0, 8.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.34375, -24.560546875, -23.77734375, -22.994140625, -22.2109375, -21.427734375, -20.64453125, -19.861328125, -19.078125, -18.294921875, -17.51171875, -16.728515625, -15.9453125, -15.162109375, -14.37890625, -13.595703125, -12.8125, -12.029296875, -11.24609375, -10.462890625, -9.6796875, -8.896484375, -8.11328125, -7.330078125, -6.546875, -5.763671875, -4.98046875, -4.197265625, -3.4140625, -2.630859375, -1.84765625, -1.064453125, -0.28125, 0.501953125, 1.28515625, 2.068359375, 2.8515625, 3.634765625, 4.41796875, 5.201171875, 5.984375, 6.767578125, 7.55078125, 8.333984375, 9.1171875, 9.900390625, 10.68359375, 11.466796875, 12.25, 13.033203125, 13.81640625, 14.599609375, 15.3828125, 16.166015625, 16.94921875, 17.732421875, 18.515625, 19.298828125, 20.08203125, 20.865234375, 21.6484375, 22.431640625, 23.21484375, 23.998046875, 24.78125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 8.0, 7.0, 12.0, 10.0, 31.0, 52.0, 77.0, 122.0, 208.0, 359.0, 780.0, 4845.0, 1651574.0, 2528988.0, 5417.0, 868.0, 365.0, 207.0, 121.0, 75.0, 53.0, 36.0, 22.0, 14.0, 12.0, 7.0, 4.0, 0.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.25, -56.6767578125, -54.103515625, -51.5302734375, -48.95703125, -46.3837890625, -43.810546875, -41.2373046875, -38.6640625, -36.0908203125, -33.517578125, -30.9443359375, -28.37109375, -25.7978515625, -23.224609375, -20.6513671875, -18.078125, -15.5048828125, -12.931640625, -10.3583984375, -7.78515625, -5.2119140625, -2.638671875, -0.0654296875, 2.5078125, 5.0810546875, 7.654296875, 10.2275390625, 12.80078125, 15.3740234375, 17.947265625, 20.5205078125, 23.09375, 25.6669921875, 28.240234375, 30.8134765625, 33.38671875, 35.9599609375, 38.533203125, 41.1064453125, 43.6796875, 46.2529296875, 48.826171875, 51.3994140625, 53.97265625, 56.5458984375, 59.119140625, 61.6923828125, 64.265625, 66.8388671875, 69.412109375, 71.9853515625, 74.55859375, 77.1318359375, 79.705078125, 82.2783203125, 84.8515625, 87.4248046875, 89.998046875, 92.5712890625, 95.14453125, 97.7177734375, 100.291015625, 102.8642578125, 105.4375]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 106.0, 490.0, 356.0, 59.0, 5.0], "bins": [-534.0560302734375, -525.2754516601562, -516.494873046875, -507.71429443359375, -498.9337158203125, -490.15313720703125, -481.37255859375, -472.5919494628906, -463.8113708496094, -455.0307922363281, -446.2502136230469, -437.4696350097656, -428.6890563964844, -419.908447265625, -411.12786865234375, -402.3472900390625, -393.56671142578125, -384.7861328125, -376.00555419921875, -367.2249755859375, -358.44439697265625, -349.663818359375, -340.88323974609375, -332.1026306152344, -323.32208251953125, -314.54150390625, -305.76092529296875, -296.9803466796875, -288.19976806640625, -279.419189453125, -270.63861083984375, -261.8580017089844, -253.0774383544922, -244.29685974121094, -235.5162811279297, -226.73568725585938, -217.95510864257812, -209.17453002929688, -200.39395141601562, -191.61337280273438, -182.83277893066406, -174.0522003173828, -165.27162170410156, -156.49102783203125, -147.71044921875, -138.92987060546875, -130.1492919921875, -121.36871337890625, -112.58812713623047, -103.80754852294922, -95.02696228027344, -86.24638366699219, -77.46580505371094, -68.68521881103516, -59.904640197753906, -51.12405776977539, -42.343475341796875, -33.56289291381836, -24.782312393188477, -16.001731872558594, -7.221149444580078, 1.5594329833984375, 10.340011596679688, 19.120594024658203, 27.901174545288086]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 6.0, 2.0, 4.0, 3.0, 3.0, 8.0, 14.0, 8.0, 8.0, 17.0, 18.0, 27.0, 20.0, 37.0, 24.0, 37.0, 33.0, 17.0, 32.0, 38.0, 27.0, 46.0, 34.0, 41.0, 41.0, 28.0, 35.0, 41.0, 48.0, 38.0, 26.0, 26.0, 29.0, 24.0, 26.0, 16.0, 20.0, 15.0, 10.0, 11.0, 17.0, 6.0, 7.0, 10.0, 6.0, 10.0, 4.0, 6.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-62.429046630859375, -60.59641647338867, -58.76378631591797, -56.93115997314453, -55.09852981567383, -53.265899658203125, -51.43326950073242, -49.60063934326172, -47.76801300048828, -45.93538284301758, -44.102752685546875, -42.27012634277344, -40.437496185302734, -38.60486602783203, -36.77223587036133, -34.939605712890625, -33.10697555541992, -31.27434539794922, -29.44171714782715, -27.609086990356445, -25.776458740234375, -23.943828582763672, -22.11119842529297, -20.278568267822266, -18.445940017700195, -16.613309860229492, -14.780681610107422, -12.948051452636719, -11.115422248840332, -9.282793045043945, -7.450162887573242, -5.6175336837768555, -3.7849044799804688, -1.952275037765503, -0.11964559555053711, 1.7129840850830078, 3.5456132888793945, 5.378242492675781, 7.210872650146484, 9.043501853942871, 10.876131057739258, 12.708760261535645, 14.541389465332031, 16.374019622802734, 18.206649780273438, 20.039278030395508, 21.87190818786621, 23.70453643798828, 25.537166595458984, 27.369796752929688, 29.202425003051758, 31.03505516052246, 32.86768341064453, 34.700313568115234, 36.53294372558594, 38.36557388305664, 40.198204040527344, 42.03083419799805, 43.86346435546875, 45.69609069824219, 47.52872085571289, 49.361351013183594, 51.1939811706543, 53.026611328125, 54.85923767089844]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 8.0, 14.0, 10.0, 9.0, 17.0, 10.0, 25.0, 24.0, 27.0, 27.0, 30.0, 32.0, 32.0, 44.0, 43.0, 46.0, 49.0, 45.0, 44.0, 46.0, 57.0, 42.0, 37.0, 49.0, 37.0, 32.0, 34.0, 23.0, 20.0, 23.0, 14.0, 14.0, 8.0, 9.0, 11.0, 6.0, 1.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.953125, -5.7542724609375, -5.555419921875, -5.3565673828125, -5.15771484375, -4.9588623046875, -4.760009765625, -4.5611572265625, -4.3623046875, -4.1634521484375, -3.964599609375, -3.7657470703125, -3.56689453125, -3.3680419921875, -3.169189453125, -2.9703369140625, -2.771484375, -2.5726318359375, -2.373779296875, -2.1749267578125, -1.97607421875, -1.7772216796875, -1.578369140625, -1.3795166015625, -1.1806640625, -0.9818115234375, -0.782958984375, -0.5841064453125, -0.38525390625, -0.1864013671875, 0.012451171875, 0.2113037109375, 0.41015625, 0.6090087890625, 0.807861328125, 1.0067138671875, 1.20556640625, 1.4044189453125, 1.603271484375, 1.8021240234375, 2.0009765625, 2.1998291015625, 2.398681640625, 2.5975341796875, 2.79638671875, 2.9952392578125, 3.194091796875, 3.3929443359375, 3.591796875, 3.7906494140625, 3.989501953125, 4.1883544921875, 4.38720703125, 4.5860595703125, 4.784912109375, 4.9837646484375, 5.1826171875, 5.3814697265625, 5.580322265625, 5.7791748046875, 5.97802734375, 6.1768798828125, 6.375732421875, 6.5745849609375, 6.7734375]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 10.0, 6.0, 7.0, 11.0, 31.0, 31.0, 53.0, 73.0, 128.0, 187.0, 308.0, 481.0, 718.0, 1219.0, 1949.0, 3326.0, 5491.0, 8985.0, 15255.0, 25142.0, 42550.0, 71816.0, 120532.0, 192259.0, 215563.0, 137405.0, 83017.0, 49137.0, 29052.0, 17386.0, 10431.0, 6310.0, 3739.0, 2252.0, 1402.0, 861.0, 544.0, 289.0, 209.0, 128.0, 96.0, 49.0, 42.0, 35.0, 11.0, 17.0, 8.0, 5.0, 3.0, 4.0, 1.0, 2.0], "bins": [-1.0087890625, -0.9808731079101562, -0.9529571533203125, -0.9250411987304688, -0.897125244140625, -0.8692092895507812, -0.8412933349609375, -0.8133773803710938, -0.78546142578125, -0.7575454711914062, -0.7296295166015625, -0.7017135620117188, -0.673797607421875, -0.6458816528320312, -0.6179656982421875, -0.5900497436523438, -0.5621337890625, -0.5342178344726562, -0.5063018798828125, -0.47838592529296875, -0.450469970703125, -0.42255401611328125, -0.3946380615234375, -0.36672210693359375, -0.33880615234375, -0.31089019775390625, -0.2829742431640625, -0.25505828857421875, -0.227142333984375, -0.19922637939453125, -0.1713104248046875, -0.14339447021484375, -0.115478515625, -0.08756256103515625, -0.0596466064453125, -0.03173065185546875, -0.003814697265625, 0.02410125732421875, 0.0520172119140625, 0.07993316650390625, 0.10784912109375, 0.13576507568359375, 0.1636810302734375, 0.19159698486328125, 0.219512939453125, 0.24742889404296875, 0.2753448486328125, 0.30326080322265625, 0.3311767578125, 0.35909271240234375, 0.3870086669921875, 0.41492462158203125, 0.442840576171875, 0.47075653076171875, 0.4986724853515625, 0.5265884399414062, 0.55450439453125, 0.5824203491210938, 0.6103363037109375, 0.6382522583007812, 0.666168212890625, 0.6940841674804688, 0.7220001220703125, 0.7499160766601562, 0.77783203125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 4.0, 2.0, 5.0, 7.0, 13.0, 14.0, 16.0, 22.0, 27.0, 18.0, 27.0, 29.0, 29.0, 33.0, 36.0, 46.0, 42.0, 53.0, 44.0, 45.0, 1068.0, 33.0, 40.0, 32.0, 32.0, 26.0, 31.0, 30.0, 28.0, 34.0, 29.0, 29.0, 20.0, 16.0, 14.0, 10.0, 10.0, 10.0, 4.0, 6.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.908203125, -3.791839599609375, -3.67547607421875, -3.559112548828125, -3.4427490234375, -3.326385498046875, -3.21002197265625, -3.093658447265625, -2.977294921875, -2.860931396484375, -2.74456787109375, -2.628204345703125, -2.5118408203125, -2.395477294921875, -2.27911376953125, -2.162750244140625, -2.04638671875, -1.930023193359375, -1.81365966796875, -1.697296142578125, -1.5809326171875, -1.464569091796875, -1.34820556640625, -1.231842041015625, -1.115478515625, -0.999114990234375, -0.88275146484375, -0.766387939453125, -0.6500244140625, -0.533660888671875, -0.41729736328125, -0.300933837890625, -0.1845703125, -0.068206787109375, 0.04815673828125, 0.164520263671875, 0.2808837890625, 0.397247314453125, 0.51361083984375, 0.629974365234375, 0.746337890625, 0.862701416015625, 0.97906494140625, 1.095428466796875, 1.2117919921875, 1.328155517578125, 1.44451904296875, 1.560882568359375, 1.67724609375, 1.793609619140625, 1.90997314453125, 2.026336669921875, 2.1427001953125, 2.259063720703125, 2.37542724609375, 2.491790771484375, 2.608154296875, 2.724517822265625, 2.84088134765625, 2.957244873046875, 3.0736083984375, 3.189971923828125, 3.30633544921875, 3.422698974609375, 3.5390625]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 5.0, 13.0, 11.0, 8.0, 32.0, 35.0, 52.0, 101.0, 130.0, 201.0, 291.0, 437.0, 679.0, 1078.0, 1655.0, 2535.0, 4038.0, 6038.0, 9627.0, 14721.0, 22083.0, 34451.0, 54376.0, 85770.0, 136089.0, 1251012.0, 171601.0, 108281.0, 68698.0, 43321.0, 28185.0, 18023.0, 11866.0, 7501.0, 4983.0, 3203.0, 2126.0, 1313.0, 904.0, 571.0, 341.0, 255.0, 158.0, 108.0, 67.0, 71.0, 33.0, 26.0, 18.0, 6.0, 10.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7021484375, -0.6800384521484375, -0.657928466796875, -0.6358184814453125, -0.61370849609375, -0.5915985107421875, -0.569488525390625, -0.5473785400390625, -0.5252685546875, -0.5031585693359375, -0.481048583984375, -0.4589385986328125, -0.43682861328125, -0.4147186279296875, -0.392608642578125, -0.3704986572265625, -0.348388671875, -0.3262786865234375, -0.304168701171875, -0.2820587158203125, -0.25994873046875, -0.2378387451171875, -0.215728759765625, -0.1936187744140625, -0.1715087890625, -0.1493988037109375, -0.127288818359375, -0.1051788330078125, -0.08306884765625, -0.0609588623046875, -0.038848876953125, -0.0167388916015625, 0.00537109375, 0.0274810791015625, 0.049591064453125, 0.0717010498046875, 0.09381103515625, 0.1159210205078125, 0.138031005859375, 0.1601409912109375, 0.1822509765625, 0.2043609619140625, 0.226470947265625, 0.2485809326171875, 0.27069091796875, 0.2928009033203125, 0.314910888671875, 0.3370208740234375, 0.359130859375, 0.3812408447265625, 0.403350830078125, 0.4254608154296875, 0.44757080078125, 0.4696807861328125, 0.491790771484375, 0.5139007568359375, 0.5360107421875, 0.5581207275390625, 0.580230712890625, 0.6023406982421875, 0.62445068359375, 0.6465606689453125, 0.668670654296875, 0.6907806396484375, 0.712890625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 7.0, 5.0, 4.0, 5.0, 9.0, 8.0, 14.0, 29.0, 24.0, 27.0, 56.0, 61.0, 80.0, 90.0, 79.0, 99.0, 83.0, 70.0, 58.0, 44.0, 33.0, 29.0, 21.0, 14.0, 13.0, 4.0, 6.0, 7.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001674652099609375, -0.0016166865825653076, -0.0015587210655212402, -0.0015007555484771729, -0.0014427900314331055, -0.001384824514389038, -0.0013268589973449707, -0.0012688934803009033, -0.001210927963256836, -0.0011529624462127686, -0.0010949969291687012, -0.0010370314121246338, -0.0009790658950805664, -0.000921100378036499, -0.0008631348609924316, -0.0008051693439483643, -0.0007472038269042969, -0.0006892383098602295, -0.0006312727928161621, -0.0005733072757720947, -0.0005153417587280273, -0.00045737624168395996, -0.0003994107246398926, -0.0003414452075958252, -0.0002834796905517578, -0.00022551417350769043, -0.00016754865646362305, -0.00010958313941955566, -5.161762237548828e-05, 6.3478946685791016e-06, 6.431341171264648e-05, 0.00012227892875671387, 0.00018024444580078125, 0.00023820996284484863, 0.000296175479888916, 0.0003541409969329834, 0.0004121065139770508, 0.00047007203102111816, 0.0005280375480651855, 0.0005860030651092529, 0.0006439685821533203, 0.0007019340991973877, 0.0007598996162414551, 0.0008178651332855225, 0.0008758306503295898, 0.0009337961673736572, 0.0009917616844177246, 0.001049727201461792, 0.0011076927185058594, 0.0011656582355499268, 0.0012236237525939941, 0.0012815892696380615, 0.001339554786682129, 0.0013975203037261963, 0.0014554858207702637, 0.001513451337814331, 0.0015714168548583984, 0.0016293823719024658, 0.0016873478889465332, 0.0017453134059906006, 0.001803278923034668, 0.0018612444400787354, 0.0019192099571228027, 0.00197717547416687, 0.0020351409912109375]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 0.0, 5.0, 6.0, 6.0, 10.0, 7.0, 13.0, 18.0, 20.0, 23.0, 57.0, 72.0, 106.0, 163.0, 295.0, 536.0, 15372.0, 1029790.0, 1100.0, 342.0, 212.0, 120.0, 78.0, 70.0, 36.0, 23.0, 20.0, 10.0, 7.0, 8.0, 8.0, 7.0, 4.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.044464111328125, -0.04320240020751953, -0.04194068908691406, -0.040678977966308594, -0.039417266845703125, -0.038155555725097656, -0.03689384460449219, -0.03563213348388672, -0.03437042236328125, -0.03310871124267578, -0.03184700012207031, -0.030585289001464844, -0.029323577880859375, -0.028061866760253906, -0.026800155639648438, -0.02553844451904297, -0.0242767333984375, -0.02301502227783203, -0.021753311157226562, -0.020491600036621094, -0.019229888916015625, -0.017968177795410156, -0.016706466674804688, -0.015444755554199219, -0.01418304443359375, -0.012921333312988281, -0.011659622192382812, -0.010397911071777344, -0.009136199951171875, -0.007874488830566406, -0.0066127777099609375, -0.005351066589355469, -0.00408935546875, -0.0028276443481445312, -0.0015659332275390625, -0.00030422210693359375, 0.000957489013671875, 0.0022192001342773438, 0.0034809112548828125, 0.004742622375488281, 0.00600433349609375, 0.007266044616699219, 0.008527755737304688, 0.009789466857910156, 0.011051177978515625, 0.012312889099121094, 0.013574600219726562, 0.014836311340332031, 0.0160980224609375, 0.01735973358154297, 0.018621444702148438, 0.019883155822753906, 0.021144866943359375, 0.022406578063964844, 0.023668289184570312, 0.02493000030517578, 0.02619171142578125, 0.02745342254638672, 0.028715133666992188, 0.029976844787597656, 0.031238555908203125, 0.032500267028808594, 0.03376197814941406, 0.03502368927001953, 0.036285400390625]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 20.0, 409.0, 543.0, 44.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004643936641514301, -0.004494477994740009, -0.004345019347965717, -0.004195560701191425, -0.004046102054417133, -0.0038966434076428413, -0.0037471847608685493, -0.0035977261140942574, -0.0034482674673199654, -0.0032988088205456734, -0.0031493501737713814, -0.0029998915269970894, -0.0028504328802227974, -0.0027009742334485054, -0.0025515155866742134, -0.0024020569398999214, -0.0022525980602949858, -0.0021031394135206938, -0.001953680766746402, -0.0018042221199721098, -0.0016547634731978178, -0.0015053048264235258, -0.001355846063233912, -0.00120638741645962, -0.001056928769685328, -0.000907470122911036, -0.000758011476136744, -0.0006085527711547911, -0.0004590941243804991, -0.00030963547760620713, -0.00016017677262425423, -1.0718125849962234e-05, 0.00013874052092432976, 0.00028819916769862175, 0.0004376578435767442, 0.0005871165194548666, 0.0007365751662291586, 0.0008860338130034506, 0.0010354925179854035, 0.0011849511647596955, 0.0013344098115339875, 0.0014838684583082795, 0.0016333271050825715, 0.0017827858682721853, 0.0019322445150464773, 0.0020817031618207693, 0.0022311618085950613, 0.0023806204553693533, 0.0025300791021436453, 0.0026795377489179373, 0.0028289963956922293, 0.0029784550424665213, 0.0031279136892408133, 0.0032773723360151052, 0.003426831215620041, 0.003576289862394333, 0.003725748509168625, 0.003875207155942917, 0.004024665802717209, 0.004174124449491501, 0.004323583096265793, 0.004473041743040085, 0.004622500389814377, 0.004771959036588669, 0.004921417683362961]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 4.0, 4.0, 8.0, 4.0, 5.0, 8.0, 9.0, 3.0, 12.0, 16.0, 15.0, 19.0, 28.0, 24.0, 28.0, 33.0, 22.0, 37.0, 29.0, 41.0, 48.0, 36.0, 47.0, 37.0, 52.0, 42.0, 36.0, 31.0, 38.0, 33.0, 36.0, 34.0, 31.0, 21.0, 17.0, 29.0, 10.0, 10.0, 11.0, 12.0, 12.0, 8.0, 2.0, 3.0, 5.0, 6.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0007987618446350098, -0.000775020569562912, -0.0007512792944908142, -0.0007275380194187164, -0.0007037967443466187, -0.0006800554692745209, -0.0006563141942024231, -0.0006325729191303253, -0.0006088316440582275, -0.0005850903689861298, -0.000561349093914032, -0.0005376078188419342, -0.0005138665437698364, -0.0004901252686977386, -0.00046638399362564087, -0.0004426427185535431, -0.0004189014434814453, -0.00039516016840934753, -0.00037141889333724976, -0.000347677618265152, -0.0003239363431930542, -0.0003001950681209564, -0.00027645379304885864, -0.00025271251797676086, -0.00022897124290466309, -0.0002052299678325653, -0.00018148869276046753, -0.00015774741768836975, -0.00013400614261627197, -0.0001102648675441742, -8.652359247207642e-05, -6.278231739997864e-05, -3.904104232788086e-05, -1.529976725578308e-05, 8.441507816314697e-06, 3.2182782888412476e-05, 5.5924057960510254e-05, 7.966533303260803e-05, 0.00010340660810470581, 0.0001271478831768036, 0.00015088915824890137, 0.00017463043332099915, 0.00019837170839309692, 0.0002221129834651947, 0.0002458542585372925, 0.00026959553360939026, 0.00029333680868148804, 0.0003170780837535858, 0.0003408193588256836, 0.00036456063389778137, 0.00038830190896987915, 0.00041204318404197693, 0.0004357844591140747, 0.0004595257341861725, 0.00048326700925827026, 0.000507008284330368, 0.0005307495594024658, 0.0005544908344745636, 0.0005782321095466614, 0.0006019733846187592, 0.0006257146596908569, 0.0006494559347629547, 0.0006731972098350525, 0.0006969384849071503, 0.000720679759979248]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 8.0, 14.0, 10.0, 9.0, 17.0, 10.0, 25.0, 24.0, 27.0, 27.0, 30.0, 32.0, 32.0, 44.0, 43.0, 46.0, 49.0, 45.0, 44.0, 46.0, 57.0, 42.0, 37.0, 49.0, 37.0, 32.0, 34.0, 23.0, 20.0, 23.0, 14.0, 14.0, 8.0, 9.0, 11.0, 6.0, 1.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.953125, -5.7542724609375, -5.555419921875, -5.3565673828125, -5.15771484375, -4.9588623046875, -4.760009765625, -4.5611572265625, -4.3623046875, -4.1634521484375, -3.964599609375, -3.7657470703125, -3.56689453125, -3.3680419921875, -3.169189453125, -2.9703369140625, -2.771484375, -2.5726318359375, -2.373779296875, -2.1749267578125, -1.97607421875, -1.7772216796875, -1.578369140625, -1.3795166015625, -1.1806640625, -0.9818115234375, -0.782958984375, -0.5841064453125, -0.38525390625, -0.1864013671875, 0.012451171875, 0.2113037109375, 0.41015625, 0.6090087890625, 0.807861328125, 1.0067138671875, 1.20556640625, 1.4044189453125, 1.603271484375, 1.8021240234375, 2.0009765625, 2.1998291015625, 2.398681640625, 2.5975341796875, 2.79638671875, 2.9952392578125, 3.194091796875, 3.3929443359375, 3.591796875, 3.7906494140625, 3.989501953125, 4.1883544921875, 4.38720703125, 4.5860595703125, 4.784912109375, 4.9837646484375, 5.1826171875, 5.3814697265625, 5.580322265625, 5.7791748046875, 5.97802734375, 6.1768798828125, 6.375732421875, 6.5745849609375, 6.7734375]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 5.0, 4.0, 7.0, 17.0, 43.0, 31.0, 49.0, 97.0, 129.0, 282.0, 395.0, 728.0, 1294.0, 2335.0, 4368.0, 8990.0, 20549.0, 55672.0, 215835.0, 530116.0, 136491.0, 40039.0, 15741.0, 7175.0, 3595.0, 1880.0, 1143.0, 617.0, 342.0, 231.0, 156.0, 72.0, 51.0, 28.0, 19.0, 14.0, 9.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9140625, -4.77099609375, -4.6279296875, -4.48486328125, -4.341796875, -4.19873046875, -4.0556640625, -3.91259765625, -3.76953125, -3.62646484375, -3.4833984375, -3.34033203125, -3.197265625, -3.05419921875, -2.9111328125, -2.76806640625, -2.625, -2.48193359375, -2.3388671875, -2.19580078125, -2.052734375, -1.90966796875, -1.7666015625, -1.62353515625, -1.48046875, -1.33740234375, -1.1943359375, -1.05126953125, -0.908203125, -0.76513671875, -0.6220703125, -0.47900390625, -0.3359375, -0.19287109375, -0.0498046875, 0.09326171875, 0.236328125, 0.37939453125, 0.5224609375, 0.66552734375, 0.80859375, 0.95166015625, 1.0947265625, 1.23779296875, 1.380859375, 1.52392578125, 1.6669921875, 1.81005859375, 1.953125, 2.09619140625, 2.2392578125, 2.38232421875, 2.525390625, 2.66845703125, 2.8115234375, 2.95458984375, 3.09765625, 3.24072265625, 3.3837890625, 3.52685546875, 3.669921875, 3.81298828125, 3.9560546875, 4.09912109375, 4.2421875]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 3.0, 5.0, 2.0, 2.0, 3.0, 8.0, 6.0, 7.0, 16.0, 16.0, 10.0, 18.0, 20.0, 24.0, 27.0, 26.0, 34.0, 38.0, 37.0, 39.0, 63.0, 85.0, 1715.0, 336.0, 77.0, 51.0, 45.0, 38.0, 48.0, 37.0, 24.0, 25.0, 26.0, 28.0, 21.0, 20.0, 21.0, 18.0, 11.0, 3.0, 6.0, 5.0, 7.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.109375, -17.435791015625, -16.76220703125, -16.088623046875, -15.4150390625, -14.741455078125, -14.06787109375, -13.394287109375, -12.720703125, -12.047119140625, -11.37353515625, -10.699951171875, -10.0263671875, -9.352783203125, -8.67919921875, -8.005615234375, -7.33203125, -6.658447265625, -5.98486328125, -5.311279296875, -4.6376953125, -3.964111328125, -3.29052734375, -2.616943359375, -1.943359375, -1.269775390625, -0.59619140625, 0.077392578125, 0.7509765625, 1.424560546875, 2.09814453125, 2.771728515625, 3.4453125, 4.118896484375, 4.79248046875, 5.466064453125, 6.1396484375, 6.813232421875, 7.48681640625, 8.160400390625, 8.833984375, 9.507568359375, 10.18115234375, 10.854736328125, 11.5283203125, 12.201904296875, 12.87548828125, 13.549072265625, 14.22265625, 14.896240234375, 15.56982421875, 16.243408203125, 16.9169921875, 17.590576171875, 18.26416015625, 18.937744140625, 19.611328125, 20.284912109375, 20.95849609375, 21.632080078125, 22.3056640625, 22.979248046875, 23.65283203125, 24.326416015625, 25.0]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 5.0, 5.0, 3.0, 6.0, 14.0, 19.0, 20.0, 14.0, 28.0, 28.0, 34.0, 37.0, 43.0, 72.0, 92.0, 156.0, 260.0, 556.0, 2719.0, 140098.0, 2990659.0, 8915.0, 1032.0, 323.0, 151.0, 107.0, 78.0, 43.0, 25.0, 34.0, 26.0, 17.0, 16.0, 10.0, 16.0, 15.0, 3.0, 8.0, 7.0, 1.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0], "bins": [-41.75, -40.628173828125, -39.50634765625, -38.384521484375, -37.2626953125, -36.140869140625, -35.01904296875, -33.897216796875, -32.775390625, -31.653564453125, -30.53173828125, -29.409912109375, -28.2880859375, -27.166259765625, -26.04443359375, -24.922607421875, -23.80078125, -22.678955078125, -21.55712890625, -20.435302734375, -19.3134765625, -18.191650390625, -17.06982421875, -15.947998046875, -14.826171875, -13.704345703125, -12.58251953125, -11.460693359375, -10.3388671875, -9.217041015625, -8.09521484375, -6.973388671875, -5.8515625, -4.729736328125, -3.60791015625, -2.486083984375, -1.3642578125, -0.242431640625, 0.87939453125, 2.001220703125, 3.123046875, 4.244873046875, 5.36669921875, 6.488525390625, 7.6103515625, 8.732177734375, 9.85400390625, 10.975830078125, 12.09765625, 13.219482421875, 14.34130859375, 15.463134765625, 16.5849609375, 17.706787109375, 18.82861328125, 19.950439453125, 21.072265625, 22.194091796875, 23.31591796875, 24.437744140625, 25.5595703125, 26.681396484375, 27.80322265625, 28.925048828125, 30.046875]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [19.0, 846.0, 152.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.61663818359375, -4.067175388336182, 1.4822874069213867, 7.031749725341797, 12.581212997436523, 18.13067626953125, 23.680137634277344, 29.229602813720703, 34.7790641784668, 40.32852554321289, 45.87799072265625, 51.427452087402344, 56.97691345214844, 62.5263786315918, 68.07583618164062, 73.62530517578125, 79.17476654052734, 84.72422790527344, 90.27368927001953, 95.82315063476562, 101.37261962890625, 106.92208099365234, 112.47154235839844, 118.02101135253906, 123.57046508789062, 129.11993408203125, 134.6693878173828, 140.21885681152344, 145.768310546875, 151.31777954101562, 156.86724853515625, 162.4167022705078, 167.96617126464844, 173.51564025878906, 179.06509399414062, 184.61456298828125, 190.1640167236328, 195.71348571777344, 201.262939453125, 206.81240844726562, 212.36187744140625, 217.91134643554688, 223.46080017089844, 229.01026916503906, 234.55972290039062, 240.10919189453125, 245.65866088867188, 251.20811462402344, 256.757568359375, 262.3070373535156, 267.85650634765625, 273.40594482421875, 278.9554138183594, 284.5048828125, 290.0543518066406, 295.60382080078125, 301.1532897949219, 306.7027587890625, 312.2522277832031, 317.8016662597656, 323.35113525390625, 328.9006042480469, 334.4500732421875, 339.9995422363281, 345.5489807128906]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 8.0, 4.0, 7.0, 9.0, 8.0, 9.0, 11.0, 16.0, 23.0, 15.0, 18.0, 13.0, 32.0, 19.0, 31.0, 47.0, 40.0, 35.0, 37.0, 44.0, 40.0, 39.0, 44.0, 33.0, 49.0, 37.0, 37.0, 51.0, 26.0, 34.0, 28.0, 27.0, 24.0, 18.0, 17.0, 23.0, 20.0, 6.0, 4.0, 10.0, 8.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-76.71792602539062, -74.57952880859375, -72.44113159179688, -70.30274200439453, -68.16434478759766, -66.02594757080078, -63.88755416870117, -61.74916076660156, -59.61076354980469, -57.47236633300781, -55.3339729309082, -53.195579528808594, -51.05718231201172, -48.918785095214844, -46.780391693115234, -44.641998291015625, -42.50360107421875, -40.365203857421875, -38.226810455322266, -36.088417053222656, -33.95001983642578, -31.81162452697754, -29.673229217529297, -27.534833908081055, -25.396438598632812, -23.25804328918457, -21.119647979736328, -18.981252670288086, -16.842857360839844, -14.704462051391602, -12.56606674194336, -10.427671432495117, -8.289268493652344, -6.150873184204102, -4.012477874755859, -1.8740825653076172, 0.264312744140625, 2.402708053588867, 4.541103363037109, 6.679498672485352, 8.817893981933594, 10.956289291381836, 13.094684600830078, 15.23307991027832, 17.371475219726562, 19.509870529174805, 21.648265838623047, 23.78666114807129, 25.92505645751953, 28.063451766967773, 30.201847076416016, 32.340240478515625, 34.4786376953125, 36.617034912109375, 38.755428314208984, 40.893821716308594, 43.03221893310547, 45.170616149902344, 47.30900955200195, 49.44740295410156, 51.58580017089844, 53.72419738769531, 55.86259078979492, 58.00098419189453, 60.139381408691406]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 7.0, 10.0, 11.0, 9.0, 16.0, 13.0, 15.0, 34.0, 17.0, 28.0, 32.0, 29.0, 43.0, 36.0, 45.0, 39.0, 45.0, 42.0, 49.0, 58.0, 52.0, 46.0, 39.0, 33.0, 46.0, 33.0, 27.0, 29.0, 26.0, 17.0, 20.0, 13.0, 8.0, 8.0, 11.0, 8.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.171875, -5.96710205078125, -5.7623291015625, -5.55755615234375, -5.352783203125, -5.14801025390625, -4.9432373046875, -4.73846435546875, -4.53369140625, -4.32891845703125, -4.1241455078125, -3.91937255859375, -3.714599609375, -3.50982666015625, -3.3050537109375, -3.10028076171875, -2.8955078125, -2.69073486328125, -2.4859619140625, -2.28118896484375, -2.076416015625, -1.87164306640625, -1.6668701171875, -1.46209716796875, -1.25732421875, -1.05255126953125, -0.8477783203125, -0.64300537109375, -0.438232421875, -0.23345947265625, -0.0286865234375, 0.17608642578125, 0.380859375, 0.58563232421875, 0.7904052734375, 0.99517822265625, 1.199951171875, 1.40472412109375, 1.6094970703125, 1.81427001953125, 2.01904296875, 2.22381591796875, 2.4285888671875, 2.63336181640625, 2.838134765625, 3.04290771484375, 3.2476806640625, 3.45245361328125, 3.6572265625, 3.86199951171875, 4.0667724609375, 4.27154541015625, 4.476318359375, 4.68109130859375, 4.8858642578125, 5.09063720703125, 5.29541015625, 5.50018310546875, 5.7049560546875, 5.90972900390625, 6.114501953125, 6.31927490234375, 6.5240478515625, 6.72882080078125, 6.93359375]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 9.0, 8.0, 14.0, 18.0, 17.0, 18.0, 28.0, 19.0, 26.0, 33.0, 29.0, 49.0, 44.0, 128.0, 695.0, 17168.0, 3430917.0, 740289.0, 4115.0, 262.0, 80.0, 42.0, 28.0, 42.0, 32.0, 41.0, 25.0, 22.0, 20.0, 15.0, 7.0, 10.0, 8.0, 5.0, 7.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.28125, -38.0068359375, -36.732421875, -35.4580078125, -34.18359375, -32.9091796875, -31.634765625, -30.3603515625, -29.0859375, -27.8115234375, -26.537109375, -25.2626953125, -23.98828125, -22.7138671875, -21.439453125, -20.1650390625, -18.890625, -17.6162109375, -16.341796875, -15.0673828125, -13.79296875, -12.5185546875, -11.244140625, -9.9697265625, -8.6953125, -7.4208984375, -6.146484375, -4.8720703125, -3.59765625, -2.3232421875, -1.048828125, 0.2255859375, 1.5, 2.7744140625, 4.048828125, 5.3232421875, 6.59765625, 7.8720703125, 9.146484375, 10.4208984375, 11.6953125, 12.9697265625, 14.244140625, 15.5185546875, 16.79296875, 18.0673828125, 19.341796875, 20.6162109375, 21.890625, 23.1650390625, 24.439453125, 25.7138671875, 26.98828125, 28.2626953125, 29.537109375, 30.8115234375, 32.0859375, 33.3603515625, 34.634765625, 35.9091796875, 37.18359375, 38.4580078125, 39.732421875, 41.0068359375, 42.28125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 5.0, 11.0, 16.0, 24.0, 38.0, 51.0, 72.0, 134.0, 222.0, 334.0, 511.0, 763.0, 662.0, 463.0, 308.0, 182.0, 111.0, 56.0, 42.0, 34.0, 23.0, 6.0, 6.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-38.75, -37.92236328125, -37.0947265625, -36.26708984375, -35.439453125, -34.61181640625, -33.7841796875, -32.95654296875, -32.12890625, -31.30126953125, -30.4736328125, -29.64599609375, -28.818359375, -27.99072265625, -27.1630859375, -26.33544921875, -25.5078125, -24.68017578125, -23.8525390625, -23.02490234375, -22.197265625, -21.36962890625, -20.5419921875, -19.71435546875, -18.88671875, -18.05908203125, -17.2314453125, -16.40380859375, -15.576171875, -14.74853515625, -13.9208984375, -13.09326171875, -12.265625, -11.43798828125, -10.6103515625, -9.78271484375, -8.955078125, -8.12744140625, -7.2998046875, -6.47216796875, -5.64453125, -4.81689453125, -3.9892578125, -3.16162109375, -2.333984375, -1.50634765625, -0.6787109375, 0.14892578125, 0.9765625, 1.80419921875, 2.6318359375, 3.45947265625, 4.287109375, 5.11474609375, 5.9423828125, 6.77001953125, 7.59765625, 8.42529296875, 9.2529296875, 10.08056640625, 10.908203125, 11.73583984375, 12.5634765625, 13.39111328125, 14.21875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 10.0, 8.0, 21.0, 35.0, 53.0, 106.0, 189.0, 256.0, 576.0, 4542.0, 3904237.0, 281852.0, 1420.0, 394.0, 211.0, 141.0, 86.0, 44.0, 36.0, 33.0, 20.0, 6.0, 6.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.0, -41.744140625, -38.48828125, -35.232421875, -31.9765625, -28.720703125, -25.46484375, -22.208984375, -18.953125, -15.697265625, -12.44140625, -9.185546875, -5.9296875, -2.673828125, 0.58203125, 3.837890625, 7.09375, 10.349609375, 13.60546875, 16.861328125, 20.1171875, 23.373046875, 26.62890625, 29.884765625, 33.140625, 36.396484375, 39.65234375, 42.908203125, 46.1640625, 49.419921875, 52.67578125, 55.931640625, 59.1875, 62.443359375, 65.69921875, 68.955078125, 72.2109375, 75.466796875, 78.72265625, 81.978515625, 85.234375, 88.490234375, 91.74609375, 95.001953125, 98.2578125, 101.513671875, 104.76953125, 108.025390625, 111.28125, 114.537109375, 117.79296875, 121.048828125, 124.3046875, 127.560546875, 130.81640625, 134.072265625, 137.328125, 140.583984375, 143.83984375, 147.095703125, 150.3515625, 153.607421875, 156.86328125, 160.119140625, 163.375]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 12.0, 52.0, 155.0, 306.0, 292.0, 130.0, 50.0, 13.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-261.0731201171875, -256.14556884765625, -251.21800231933594, -246.2904510498047, -241.36289978027344, -236.4353485107422, -231.50778198242188, -226.58023071289062, -221.65267944335938, -216.72512817382812, -211.7975616455078, -206.87001037597656, -201.9424591064453, -197.01490783691406, -192.08734130859375, -187.1597900390625, -182.23223876953125, -177.3046875, -172.3771209716797, -167.44956970214844, -162.5220184326172, -157.59446716308594, -152.66690063476562, -147.73934936523438, -142.81178283691406, -137.8842315673828, -132.9566650390625, -128.02911376953125, -123.1015625, -118.17400360107422, -113.24644470214844, -108.31889343261719, -103.39134216308594, -98.46378326416016, -93.5362319946289, -88.60867309570312, -83.68112182617188, -78.7535629272461, -73.82600402832031, -68.89845275878906, -63.97089767456055, -59.04334259033203, -54.115787506103516, -49.188232421875, -44.26067352294922, -39.33312225341797, -34.40556335449219, -29.478008270263672, -24.550453186035156, -19.62289810180664, -14.695342063903809, -9.767786026000977, -4.840230941772461, 0.08732414245605469, 5.014881134033203, 9.942436218261719, 14.869991302490234, 19.79754638671875, 24.725101470947266, 29.652658462524414, 34.58021545410156, 39.50776672363281, 44.435325622558594, 49.36288070678711, 54.290435791015625]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 10.0, 7.0, 6.0, 7.0, 9.0, 10.0, 20.0, 15.0, 17.0, 27.0, 25.0, 29.0, 34.0, 31.0, 36.0, 38.0, 45.0, 46.0, 45.0, 40.0, 40.0, 47.0, 33.0, 42.0, 43.0, 35.0, 39.0, 35.0, 30.0, 20.0, 12.0, 31.0, 16.0, 20.0, 16.0, 9.0, 10.0, 10.0, 5.0, 8.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.0679931640625, -53.16908645629883, -51.27018356323242, -49.37127685546875, -47.472373962402344, -45.57346725463867, -43.674560546875, -41.775657653808594, -39.87675476074219, -37.977848052978516, -36.07894515991211, -34.18003845214844, -32.28113555908203, -30.38222885131836, -28.48332405090332, -26.58441925048828, -24.68551254272461, -22.78660774230957, -20.88770294189453, -18.98879623413086, -17.089893341064453, -15.190987586975098, -13.292081832885742, -11.393177032470703, -9.494272232055664, -7.595367431640625, -5.696462154388428, -3.7975568771362305, -1.8986520767211914, 0.00025272369384765625, 1.8991584777832031, 3.798063278198242, 5.696968078613281, 7.59587287902832, 9.49477767944336, 11.393683433532715, 13.292588233947754, 15.191493034362793, 17.09039878845215, 18.989303588867188, 20.888208389282227, 22.787113189697266, 24.686017990112305, 26.584922790527344, 28.483829498291016, 30.382732391357422, 32.281639099121094, 34.1805419921875, 36.07944869995117, 37.978355407714844, 39.87725830078125, 41.77616500854492, 43.67506790161133, 45.573974609375, 47.472877502441406, 49.37178421020508, 51.27069091796875, 53.16959762573242, 55.06850051879883, 56.9674072265625, 58.866310119628906, 60.76521682739258, 62.66412353515625, 64.56302642822266, 66.46192932128906]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 1.0, 5.0, 8.0, 12.0, 15.0, 14.0, 14.0, 11.0, 20.0, 33.0, 24.0, 22.0, 26.0, 37.0, 33.0, 41.0, 39.0, 39.0, 43.0, 34.0, 45.0, 46.0, 55.0, 46.0, 43.0, 41.0, 33.0, 30.0, 26.0, 23.0, 26.0, 23.0, 16.0, 19.0, 19.0, 8.0, 6.0, 4.0, 7.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.83984375, -5.64495849609375, -5.4500732421875, -5.25518798828125, -5.060302734375, -4.86541748046875, -4.6705322265625, -4.47564697265625, -4.28076171875, -4.08587646484375, -3.8909912109375, -3.69610595703125, -3.501220703125, -3.30633544921875, -3.1114501953125, -2.91656494140625, -2.7216796875, -2.52679443359375, -2.3319091796875, -2.13702392578125, -1.942138671875, -1.74725341796875, -1.5523681640625, -1.35748291015625, -1.16259765625, -0.96771240234375, -0.7728271484375, -0.57794189453125, -0.383056640625, -0.18817138671875, 0.0067138671875, 0.20159912109375, 0.396484375, 0.59136962890625, 0.7862548828125, 0.98114013671875, 1.176025390625, 1.37091064453125, 1.5657958984375, 1.76068115234375, 1.95556640625, 2.15045166015625, 2.3453369140625, 2.54022216796875, 2.735107421875, 2.92999267578125, 3.1248779296875, 3.31976318359375, 3.5146484375, 3.70953369140625, 3.9044189453125, 4.09930419921875, 4.294189453125, 4.48907470703125, 4.6839599609375, 4.87884521484375, 5.07373046875, 5.26861572265625, 5.4635009765625, 5.65838623046875, 5.853271484375, 6.04815673828125, 6.2430419921875, 6.43792724609375, 6.6328125]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 7.0, 8.0, 10.0, 18.0, 24.0, 59.0, 93.0, 157.0, 210.0, 310.0, 542.0, 892.0, 1488.0, 2488.0, 4343.0, 7467.0, 12771.0, 23088.0, 41299.0, 74690.0, 137901.0, 242062.0, 223268.0, 122775.0, 66783.0, 36434.0, 21030.0, 11919.0, 6722.0, 3880.0, 2323.0, 1384.0, 814.0, 515.0, 286.0, 188.0, 111.0, 60.0, 49.0, 29.0, 21.0, 18.0, 12.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.1513671875, -1.1183853149414062, -1.0854034423828125, -1.0524215698242188, -1.019439697265625, -0.9864578247070312, -0.9534759521484375, -0.9204940795898438, -0.88751220703125, -0.8545303344726562, -0.8215484619140625, -0.7885665893554688, -0.755584716796875, -0.7226028442382812, -0.6896209716796875, -0.6566390991210938, -0.6236572265625, -0.5906753540039062, -0.5576934814453125, -0.5247116088867188, -0.491729736328125, -0.45874786376953125, -0.4257659912109375, -0.39278411865234375, -0.35980224609375, -0.32682037353515625, -0.2938385009765625, -0.26085662841796875, -0.227874755859375, -0.19489288330078125, -0.1619110107421875, -0.12892913818359375, -0.095947265625, -0.06296539306640625, -0.0299835205078125, 0.00299835205078125, 0.035980224609375, 0.06896209716796875, 0.1019439697265625, 0.13492584228515625, 0.16790771484375, 0.20088958740234375, 0.2338714599609375, 0.26685333251953125, 0.299835205078125, 0.33281707763671875, 0.3657989501953125, 0.39878082275390625, 0.4317626953125, 0.46474456787109375, 0.4977264404296875, 0.5307083129882812, 0.563690185546875, 0.5966720581054688, 0.6296539306640625, 0.6626358032226562, 0.69561767578125, 0.7285995483398438, 0.7615814208984375, 0.7945632934570312, 0.827545166015625, 0.8605270385742188, 0.8935089111328125, 0.9264907836914062, 0.95947265625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 6.0, 4.0, 5.0, 10.0, 12.0, 12.0, 11.0, 18.0, 23.0, 22.0, 35.0, 25.0, 27.0, 28.0, 34.0, 35.0, 39.0, 43.0, 41.0, 42.0, 1066.0, 37.0, 42.0, 46.0, 47.0, 34.0, 45.0, 29.0, 28.0, 24.0, 24.0, 20.0, 8.0, 15.0, 12.0, 13.0, 9.0, 11.0, 10.0, 10.0, 6.0, 2.0, 5.0, 2.0, 7.0, 4.0, 1.0], "bins": [-4.39453125, -4.27777099609375, -4.1610107421875, -4.04425048828125, -3.927490234375, -3.81072998046875, -3.6939697265625, -3.57720947265625, -3.46044921875, -3.34368896484375, -3.2269287109375, -3.11016845703125, -2.993408203125, -2.87664794921875, -2.7598876953125, -2.64312744140625, -2.5263671875, -2.40960693359375, -2.2928466796875, -2.17608642578125, -2.059326171875, -1.94256591796875, -1.8258056640625, -1.70904541015625, -1.59228515625, -1.47552490234375, -1.3587646484375, -1.24200439453125, -1.125244140625, -1.00848388671875, -0.8917236328125, -0.77496337890625, -0.658203125, -0.54144287109375, -0.4246826171875, -0.30792236328125, -0.191162109375, -0.07440185546875, 0.0423583984375, 0.15911865234375, 0.27587890625, 0.39263916015625, 0.5093994140625, 0.62615966796875, 0.742919921875, 0.85968017578125, 0.9764404296875, 1.09320068359375, 1.2099609375, 1.32672119140625, 1.4434814453125, 1.56024169921875, 1.677001953125, 1.79376220703125, 1.9105224609375, 2.02728271484375, 2.14404296875, 2.26080322265625, 2.3775634765625, 2.49432373046875, 2.611083984375, 2.72784423828125, 2.8446044921875, 2.96136474609375, 3.078125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 13.0, 9.0, 9.0, 26.0, 34.0, 45.0, 87.0, 133.0, 196.0, 328.0, 517.0, 799.0, 1169.0, 1949.0, 3048.0, 4881.0, 7780.0, 12343.0, 20200.0, 33590.0, 55066.0, 92722.0, 158816.0, 1281879.0, 170331.0, 99590.0, 58753.0, 35364.0, 21679.0, 13362.0, 8288.0, 5202.0, 3226.0, 1993.0, 1375.0, 850.0, 520.0, 339.0, 224.0, 129.0, 110.0, 52.0, 44.0, 26.0, 9.0, 16.0, 7.0, 7.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.89453125, -0.86865234375, -0.8427734375, -0.81689453125, -0.791015625, -0.76513671875, -0.7392578125, -0.71337890625, -0.6875, -0.66162109375, -0.6357421875, -0.60986328125, -0.583984375, -0.55810546875, -0.5322265625, -0.50634765625, -0.48046875, -0.45458984375, -0.4287109375, -0.40283203125, -0.376953125, -0.35107421875, -0.3251953125, -0.29931640625, -0.2734375, -0.24755859375, -0.2216796875, -0.19580078125, -0.169921875, -0.14404296875, -0.1181640625, -0.09228515625, -0.06640625, -0.04052734375, -0.0146484375, 0.01123046875, 0.037109375, 0.06298828125, 0.0888671875, 0.11474609375, 0.140625, 0.16650390625, 0.1923828125, 0.21826171875, 0.244140625, 0.27001953125, 0.2958984375, 0.32177734375, 0.34765625, 0.37353515625, 0.3994140625, 0.42529296875, 0.451171875, 0.47705078125, 0.5029296875, 0.52880859375, 0.5546875, 0.58056640625, 0.6064453125, 0.63232421875, 0.658203125, 0.68408203125, 0.7099609375, 0.73583984375, 0.76171875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 3.0, 4.0, 7.0, 6.0, 11.0, 10.0, 20.0, 23.0, 26.0, 28.0, 22.0, 29.0, 36.0, 38.0, 37.0, 50.0, 46.0, 67.0, 56.0, 50.0, 46.0, 47.0, 39.0, 40.0, 55.0, 30.0, 35.0, 23.0, 27.0, 21.0, 13.0, 12.0, 11.0, 8.0, 4.0, 2.0, 3.0, 4.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0009469985961914062, -0.0009155869483947754, -0.0008841753005981445, -0.0008527636528015137, -0.0008213520050048828, -0.000789940357208252, -0.0007585287094116211, -0.0007271170616149902, -0.0006957054138183594, -0.0006642937660217285, -0.0006328821182250977, -0.0006014704704284668, -0.0005700588226318359, -0.0005386471748352051, -0.0005072355270385742, -0.00047582387924194336, -0.0004444122314453125, -0.00041300058364868164, -0.0003815889358520508, -0.0003501772880554199, -0.00031876564025878906, -0.0002873539924621582, -0.00025594234466552734, -0.00022453069686889648, -0.00019311904907226562, -0.00016170740127563477, -0.0001302957534790039, -9.888410568237305e-05, -6.747245788574219e-05, -3.606081008911133e-05, -4.649162292480469e-06, 2.676248550415039e-05, 5.817413330078125e-05, 8.958578109741211e-05, 0.00012099742889404297, 0.00015240907669067383, 0.0001838207244873047, 0.00021523237228393555, 0.0002466440200805664, 0.00027805566787719727, 0.0003094673156738281, 0.000340878963470459, 0.00037229061126708984, 0.0004037022590637207, 0.00043511390686035156, 0.0004665255546569824, 0.0004979372024536133, 0.0005293488502502441, 0.000560760498046875, 0.0005921721458435059, 0.0006235837936401367, 0.0006549954414367676, 0.0006864070892333984, 0.0007178187370300293, 0.0007492303848266602, 0.000780642032623291, 0.0008120536804199219, 0.0008434653282165527, 0.0008748769760131836, 0.0009062886238098145, 0.0009377002716064453, 0.0009691119194030762, 0.001000523567199707, 0.0010319352149963379, 0.0010633468627929688]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 7.0, 2.0, 2.0, 2.0, 10.0, 7.0, 7.0, 14.0, 12.0, 39.0, 46.0, 57.0, 73.0, 126.0, 194.0, 331.0, 587.0, 6652.0, 1035684.0, 3267.0, 566.0, 301.0, 178.0, 94.0, 58.0, 56.0, 48.0, 22.0, 25.0, 29.0, 15.0, 13.0, 8.0, 7.0, 6.0, 1.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.02850341796875, -0.027624845504760742, -0.026746273040771484, -0.025867700576782227, -0.02498912811279297, -0.02411055564880371, -0.023231983184814453, -0.022353410720825195, -0.021474838256835938, -0.02059626579284668, -0.019717693328857422, -0.018839120864868164, -0.017960548400878906, -0.01708197593688965, -0.01620340347290039, -0.015324831008911133, -0.014446258544921875, -0.013567686080932617, -0.01268911361694336, -0.011810541152954102, -0.010931968688964844, -0.010053396224975586, -0.009174823760986328, -0.00829625129699707, -0.0074176788330078125, -0.006539106369018555, -0.005660533905029297, -0.004781961441040039, -0.0039033889770507812, -0.0030248165130615234, -0.0021462440490722656, -0.0012676715850830078, -0.00038909912109375, 0.0004894733428955078, 0.0013680458068847656, 0.0022466182708740234, 0.0031251907348632812, 0.004003763198852539, 0.004882335662841797, 0.005760908126831055, 0.0066394805908203125, 0.00751805305480957, 0.008396625518798828, 0.009275197982788086, 0.010153770446777344, 0.011032342910766602, 0.01191091537475586, 0.012789487838745117, 0.013668060302734375, 0.014546632766723633, 0.01542520523071289, 0.01630377769470215, 0.017182350158691406, 0.018060922622680664, 0.018939495086669922, 0.01981806755065918, 0.020696640014648438, 0.021575212478637695, 0.022453784942626953, 0.02333235740661621, 0.02421092987060547, 0.025089502334594727, 0.025968074798583984, 0.026846647262573242, 0.0277252197265625]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 48.0, 252.0, 519.0, 172.0, 14.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001175920944660902, -0.0010878217872232199, -0.000999722513370216, -0.0009116233559325337, -0.0008235241402871907, -0.0007354249246418476, -0.0006473257672041655, -0.0005592265515588224, -0.00047112733591347933, -0.00038302812026813626, -0.00029492893372662365, -0.00020682974718511105, -0.00011873053153976798, -3.0631315894424915e-05, 5.7467841543257236e-05, 0.0001455670571886003, 0.00023366627283394337, 0.00032176548847928643, 0.00040986467502079904, 0.0004979638615623116, 0.0005860630772076547, 0.0006741622928529978, 0.0007622614502906799, 0.000850360665936023, 0.0009384598815813661, 0.0010265590390190482, 0.0011146583128720522, 0.0012027574703097343, 0.0012908566277474165, 0.0013789559016004205, 0.0014670550590381026, 0.0015551543328911066, 0.0016432534903287888, 0.001731352647766471, 0.0018194519216194749, 0.001907551079057157, 0.001995650352910161, 0.002083749510347843, 0.0021718486677855253, 0.0022599478252232075, 0.0023480472154915333, 0.0024361463729292154, 0.0025242455303668976, 0.0026123449206352234, 0.0027004440780729055, 0.0027885432355105877, 0.00287664239294827, 0.002964741550385952, 0.003052840707823634, 0.0031409398652613163, 0.0032290390226989985, 0.0033171381801366806, 0.0034052375704050064, 0.0034933367278426886, 0.0035814358852803707, 0.003669535042718053, 0.003757634200155735, 0.003845733357593417, 0.003933832515031099, 0.004021931905299425, 0.004110030829906464, 0.004198130220174789, 0.004286229610443115, 0.004374328535050154, 0.0044624279253184795]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 6.0, 3.0, 4.0, 12.0, 13.0, 11.0, 14.0, 12.0, 18.0, 16.0, 26.0, 19.0, 31.0, 23.0, 34.0, 30.0, 29.0, 34.0, 27.0, 48.0, 34.0, 33.0, 38.0, 31.0, 46.0, 41.0, 46.0, 30.0, 32.0, 30.0, 29.0, 24.0, 27.0, 28.0, 22.0, 17.0, 11.0, 16.0, 8.0, 9.0, 10.0, 7.0, 4.0, 11.0, 1.0, 7.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.0005563497543334961, -0.0005402639508247375, -0.000524178147315979, -0.0005080923438072205, -0.0004920065402984619, -0.00047592073678970337, -0.0004598349332809448, -0.0004437491297721863, -0.00042766332626342773, -0.0004115775227546692, -0.00039549171924591064, -0.0003794059157371521, -0.00036332011222839355, -0.000347234308719635, -0.00033114850521087646, -0.0003150627017021179, -0.0002989768981933594, -0.00028289109468460083, -0.0002668052911758423, -0.00025071948766708374, -0.0002346336841583252, -0.00021854788064956665, -0.0002024620771408081, -0.00018637627363204956, -0.00017029047012329102, -0.00015420466661453247, -0.00013811886310577393, -0.00012203305959701538, -0.00010594725608825684, -8.986145257949829e-05, -7.377564907073975e-05, -5.76898455619812e-05, -4.1604042053222656e-05, -2.551823854446411e-05, -9.432435035705566e-06, 6.6533684730529785e-06, 2.2739171981811523e-05, 3.882497549057007e-05, 5.491077899932861e-05, 7.099658250808716e-05, 8.70823860168457e-05, 0.00010316818952560425, 0.00011925399303436279, 0.00013533979654312134, 0.00015142560005187988, 0.00016751140356063843, 0.00018359720706939697, 0.00019968301057815552, 0.00021576881408691406, 0.0002318546175956726, 0.00024794042110443115, 0.0002640262246131897, 0.00028011202812194824, 0.0002961978316307068, 0.00031228363513946533, 0.0003283694386482239, 0.0003444552421569824, 0.00036054104566574097, 0.0003766268491744995, 0.00039271265268325806, 0.0004087984561920166, 0.00042488425970077515, 0.0004409700632095337, 0.00045705586671829224, 0.0004731416702270508]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 1.0, 5.0, 8.0, 12.0, 15.0, 14.0, 14.0, 11.0, 20.0, 33.0, 24.0, 22.0, 26.0, 37.0, 33.0, 41.0, 39.0, 39.0, 43.0, 34.0, 45.0, 46.0, 55.0, 46.0, 43.0, 41.0, 33.0, 30.0, 26.0, 23.0, 26.0, 23.0, 16.0, 19.0, 19.0, 8.0, 6.0, 4.0, 7.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.83984375, -5.64495849609375, -5.4500732421875, -5.25518798828125, -5.060302734375, -4.86541748046875, -4.6705322265625, -4.47564697265625, -4.28076171875, -4.08587646484375, -3.8909912109375, -3.69610595703125, -3.501220703125, -3.30633544921875, -3.1114501953125, -2.91656494140625, -2.7216796875, -2.52679443359375, -2.3319091796875, -2.13702392578125, -1.942138671875, -1.74725341796875, -1.5523681640625, -1.35748291015625, -1.16259765625, -0.96771240234375, -0.7728271484375, -0.57794189453125, -0.383056640625, -0.18817138671875, 0.0067138671875, 0.20159912109375, 0.396484375, 0.59136962890625, 0.7862548828125, 0.98114013671875, 1.176025390625, 1.37091064453125, 1.5657958984375, 1.76068115234375, 1.95556640625, 2.15045166015625, 2.3453369140625, 2.54022216796875, 2.735107421875, 2.92999267578125, 3.1248779296875, 3.31976318359375, 3.5146484375, 3.70953369140625, 3.9044189453125, 4.09930419921875, 4.294189453125, 4.48907470703125, 4.6839599609375, 4.87884521484375, 5.07373046875, 5.26861572265625, 5.4635009765625, 5.65838623046875, 5.853271484375, 6.04815673828125, 6.2430419921875, 6.43792724609375, 6.6328125]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 5.0, 7.0, 10.0, 6.0, 11.0, 9.0, 22.0, 29.0, 45.0, 51.0, 81.0, 106.0, 166.0, 228.0, 348.0, 548.0, 910.0, 1476.0, 2709.0, 5431.0, 12255.0, 30655.0, 104704.0, 471814.0, 307115.0, 67895.0, 22397.0, 9278.0, 4458.0, 2206.0, 1284.0, 737.0, 517.0, 293.0, 205.0, 172.0, 114.0, 66.0, 56.0, 40.0, 28.0, 21.0, 18.0, 12.0, 13.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.35546875, -4.21868896484375, -4.0819091796875, -3.94512939453125, -3.808349609375, -3.67156982421875, -3.5347900390625, -3.39801025390625, -3.26123046875, -3.12445068359375, -2.9876708984375, -2.85089111328125, -2.714111328125, -2.57733154296875, -2.4405517578125, -2.30377197265625, -2.1669921875, -2.03021240234375, -1.8934326171875, -1.75665283203125, -1.619873046875, -1.48309326171875, -1.3463134765625, -1.20953369140625, -1.07275390625, -0.93597412109375, -0.7991943359375, -0.66241455078125, -0.525634765625, -0.38885498046875, -0.2520751953125, -0.11529541015625, 0.021484375, 0.15826416015625, 0.2950439453125, 0.43182373046875, 0.568603515625, 0.70538330078125, 0.8421630859375, 0.97894287109375, 1.11572265625, 1.25250244140625, 1.3892822265625, 1.52606201171875, 1.662841796875, 1.79962158203125, 1.9364013671875, 2.07318115234375, 2.2099609375, 2.34674072265625, 2.4835205078125, 2.62030029296875, 2.757080078125, 2.89385986328125, 3.0306396484375, 3.16741943359375, 3.30419921875, 3.44097900390625, 3.5777587890625, 3.71453857421875, 3.851318359375, 3.98809814453125, 4.1248779296875, 4.26165771484375, 4.3984375]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 8.0, 3.0, 5.0, 10.0, 8.0, 9.0, 20.0, 22.0, 20.0, 22.0, 26.0, 36.0, 36.0, 45.0, 32.0, 55.0, 60.0, 67.0, 162.0, 1857.0, 119.0, 55.0, 43.0, 37.0, 45.0, 40.0, 34.0, 37.0, 23.0, 23.0, 21.0, 12.0, 11.0, 14.0, 9.0, 10.0, 4.0, 4.0, 6.0, 8.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.9375, -24.251953125, -23.56640625, -22.880859375, -22.1953125, -21.509765625, -20.82421875, -20.138671875, -19.453125, -18.767578125, -18.08203125, -17.396484375, -16.7109375, -16.025390625, -15.33984375, -14.654296875, -13.96875, -13.283203125, -12.59765625, -11.912109375, -11.2265625, -10.541015625, -9.85546875, -9.169921875, -8.484375, -7.798828125, -7.11328125, -6.427734375, -5.7421875, -5.056640625, -4.37109375, -3.685546875, -3.0, -2.314453125, -1.62890625, -0.943359375, -0.2578125, 0.427734375, 1.11328125, 1.798828125, 2.484375, 3.169921875, 3.85546875, 4.541015625, 5.2265625, 5.912109375, 6.59765625, 7.283203125, 7.96875, 8.654296875, 9.33984375, 10.025390625, 10.7109375, 11.396484375, 12.08203125, 12.767578125, 13.453125, 14.138671875, 14.82421875, 15.509765625, 16.1953125, 16.880859375, 17.56640625, 18.251953125, 18.9375]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 3.0, 6.0, 6.0, 7.0, 9.0, 13.0, 10.0, 10.0, 20.0, 18.0, 22.0, 38.0, 42.0, 58.0, 88.0, 111.0, 149.0, 274.0, 659.0, 3229.0, 267982.0, 2865153.0, 5869.0, 880.0, 370.0, 209.0, 114.0, 72.0, 56.0, 41.0, 29.0, 29.0, 26.0, 20.0, 19.0, 19.0, 9.0, 10.0, 7.0, 4.0, 2.0, 8.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.65625, -28.6376953125, -27.619140625, -26.6005859375, -25.58203125, -24.5634765625, -23.544921875, -22.5263671875, -21.5078125, -20.4892578125, -19.470703125, -18.4521484375, -17.43359375, -16.4150390625, -15.396484375, -14.3779296875, -13.359375, -12.3408203125, -11.322265625, -10.3037109375, -9.28515625, -8.2666015625, -7.248046875, -6.2294921875, -5.2109375, -4.1923828125, -3.173828125, -2.1552734375, -1.13671875, -0.1181640625, 0.900390625, 1.9189453125, 2.9375, 3.9560546875, 4.974609375, 5.9931640625, 7.01171875, 8.0302734375, 9.048828125, 10.0673828125, 11.0859375, 12.1044921875, 13.123046875, 14.1416015625, 15.16015625, 16.1787109375, 17.197265625, 18.2158203125, 19.234375, 20.2529296875, 21.271484375, 22.2900390625, 23.30859375, 24.3271484375, 25.345703125, 26.3642578125, 27.3828125, 28.4013671875, 29.419921875, 30.4384765625, 31.45703125, 32.4755859375, 33.494140625, 34.5126953125, 35.53125]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 39.0, 641.0, 324.0, 10.0], "bins": [-212.79217529296875, -209.34825134277344, -205.90432739257812, -202.46038818359375, -199.01646423339844, -195.57254028320312, -192.1286163330078, -188.6846923828125, -185.24075317382812, -181.7968292236328, -178.3529052734375, -174.90896606445312, -171.4650421142578, -168.0211181640625, -164.5771942138672, -161.13327026367188, -157.6893310546875, -154.2454071044922, -150.80148315429688, -147.3575439453125, -143.9136199951172, -140.46969604492188, -137.02577209472656, -133.58184814453125, -130.13792419433594, -126.69400024414062, -123.25006866455078, -119.80614471435547, -116.36221313476562, -112.91828918457031, -109.474365234375, -106.03043365478516, -102.58650207519531, -99.142578125, -95.69864654541016, -92.25472259521484, -88.810791015625, -85.36686706542969, -81.92294311523438, -78.47901153564453, -75.03507995605469, -71.59115600585938, -68.14722442626953, -64.70330047607422, -61.259368896484375, -57.81544494628906, -54.371517181396484, -50.927589416503906, -47.48366165161133, -44.03973388671875, -40.59580612182617, -37.151878356933594, -33.70795440673828, -30.26402473449707, -26.820098876953125, -23.376171112060547, -19.93224334716797, -16.48831558227539, -13.044388771057129, -9.600461959838867, -6.156534194946289, -2.712606430053711, 0.7313194274902344, 4.1752471923828125, 7.619174003601074]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 7.0, 3.0, 6.0, 7.0, 12.0, 7.0, 11.0, 16.0, 25.0, 17.0, 15.0, 21.0, 21.0, 27.0, 28.0, 27.0, 28.0, 42.0, 42.0, 45.0, 37.0, 43.0, 26.0, 31.0, 30.0, 30.0, 34.0, 32.0, 34.0, 30.0, 20.0, 31.0, 26.0, 26.0, 23.0, 20.0, 19.0, 21.0, 17.0, 10.0, 14.0, 8.0, 6.0, 5.0, 9.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 3.0, 4.0], "bins": [-63.172271728515625, -61.31330871582031, -59.454345703125, -57.59538269042969, -55.736419677734375, -53.87745666503906, -52.01849365234375, -50.15953063964844, -48.300567626953125, -46.44160461425781, -44.5826416015625, -42.72367858886719, -40.864715576171875, -39.00575256347656, -37.14678955078125, -35.28782653808594, -33.42886734008789, -31.569904327392578, -29.710941314697266, -27.851978302001953, -25.99301528930664, -24.134052276611328, -22.27509117126465, -20.416128158569336, -18.557165145874023, -16.69820213317871, -14.839239120483398, -12.980277061462402, -11.12131404876709, -9.262351036071777, -7.403388977050781, -5.544425964355469, -3.685466766357422, -1.8265039920806885, 0.03245878219604492, 1.8914213180541992, 3.7503843307495117, 5.609347343444824, 7.46830940246582, 9.327272415161133, 11.186235427856445, 13.045198440551758, 14.90416145324707, 16.76312255859375, 18.622085571289062, 20.481048583984375, 22.340011596679688, 24.198974609375, 26.057937622070312, 27.916900634765625, 29.775863647460938, 31.63482666015625, 33.49378967285156, 35.352752685546875, 37.21171569824219, 39.0706787109375, 40.92964172363281, 42.788604736328125, 44.64756774902344, 46.50653076171875, 48.36549377441406, 50.224456787109375, 52.08341979980469, 53.9423828125, 55.80134201049805]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 6.0, 7.0, 9.0, 15.0, 13.0, 13.0, 15.0, 20.0, 20.0, 31.0, 22.0, 27.0, 38.0, 40.0, 34.0, 43.0, 39.0, 37.0, 36.0, 45.0, 58.0, 45.0, 49.0, 47.0, 38.0, 34.0, 34.0, 22.0, 26.0, 17.0, 22.0, 21.0, 15.0, 18.0, 15.0, 4.0, 7.0, 5.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0390625, -5.8382568359375, -5.637451171875, -5.4366455078125, -5.23583984375, -5.0350341796875, -4.834228515625, -4.6334228515625, -4.4326171875, -4.2318115234375, -4.031005859375, -3.8302001953125, -3.62939453125, -3.4285888671875, -3.227783203125, -3.0269775390625, -2.826171875, -2.6253662109375, -2.424560546875, -2.2237548828125, -2.02294921875, -1.8221435546875, -1.621337890625, -1.4205322265625, -1.2197265625, -1.0189208984375, -0.818115234375, -0.6173095703125, -0.41650390625, -0.2156982421875, -0.014892578125, 0.1859130859375, 0.38671875, 0.5875244140625, 0.788330078125, 0.9891357421875, 1.18994140625, 1.3907470703125, 1.591552734375, 1.7923583984375, 1.9931640625, 2.1939697265625, 2.394775390625, 2.5955810546875, 2.79638671875, 2.9971923828125, 3.197998046875, 3.3988037109375, 3.599609375, 3.8004150390625, 4.001220703125, 4.2020263671875, 4.40283203125, 4.6036376953125, 4.804443359375, 5.0052490234375, 5.2060546875, 5.4068603515625, 5.607666015625, 5.8084716796875, 6.00927734375, 6.2100830078125, 6.410888671875, 6.6116943359375, 6.8125]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 7.0, 7.0, 5.0, 14.0, 11.0, 16.0, 20.0, 21.0, 26.0, 56.0, 80.0, 164.0, 309.0, 621.0, 1497.0, 4457.0, 16046.0, 82897.0, 729731.0, 2446273.0, 794242.0, 94145.0, 16699.0, 4306.0, 1391.0, 536.0, 283.0, 133.0, 80.0, 54.0, 32.0, 22.0, 25.0, 20.0, 16.0, 12.0, 6.0, 7.0, 2.0, 8.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.2890625, -11.899169921875, -11.50927734375, -11.119384765625, -10.7294921875, -10.339599609375, -9.94970703125, -9.559814453125, -9.169921875, -8.780029296875, -8.39013671875, -8.000244140625, -7.6103515625, -7.220458984375, -6.83056640625, -6.440673828125, -6.05078125, -5.660888671875, -5.27099609375, -4.881103515625, -4.4912109375, -4.101318359375, -3.71142578125, -3.321533203125, -2.931640625, -2.541748046875, -2.15185546875, -1.761962890625, -1.3720703125, -0.982177734375, -0.59228515625, -0.202392578125, 0.1875, 0.577392578125, 0.96728515625, 1.357177734375, 1.7470703125, 2.136962890625, 2.52685546875, 2.916748046875, 3.306640625, 3.696533203125, 4.08642578125, 4.476318359375, 4.8662109375, 5.256103515625, 5.64599609375, 6.035888671875, 6.42578125, 6.815673828125, 7.20556640625, 7.595458984375, 7.9853515625, 8.375244140625, 8.76513671875, 9.155029296875, 9.544921875, 9.934814453125, 10.32470703125, 10.714599609375, 11.1044921875, 11.494384765625, 11.88427734375, 12.274169921875, 12.6640625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 7.0, 10.0, 14.0, 21.0, 21.0, 39.0, 50.0, 81.0, 107.0, 139.0, 189.0, 258.0, 420.0, 577.0, 554.0, 478.0, 339.0, 235.0, 143.0, 107.0, 84.0, 63.0, 37.0, 29.0, 22.0, 17.0, 11.0, 8.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.515625, -18.890380859375, -18.26513671875, -17.639892578125, -17.0146484375, -16.389404296875, -15.76416015625, -15.138916015625, -14.513671875, -13.888427734375, -13.26318359375, -12.637939453125, -12.0126953125, -11.387451171875, -10.76220703125, -10.136962890625, -9.51171875, -8.886474609375, -8.26123046875, -7.635986328125, -7.0107421875, -6.385498046875, -5.76025390625, -5.135009765625, -4.509765625, -3.884521484375, -3.25927734375, -2.634033203125, -2.0087890625, -1.383544921875, -0.75830078125, -0.133056640625, 0.4921875, 1.117431640625, 1.74267578125, 2.367919921875, 2.9931640625, 3.618408203125, 4.24365234375, 4.868896484375, 5.494140625, 6.119384765625, 6.74462890625, 7.369873046875, 7.9951171875, 8.620361328125, 9.24560546875, 9.870849609375, 10.49609375, 11.121337890625, 11.74658203125, 12.371826171875, 12.9970703125, 13.622314453125, 14.24755859375, 14.872802734375, 15.498046875, 16.123291015625, 16.74853515625, 17.373779296875, 17.9990234375, 18.624267578125, 19.24951171875, 19.874755859375, 20.5]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 6.0, 2.0, 4.0, 2.0, 7.0, 6.0, 9.0, 11.0, 14.0, 11.0, 17.0, 38.0, 26.0, 40.0, 49.0, 61.0, 73.0, 112.0, 178.0, 250.0, 484.0, 1149.0, 7787.0, 304715.0, 3818826.0, 55206.0, 3285.0, 723.0, 373.0, 216.0, 147.0, 90.0, 78.0, 75.0, 40.0, 36.0, 24.0, 22.0, 28.0, 15.0, 11.0, 9.0, 9.0, 5.0, 5.0, 6.0, 3.0, 0.0, 3.0, 1.0, 3.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-49.34375, -47.66015625, -45.9765625, -44.29296875, -42.609375, -40.92578125, -39.2421875, -37.55859375, -35.875, -34.19140625, -32.5078125, -30.82421875, -29.140625, -27.45703125, -25.7734375, -24.08984375, -22.40625, -20.72265625, -19.0390625, -17.35546875, -15.671875, -13.98828125, -12.3046875, -10.62109375, -8.9375, -7.25390625, -5.5703125, -3.88671875, -2.203125, -0.51953125, 1.1640625, 2.84765625, 4.53125, 6.21484375, 7.8984375, 9.58203125, 11.265625, 12.94921875, 14.6328125, 16.31640625, 18.0, 19.68359375, 21.3671875, 23.05078125, 24.734375, 26.41796875, 28.1015625, 29.78515625, 31.46875, 33.15234375, 34.8359375, 36.51953125, 38.203125, 39.88671875, 41.5703125, 43.25390625, 44.9375, 46.62109375, 48.3046875, 49.98828125, 51.671875, 53.35546875, 55.0390625, 56.72265625, 58.40625]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 11.0, 21.0, 55.0, 127.0, 174.0, 221.0, 201.0, 108.0, 51.0, 27.0, 11.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-108.68533325195312, -105.13290405273438, -101.58047485351562, -98.02804565429688, -94.47562408447266, -90.9231948852539, -87.37076568603516, -83.8183364868164, -80.26591491699219, -76.71348571777344, -73.16105651855469, -69.60862731933594, -66.05620574951172, -62.50377655029297, -58.95134735107422, -55.39891815185547, -51.84648895263672, -48.29405975341797, -44.741634368896484, -41.189205169677734, -37.63677978515625, -34.0843505859375, -30.53192138671875, -26.979494094848633, -23.427066802978516, -19.8746395111084, -16.32221221923828, -12.769783020019531, -9.217355728149414, -5.664928436279297, -2.112499237060547, 1.4399280548095703, 4.992362976074219, 8.544790267944336, 12.09721851348877, 15.649646759033203, 19.20207405090332, 22.754501342773438, 26.306930541992188, 29.859357833862305, 33.41178512573242, 36.96421432495117, 40.516639709472656, 44.069068908691406, 47.621498107910156, 51.17392349243164, 54.72635269165039, 58.278778076171875, 61.831207275390625, 65.38363647460938, 68.93606567382812, 72.48849487304688, 76.0409164428711, 79.59334564208984, 83.1457748413086, 86.69820404052734, 90.25062561035156, 93.80305480957031, 97.35548400878906, 100.90791320800781, 104.46033477783203, 108.01276397705078, 111.56519317626953, 115.11762237548828, 118.67005157470703]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 7.0, 1.0, 0.0, 4.0, 7.0, 8.0, 16.0, 16.0, 11.0, 17.0, 12.0, 17.0, 30.0, 24.0, 39.0, 38.0, 38.0, 48.0, 32.0, 49.0, 43.0, 35.0, 43.0, 46.0, 40.0, 42.0, 57.0, 39.0, 32.0, 30.0, 41.0, 19.0, 21.0, 19.0, 21.0, 18.0, 10.0, 9.0, 5.0, 5.0, 3.0, 4.0, 2.0, 3.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.154117584228516, -58.234718322753906, -56.31531524658203, -54.39591598510742, -52.47651290893555, -50.55711364746094, -48.63771057128906, -46.71831130981445, -44.798912048339844, -42.879512786865234, -40.96010971069336, -39.04071044921875, -37.121307373046875, -35.201908111572266, -33.282508850097656, -31.36310577392578, -29.443702697753906, -27.524301528930664, -25.604900360107422, -23.685501098632812, -21.766098022460938, -19.846698760986328, -17.927297592163086, -16.007896423339844, -14.088495254516602, -12.16909408569336, -10.249692916870117, -8.330292701721191, -6.410891532897949, -4.491490364074707, -2.5720901489257812, -0.6526889801025391, 1.2667160034179688, 3.186116933822632, 5.105517864227295, 7.024918556213379, 8.944319725036621, 10.863720893859863, 12.783121109008789, 14.702522277832031, 16.621923446655273, 18.541324615478516, 20.460725784301758, 22.380126953125, 24.29952621459961, 26.218929290771484, 28.138328552246094, 30.057729721069336, 31.977130889892578, 33.89653015136719, 35.81593322753906, 37.73533248901367, 39.65473556518555, 41.574134826660156, 43.49353790283203, 45.41293716430664, 47.33233642578125, 49.25173568725586, 51.171138763427734, 53.090538024902344, 55.00994110107422, 56.92934036254883, 58.84873962402344, 60.76814270019531, 62.68754577636719]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 10.0, 4.0, 9.0, 11.0, 13.0, 12.0, 15.0, 16.0, 29.0, 22.0, 27.0, 21.0, 35.0, 41.0, 33.0, 40.0, 46.0, 39.0, 45.0, 51.0, 31.0, 44.0, 52.0, 47.0, 44.0, 34.0, 27.0, 29.0, 35.0, 29.0, 18.0, 20.0, 15.0, 11.0, 10.0, 10.0, 11.0, 5.0, 3.0, 1.0, 3.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6875, -6.48150634765625, -6.2755126953125, -6.06951904296875, -5.863525390625, -5.65753173828125, -5.4515380859375, -5.24554443359375, -5.03955078125, -4.83355712890625, -4.6275634765625, -4.42156982421875, -4.215576171875, -4.00958251953125, -3.8035888671875, -3.59759521484375, -3.3916015625, -3.18560791015625, -2.9796142578125, -2.77362060546875, -2.567626953125, -2.36163330078125, -2.1556396484375, -1.94964599609375, -1.74365234375, -1.53765869140625, -1.3316650390625, -1.12567138671875, -0.919677734375, -0.71368408203125, -0.5076904296875, -0.30169677734375, -0.095703125, 0.11029052734375, 0.3162841796875, 0.52227783203125, 0.728271484375, 0.93426513671875, 1.1402587890625, 1.34625244140625, 1.55224609375, 1.75823974609375, 1.9642333984375, 2.17022705078125, 2.376220703125, 2.58221435546875, 2.7882080078125, 2.99420166015625, 3.2001953125, 3.40618896484375, 3.6121826171875, 3.81817626953125, 4.024169921875, 4.23016357421875, 4.4361572265625, 4.64215087890625, 4.84814453125, 5.05413818359375, 5.2601318359375, 5.46612548828125, 5.672119140625, 5.87811279296875, 6.0841064453125, 6.29010009765625, 6.49609375]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 10.0, 8.0, 14.0, 16.0, 28.0, 39.0, 47.0, 87.0, 115.0, 150.0, 229.0, 298.0, 493.0, 730.0, 1093.0, 1545.0, 2266.0, 3231.0, 4886.0, 6998.0, 10406.0, 15536.0, 23018.0, 34757.0, 53455.0, 83133.0, 129901.0, 194971.0, 168794.0, 108059.0, 69322.0, 44760.0, 29310.0, 19771.0, 13135.0, 8878.0, 6074.0, 4118.0, 2789.0, 1916.0, 1361.0, 858.0, 622.0, 387.0, 316.0, 184.0, 147.0, 81.0, 74.0, 42.0, 34.0, 24.0, 17.0, 15.0, 4.0, 2.0, 4.0, 4.0], "bins": [-0.85888671875, -0.8334732055664062, -0.8080596923828125, -0.7826461791992188, -0.757232666015625, -0.7318191528320312, -0.7064056396484375, -0.6809921264648438, -0.65557861328125, -0.6301651000976562, -0.6047515869140625, -0.5793380737304688, -0.553924560546875, -0.5285110473632812, -0.5030975341796875, -0.47768402099609375, -0.4522705078125, -0.42685699462890625, -0.4014434814453125, -0.37602996826171875, -0.350616455078125, -0.32520294189453125, -0.2997894287109375, -0.27437591552734375, -0.24896240234375, -0.22354888916015625, -0.1981353759765625, -0.17272186279296875, -0.147308349609375, -0.12189483642578125, -0.0964813232421875, -0.07106781005859375, -0.045654296875, -0.02024078369140625, 0.0051727294921875, 0.03058624267578125, 0.055999755859375, 0.08141326904296875, 0.1068267822265625, 0.13224029541015625, 0.15765380859375, 0.18306732177734375, 0.2084808349609375, 0.23389434814453125, 0.259307861328125, 0.28472137451171875, 0.3101348876953125, 0.33554840087890625, 0.3609619140625, 0.38637542724609375, 0.4117889404296875, 0.43720245361328125, 0.462615966796875, 0.48802947998046875, 0.5134429931640625, 0.5388565063476562, 0.56427001953125, 0.5896835327148438, 0.6150970458984375, 0.6405105590820312, 0.665924072265625, 0.6913375854492188, 0.7167510986328125, 0.7421646118164062, 0.767578125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 6.0, 0.0, 6.0, 3.0, 4.0, 6.0, 5.0, 8.0, 10.0, 13.0, 9.0, 13.0, 15.0, 29.0, 15.0, 27.0, 26.0, 34.0, 41.0, 42.0, 35.0, 38.0, 42.0, 29.0, 45.0, 32.0, 1072.0, 43.0, 35.0, 42.0, 31.0, 25.0, 31.0, 29.0, 23.0, 25.0, 32.0, 17.0, 17.0, 12.0, 16.0, 13.0, 8.0, 9.0, 6.0, 5.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.578125, -3.45892333984375, -3.3397216796875, -3.22052001953125, -3.101318359375, -2.98211669921875, -2.8629150390625, -2.74371337890625, -2.62451171875, -2.50531005859375, -2.3861083984375, -2.26690673828125, -2.147705078125, -2.02850341796875, -1.9093017578125, -1.79010009765625, -1.6708984375, -1.55169677734375, -1.4324951171875, -1.31329345703125, -1.194091796875, -1.07489013671875, -0.9556884765625, -0.83648681640625, -0.71728515625, -0.59808349609375, -0.4788818359375, -0.35968017578125, -0.240478515625, -0.12127685546875, -0.0020751953125, 0.11712646484375, 0.236328125, 0.35552978515625, 0.4747314453125, 0.59393310546875, 0.713134765625, 0.83233642578125, 0.9515380859375, 1.07073974609375, 1.18994140625, 1.30914306640625, 1.4283447265625, 1.54754638671875, 1.666748046875, 1.78594970703125, 1.9051513671875, 2.02435302734375, 2.1435546875, 2.26275634765625, 2.3819580078125, 2.50115966796875, 2.620361328125, 2.73956298828125, 2.8587646484375, 2.97796630859375, 3.09716796875, 3.21636962890625, 3.3355712890625, 3.45477294921875, 3.573974609375, 3.69317626953125, 3.8123779296875, 3.93157958984375, 4.05078125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 8.0, 14.0, 20.0, 25.0, 37.0, 59.0, 91.0, 168.0, 208.0, 324.0, 524.0, 803.0, 1189.0, 1887.0, 2908.0, 4392.0, 6967.0, 10612.0, 16581.0, 25456.0, 40176.0, 63115.0, 100232.0, 156474.0, 1251585.0, 150536.0, 95168.0, 60107.0, 38257.0, 24304.0, 15801.0, 10185.0, 6650.0, 4226.0, 2780.0, 1878.0, 1214.0, 757.0, 547.0, 315.0, 180.0, 132.0, 97.0, 49.0, 35.0, 31.0, 16.0, 6.0, 6.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.728515625, -0.70458984375, -0.6806640625, -0.65673828125, -0.6328125, -0.60888671875, -0.5849609375, -0.56103515625, -0.537109375, -0.51318359375, -0.4892578125, -0.46533203125, -0.44140625, -0.41748046875, -0.3935546875, -0.36962890625, -0.345703125, -0.32177734375, -0.2978515625, -0.27392578125, -0.25, -0.22607421875, -0.2021484375, -0.17822265625, -0.154296875, -0.13037109375, -0.1064453125, -0.08251953125, -0.05859375, -0.03466796875, -0.0107421875, 0.01318359375, 0.037109375, 0.06103515625, 0.0849609375, 0.10888671875, 0.1328125, 0.15673828125, 0.1806640625, 0.20458984375, 0.228515625, 0.25244140625, 0.2763671875, 0.30029296875, 0.32421875, 0.34814453125, 0.3720703125, 0.39599609375, 0.419921875, 0.44384765625, 0.4677734375, 0.49169921875, 0.515625, 0.53955078125, 0.5634765625, 0.58740234375, 0.611328125, 0.63525390625, 0.6591796875, 0.68310546875, 0.70703125, 0.73095703125, 0.7548828125, 0.77880859375, 0.802734375]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 7.0, 8.0, 5.0, 8.0, 14.0, 14.0, 11.0, 27.0, 20.0, 30.0, 32.0, 53.0, 42.0, 48.0, 78.0, 76.0, 60.0, 55.0, 65.0, 60.0, 56.0, 37.0, 35.0, 38.0, 27.0, 22.0, 14.0, 11.0, 10.0, 13.0, 10.0, 5.0, 3.0, 4.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014467239379882812, -0.001399114727973938, -0.0013515055179595947, -0.0013038963079452515, -0.0012562870979309082, -0.001208677887916565, -0.0011610686779022217, -0.0011134594678878784, -0.0010658502578735352, -0.001018241047859192, -0.0009706318378448486, -0.0009230226278305054, -0.0008754134178161621, -0.0008278042078018188, -0.0007801949977874756, -0.0007325857877731323, -0.0006849765777587891, -0.0006373673677444458, -0.0005897581577301025, -0.0005421489477157593, -0.000494539737701416, -0.00044693052768707275, -0.0003993213176727295, -0.00035171210765838623, -0.00030410289764404297, -0.0002564936876296997, -0.00020888447761535645, -0.00016127526760101318, -0.00011366605758666992, -6.605684757232666e-05, -1.84476375579834e-05, 2.9161572456359863e-05, 7.677078247070312e-05, 0.0001243799924850464, 0.00017198920249938965, 0.0002195984125137329, 0.00026720762252807617, 0.00031481683254241943, 0.0003624260425567627, 0.00041003525257110596, 0.0004576444625854492, 0.0005052536725997925, 0.0005528628826141357, 0.000600472092628479, 0.0006480813026428223, 0.0006956905126571655, 0.0007432997226715088, 0.000790908932685852, 0.0008385181427001953, 0.0008861273527145386, 0.0009337365627288818, 0.000981345772743225, 0.0010289549827575684, 0.0010765641927719116, 0.0011241734027862549, 0.0011717826128005981, 0.0012193918228149414, 0.0012670010328292847, 0.001314610242843628, 0.0013622194528579712, 0.0014098286628723145, 0.0014574378728866577, 0.001505047082901001, 0.0015526562929153442, 0.0016002655029296875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 6.0, 4.0, 8.0, 9.0, 8.0, 16.0, 28.0, 37.0, 53.0, 85.0, 105.0, 148.0, 227.0, 380.0, 1016.0, 243418.0, 800426.0, 1392.0, 428.0, 220.0, 177.0, 114.0, 59.0, 50.0, 37.0, 29.0, 19.0, 19.0, 12.0, 8.0, 3.0, 2.0, 3.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.040985107421875, -0.039879560470581055, -0.03877401351928711, -0.037668466567993164, -0.03656291961669922, -0.03545737266540527, -0.03435182571411133, -0.03324627876281738, -0.03214073181152344, -0.031035184860229492, -0.029929637908935547, -0.0288240909576416, -0.027718544006347656, -0.02661299705505371, -0.025507450103759766, -0.02440190315246582, -0.023296356201171875, -0.02219080924987793, -0.021085262298583984, -0.01997971534729004, -0.018874168395996094, -0.01776862144470215, -0.016663074493408203, -0.015557527542114258, -0.014451980590820312, -0.013346433639526367, -0.012240886688232422, -0.011135339736938477, -0.010029792785644531, -0.008924245834350586, -0.00781869888305664, -0.006713151931762695, -0.00560760498046875, -0.004502058029174805, -0.0033965110778808594, -0.002290964126586914, -0.0011854171752929688, -7.987022399902344e-05, 0.0010256767272949219, 0.002131223678588867, 0.0032367706298828125, 0.004342317581176758, 0.005447864532470703, 0.0065534114837646484, 0.007658958435058594, 0.008764505386352539, 0.009870052337646484, 0.01097559928894043, 0.012081146240234375, 0.01318669319152832, 0.014292240142822266, 0.015397787094116211, 0.016503334045410156, 0.0176088809967041, 0.018714427947998047, 0.019819974899291992, 0.020925521850585938, 0.022031068801879883, 0.023136615753173828, 0.024242162704467773, 0.02534770965576172, 0.026453256607055664, 0.02755880355834961, 0.028664350509643555, 0.0297698974609375]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 11.0, 44.0, 94.0, 236.0, 290.0, 207.0, 87.0, 29.0, 11.0, 2.0, 2.0], "bins": [-0.0037928707897663116, -0.0037267417646944523, -0.003660612739622593, -0.00359448348172009, -0.0035283544566482306, -0.003462225431576371, -0.003396096173673868, -0.003329967148602009, -0.0032638381235301495, -0.00319770909845829, -0.0031315800733864307, -0.0030654508154839277, -0.0029993217904120684, -0.002933192765340209, -0.002867063507437706, -0.0028009344823658466, -0.0027348054572939873, -0.002668676432222128, -0.0026025474071502686, -0.0025364181492477655, -0.002470289124175906, -0.002404160099104047, -0.002338030841201544, -0.0022719018161296844, -0.002205772791057825, -0.0021396437659859657, -0.0020735147409141064, -0.0020073854830116034, -0.001941256457939744, -0.0018751274328678846, -0.0018089982913807034, -0.0017428691498935223, -0.001676740124821663, -0.0016106110997498035, -0.0015444819582626224, -0.0014783528167754412, -0.0014122237917035818, -0.0013460947666317225, -0.0012799656251445413, -0.00121383648365736, -0.0011477074585855007, -0.0010815784335136414, -0.0010154492920264602, -0.0009493202087469399, -0.0008831911254674196, -0.0008170620421878994, -0.0007509329589083791, -0.0006848038756288588, -0.0006186748505569994, -0.0005525457672774792, -0.0004864166839979589, -0.0004202876007184386, -0.00035415851743891835, -0.0002880294341593981, -0.0002219003508798778, -0.00015577126760035753, -8.964218432083726e-05, -2.3513101041316986e-05, 4.261598223820329e-05, 0.00010874506551772356, 0.00017487414879724383, 0.0002410032320767641, 0.0003071323153562844, 0.00037326139863580465, 0.0004393904819153249]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 2.0, 4.0, 1.0, 6.0, 7.0, 14.0, 11.0, 5.0, 11.0, 16.0, 19.0, 17.0, 26.0, 29.0, 25.0, 23.0, 24.0, 21.0, 34.0, 34.0, 27.0, 30.0, 33.0, 28.0, 42.0, 32.0, 34.0, 31.0, 38.0, 31.0, 40.0, 20.0, 39.0, 33.0, 22.0, 22.0, 13.0, 15.0, 25.0, 15.0, 13.0, 11.0, 16.0, 13.0, 11.0, 7.0, 6.0, 9.0, 6.0, 2.0, 3.0, 4.0, 2.0, 2.0, 3.0, 3.0, 1.0], "bins": [-0.000608980655670166, -0.000590234063565731, -0.0005714874714612961, -0.0005527408793568611, -0.0005339942872524261, -0.0005152476951479912, -0.0004965011030435562, -0.00047775451093912125, -0.0004590079188346863, -0.0004402613267302513, -0.00042151473462581635, -0.0004027681425213814, -0.0003840215504169464, -0.00036527495831251144, -0.0003465283662080765, -0.0003277817741036415, -0.00030903518199920654, -0.0002902885898947716, -0.0002715419977903366, -0.00025279540568590164, -0.00023404881358146667, -0.0002153022214770317, -0.00019655562937259674, -0.00017780903726816177, -0.0001590624451637268, -0.00014031585305929184, -0.00012156926095485687, -0.0001028226688504219, -8.407607674598694e-05, -6.532948464155197e-05, -4.6582892537117004e-05, -2.7836300432682037e-05, -9.08970832824707e-06, 9.656883776187897e-06, 2.8403475880622864e-05, 4.715006798505783e-05, 6.58966600894928e-05, 8.464325219392776e-05, 0.00010338984429836273, 0.0001221364364027977, 0.00014088302850723267, 0.00015962962061166763, 0.0001783762127161026, 0.00019712280482053757, 0.00021586939692497253, 0.0002346159890294075, 0.00025336258113384247, 0.00027210917323827744, 0.0002908557653427124, 0.00030960235744714737, 0.00032834894955158234, 0.0003470955416560173, 0.00036584213376045227, 0.00038458872586488724, 0.0004033353179693222, 0.00042208191007375717, 0.00044082850217819214, 0.0004595750942826271, 0.00047832168638706207, 0.000497068278491497, 0.000515814870595932, 0.000534561462700367, 0.0005533080548048019, 0.0005720546469092369, 0.0005908012390136719]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 10.0, 4.0, 9.0, 11.0, 13.0, 12.0, 15.0, 16.0, 29.0, 22.0, 27.0, 21.0, 35.0, 41.0, 33.0, 40.0, 46.0, 39.0, 45.0, 51.0, 31.0, 44.0, 52.0, 46.0, 45.0, 34.0, 27.0, 29.0, 35.0, 29.0, 18.0, 20.0, 15.0, 11.0, 10.0, 10.0, 11.0, 5.0, 3.0, 1.0, 3.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6875, -6.48150634765625, -6.2755126953125, -6.06951904296875, -5.863525390625, -5.65753173828125, -5.4515380859375, -5.24554443359375, -5.03955078125, -4.83355712890625, -4.6275634765625, -4.42156982421875, -4.215576171875, -4.00958251953125, -3.8035888671875, -3.59759521484375, -3.3916015625, -3.18560791015625, -2.9796142578125, -2.77362060546875, -2.567626953125, -2.36163330078125, -2.1556396484375, -1.94964599609375, -1.74365234375, -1.53765869140625, -1.3316650390625, -1.12567138671875, -0.919677734375, -0.71368408203125, -0.5076904296875, -0.30169677734375, -0.095703125, 0.11029052734375, 0.3162841796875, 0.52227783203125, 0.728271484375, 0.93426513671875, 1.1402587890625, 1.34625244140625, 1.55224609375, 1.75823974609375, 1.9642333984375, 2.17022705078125, 2.376220703125, 2.58221435546875, 2.7882080078125, 2.99420166015625, 3.2001953125, 3.40618896484375, 3.6121826171875, 3.81817626953125, 4.024169921875, 4.23016357421875, 4.4361572265625, 4.64215087890625, 4.84814453125, 5.05413818359375, 5.2601318359375, 5.46612548828125, 5.672119140625, 5.87811279296875, 6.0841064453125, 6.29010009765625, 6.49609375]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 4.0, 9.0, 6.0, 9.0, 22.0, 14.0, 31.0, 40.0, 52.0, 74.0, 122.0, 145.0, 224.0, 353.0, 512.0, 817.0, 1328.0, 2160.0, 3745.0, 7003.0, 14664.0, 37347.0, 118126.0, 416637.0, 307477.0, 83308.0, 28204.0, 11842.0, 5972.0, 3203.0, 1832.0, 1119.0, 700.0, 482.0, 311.0, 208.0, 135.0, 110.0, 46.0, 42.0, 42.0, 29.0, 15.0, 11.0, 4.0, 7.0, 7.0, 7.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.0078125, -3.88201904296875, -3.7562255859375, -3.63043212890625, -3.504638671875, -3.37884521484375, -3.2530517578125, -3.12725830078125, -3.00146484375, -2.87567138671875, -2.7498779296875, -2.62408447265625, -2.498291015625, -2.37249755859375, -2.2467041015625, -2.12091064453125, -1.9951171875, -1.86932373046875, -1.7435302734375, -1.61773681640625, -1.491943359375, -1.36614990234375, -1.2403564453125, -1.11456298828125, -0.98876953125, -0.86297607421875, -0.7371826171875, -0.61138916015625, -0.485595703125, -0.35980224609375, -0.2340087890625, -0.10821533203125, 0.017578125, 0.14337158203125, 0.2691650390625, 0.39495849609375, 0.520751953125, 0.64654541015625, 0.7723388671875, 0.89813232421875, 1.02392578125, 1.14971923828125, 1.2755126953125, 1.40130615234375, 1.527099609375, 1.65289306640625, 1.7786865234375, 1.90447998046875, 2.0302734375, 2.15606689453125, 2.2818603515625, 2.40765380859375, 2.533447265625, 2.65924072265625, 2.7850341796875, 2.91082763671875, 3.03662109375, 3.16241455078125, 3.2882080078125, 3.41400146484375, 3.539794921875, 3.66558837890625, 3.7913818359375, 3.91717529296875, 4.04296875]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 1.0, 5.0, 6.0, 11.0, 10.0, 9.0, 15.0, 14.0, 15.0, 19.0, 22.0, 27.0, 34.0, 38.0, 51.0, 39.0, 41.0, 55.0, 80.0, 1584.0, 491.0, 76.0, 47.0, 42.0, 33.0, 32.0, 43.0, 30.0, 33.0, 20.0, 26.0, 23.0, 19.0, 12.0, 14.0, 7.0, 5.0, 8.0, 6.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.9375, -22.17236328125, -21.4072265625, -20.64208984375, -19.876953125, -19.11181640625, -18.3466796875, -17.58154296875, -16.81640625, -16.05126953125, -15.2861328125, -14.52099609375, -13.755859375, -12.99072265625, -12.2255859375, -11.46044921875, -10.6953125, -9.93017578125, -9.1650390625, -8.39990234375, -7.634765625, -6.86962890625, -6.1044921875, -5.33935546875, -4.57421875, -3.80908203125, -3.0439453125, -2.27880859375, -1.513671875, -0.74853515625, 0.0166015625, 0.78173828125, 1.546875, 2.31201171875, 3.0771484375, 3.84228515625, 4.607421875, 5.37255859375, 6.1376953125, 6.90283203125, 7.66796875, 8.43310546875, 9.1982421875, 9.96337890625, 10.728515625, 11.49365234375, 12.2587890625, 13.02392578125, 13.7890625, 14.55419921875, 15.3193359375, 16.08447265625, 16.849609375, 17.61474609375, 18.3798828125, 19.14501953125, 19.91015625, 20.67529296875, 21.4404296875, 22.20556640625, 22.970703125, 23.73583984375, 24.5009765625, 25.26611328125, 26.03125]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 6.0, 7.0, 9.0, 6.0, 10.0, 18.0, 22.0, 22.0, 30.0, 36.0, 36.0, 58.0, 71.0, 92.0, 152.0, 285.0, 554.0, 2765.0, 573221.0, 2563095.0, 3719.0, 618.0, 288.0, 139.0, 100.0, 81.0, 63.0, 49.0, 29.0, 20.0, 24.0, 10.0, 11.0, 13.0, 8.0, 10.0, 10.0, 5.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-42.21875, -40.97900390625, -39.7392578125, -38.49951171875, -37.259765625, -36.02001953125, -34.7802734375, -33.54052734375, -32.30078125, -31.06103515625, -29.8212890625, -28.58154296875, -27.341796875, -26.10205078125, -24.8623046875, -23.62255859375, -22.3828125, -21.14306640625, -19.9033203125, -18.66357421875, -17.423828125, -16.18408203125, -14.9443359375, -13.70458984375, -12.46484375, -11.22509765625, -9.9853515625, -8.74560546875, -7.505859375, -6.26611328125, -5.0263671875, -3.78662109375, -2.546875, -1.30712890625, -0.0673828125, 1.17236328125, 2.412109375, 3.65185546875, 4.8916015625, 6.13134765625, 7.37109375, 8.61083984375, 9.8505859375, 11.09033203125, 12.330078125, 13.56982421875, 14.8095703125, 16.04931640625, 17.2890625, 18.52880859375, 19.7685546875, 21.00830078125, 22.248046875, 23.48779296875, 24.7275390625, 25.96728515625, 27.20703125, 28.44677734375, 29.6865234375, 30.92626953125, 32.166015625, 33.40576171875, 34.6455078125, 35.88525390625, 37.125]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [5.0, 167.0, 768.0, 78.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.039982795715332, -5.830307483673096, -1.6206321716308594, 2.589043617248535, 6.798718452453613, 11.008393287658691, 15.218070030212402, 19.427745819091797, 23.637420654296875, 27.847095489501953, 32.05677032470703, 36.266448974609375, 40.47611999511719, 44.68579864501953, 48.89547348022461, 53.10514831542969, 57.314823150634766, 61.524497985839844, 65.73417663574219, 69.94384765625, 74.15352630615234, 78.36319732666016, 82.5728759765625, 86.78254699707031, 90.99222564697266, 95.201904296875, 99.41157531738281, 103.62125396728516, 107.83092498779297, 112.04060363769531, 116.25027465820312, 120.45995330810547, 124.66963195800781, 128.87930297851562, 133.0889892578125, 137.2986602783203, 141.50833129882812, 145.71800231933594, 149.9276885986328, 154.13735961914062, 158.34703063964844, 162.55670166015625, 166.76638793945312, 170.97605895996094, 175.18572998046875, 179.39540100097656, 183.60508728027344, 187.81475830078125, 192.02444458007812, 196.23411560058594, 200.4438018798828, 204.65347290039062, 208.86314392089844, 213.07281494140625, 217.28250122070312, 221.49217224121094, 225.70184326171875, 229.91151428222656, 234.12120056152344, 238.33087158203125, 242.54054260253906, 246.75021362304688, 250.95989990234375, 255.16957092285156, 259.3792419433594]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 8.0, 7.0, 2.0, 7.0, 3.0, 13.0, 7.0, 11.0, 13.0, 19.0, 21.0, 17.0, 16.0, 25.0, 21.0, 24.0, 31.0, 30.0, 24.0, 37.0, 37.0, 41.0, 39.0, 48.0, 35.0, 40.0, 45.0, 43.0, 25.0, 41.0, 44.0, 28.0, 22.0, 20.0, 27.0, 13.0, 15.0, 9.0, 14.0, 17.0, 18.0, 14.0, 7.0, 3.0, 5.0, 9.0, 7.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-72.71269226074219, -70.53578186035156, -68.35887145996094, -66.18196105957031, -64.00505065917969, -61.82814025878906, -59.6512336730957, -57.47432327270508, -55.29741287231445, -53.12050247192383, -50.9435920715332, -48.76668167114258, -46.58977508544922, -44.412864685058594, -42.23595428466797, -40.059043884277344, -37.88213348388672, -35.705223083496094, -33.52831268310547, -31.351404190063477, -29.17449378967285, -26.997583389282227, -24.820674896240234, -22.64376449584961, -20.466854095458984, -18.28994369506836, -16.113033294677734, -13.936124801635742, -11.759214401245117, -9.582304000854492, -7.405394554138184, -5.228485107421875, -3.0515823364257812, -0.8746724128723145, 1.3022375106811523, 3.479147434234619, 5.656057357788086, 7.832967758178711, 10.00987720489502, 12.186786651611328, 14.363697052001953, 16.540607452392578, 18.717517852783203, 20.894426345825195, 23.07133674621582, 25.248247146606445, 27.425155639648438, 29.602066040039062, 31.778976440429688, 33.95588684082031, 36.13279724121094, 38.30970764160156, 40.48661804199219, 42.66352844238281, 44.84043502807617, 47.0173454284668, 49.19425582885742, 51.37116622924805, 53.54807662963867, 55.7249870300293, 57.901893615722656, 60.07880401611328, 62.255714416503906, 64.43262481689453, 66.60953521728516]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 8.0, 7.0, 5.0, 10.0, 10.0, 13.0, 16.0, 10.0, 19.0, 24.0, 19.0, 34.0, 26.0, 31.0, 33.0, 39.0, 36.0, 43.0, 52.0, 32.0, 43.0, 45.0, 47.0, 48.0, 36.0, 47.0, 40.0, 20.0, 33.0, 31.0, 28.0, 24.0, 21.0, 15.0, 9.0, 10.0, 11.0, 12.0, 5.0, 1.0, 3.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.71875, -6.51177978515625, -6.3048095703125, -6.09783935546875, -5.890869140625, -5.68389892578125, -5.4769287109375, -5.26995849609375, -5.06298828125, -4.85601806640625, -4.6490478515625, -4.44207763671875, -4.235107421875, -4.02813720703125, -3.8211669921875, -3.61419677734375, -3.4072265625, -3.20025634765625, -2.9932861328125, -2.78631591796875, -2.579345703125, -2.37237548828125, -2.1654052734375, -1.95843505859375, -1.75146484375, -1.54449462890625, -1.3375244140625, -1.13055419921875, -0.923583984375, -0.71661376953125, -0.5096435546875, -0.30267333984375, -0.095703125, 0.11126708984375, 0.3182373046875, 0.52520751953125, 0.732177734375, 0.93914794921875, 1.1461181640625, 1.35308837890625, 1.56005859375, 1.76702880859375, 1.9739990234375, 2.18096923828125, 2.387939453125, 2.59490966796875, 2.8018798828125, 3.00885009765625, 3.2158203125, 3.42279052734375, 3.6297607421875, 3.83673095703125, 4.043701171875, 4.25067138671875, 4.4576416015625, 4.66461181640625, 4.87158203125, 5.07855224609375, 5.2855224609375, 5.49249267578125, 5.699462890625, 5.90643310546875, 6.1134033203125, 6.32037353515625, 6.52734375]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 7.0, 8.0, 12.0, 13.0, 17.0, 16.0, 17.0, 15.0, 26.0, 28.0, 45.0, 76.0, 111.0, 193.0, 390.0, 1623.0, 8971.0, 108092.0, 2442870.0, 1564272.0, 59460.0, 6003.0, 1107.0, 376.0, 171.0, 94.0, 65.0, 37.0, 29.0, 37.0, 14.0, 16.0, 7.0, 15.0, 12.0, 9.0, 7.0, 5.0, 4.0, 2.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.140625, -20.498046875, -19.85546875, -19.212890625, -18.5703125, -17.927734375, -17.28515625, -16.642578125, -16.0, -15.357421875, -14.71484375, -14.072265625, -13.4296875, -12.787109375, -12.14453125, -11.501953125, -10.859375, -10.216796875, -9.57421875, -8.931640625, -8.2890625, -7.646484375, -7.00390625, -6.361328125, -5.71875, -5.076171875, -4.43359375, -3.791015625, -3.1484375, -2.505859375, -1.86328125, -1.220703125, -0.578125, 0.064453125, 0.70703125, 1.349609375, 1.9921875, 2.634765625, 3.27734375, 3.919921875, 4.5625, 5.205078125, 5.84765625, 6.490234375, 7.1328125, 7.775390625, 8.41796875, 9.060546875, 9.703125, 10.345703125, 10.98828125, 11.630859375, 12.2734375, 12.916015625, 13.55859375, 14.201171875, 14.84375, 15.486328125, 16.12890625, 16.771484375, 17.4140625, 18.056640625, 18.69921875, 19.341796875, 19.984375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 4.0, 3.0, 12.0, 21.0, 22.0, 33.0, 63.0, 101.0, 127.0, 196.0, 268.0, 441.0, 569.0, 624.0, 524.0, 380.0, 231.0, 148.0, 99.0, 74.0, 42.0, 32.0, 26.0, 11.0, 7.0, 6.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.546875, -23.848876953125, -23.15087890625, -22.452880859375, -21.7548828125, -21.056884765625, -20.35888671875, -19.660888671875, -18.962890625, -18.264892578125, -17.56689453125, -16.868896484375, -16.1708984375, -15.472900390625, -14.77490234375, -14.076904296875, -13.37890625, -12.680908203125, -11.98291015625, -11.284912109375, -10.5869140625, -9.888916015625, -9.19091796875, -8.492919921875, -7.794921875, -7.096923828125, -6.39892578125, -5.700927734375, -5.0029296875, -4.304931640625, -3.60693359375, -2.908935546875, -2.2109375, -1.512939453125, -0.81494140625, -0.116943359375, 0.5810546875, 1.279052734375, 1.97705078125, 2.675048828125, 3.373046875, 4.071044921875, 4.76904296875, 5.467041015625, 6.1650390625, 6.863037109375, 7.56103515625, 8.259033203125, 8.95703125, 9.655029296875, 10.35302734375, 11.051025390625, 11.7490234375, 12.447021484375, 13.14501953125, 13.843017578125, 14.541015625, 15.239013671875, 15.93701171875, 16.635009765625, 17.3330078125, 18.031005859375, 18.72900390625, 19.427001953125, 20.125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 3.0, 5.0, 8.0, 18.0, 18.0, 24.0, 36.0, 52.0, 70.0, 97.0, 136.0, 193.0, 345.0, 944.0, 6419.0, 1688217.0, 2487962.0, 7783.0, 932.0, 327.0, 207.0, 134.0, 94.0, 71.0, 52.0, 37.0, 25.0, 24.0, 19.0, 5.0, 5.0, 6.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.78125, -50.58447265625, -48.3876953125, -46.19091796875, -43.994140625, -41.79736328125, -39.6005859375, -37.40380859375, -35.20703125, -33.01025390625, -30.8134765625, -28.61669921875, -26.419921875, -24.22314453125, -22.0263671875, -19.82958984375, -17.6328125, -15.43603515625, -13.2392578125, -11.04248046875, -8.845703125, -6.64892578125, -4.4521484375, -2.25537109375, -0.05859375, 2.13818359375, 4.3349609375, 6.53173828125, 8.728515625, 10.92529296875, 13.1220703125, 15.31884765625, 17.515625, 19.71240234375, 21.9091796875, 24.10595703125, 26.302734375, 28.49951171875, 30.6962890625, 32.89306640625, 35.08984375, 37.28662109375, 39.4833984375, 41.68017578125, 43.876953125, 46.07373046875, 48.2705078125, 50.46728515625, 52.6640625, 54.86083984375, 57.0576171875, 59.25439453125, 61.451171875, 63.64794921875, 65.8447265625, 68.04150390625, 70.23828125, 72.43505859375, 74.6318359375, 76.82861328125, 79.025390625, 81.22216796875, 83.4189453125, 85.61572265625, 87.8125]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 12.0, 46.0, 105.0, 197.0, 272.0, 196.0, 111.0, 52.0, 13.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-163.05514526367188, -158.57041931152344, -154.08570861816406, -149.60098266601562, -145.11627197265625, -140.6315460205078, -136.14682006835938, -131.662109375, -127.17738342285156, -122.69266510009766, -118.20794677734375, -113.72322082519531, -109.2385025024414, -104.7537841796875, -100.26905822753906, -95.78433990478516, -91.29962158203125, -86.81490325927734, -82.33018493652344, -77.845458984375, -73.3607406616211, -68.87602233886719, -64.39129638671875, -59.906578063964844, -55.42185974121094, -50.93714141845703, -46.45241928100586, -41.96769714355469, -37.48297882080078, -32.998260498046875, -28.513538360595703, -24.028818130493164, -19.544097900390625, -15.059377670288086, -10.574657440185547, -6.089937210083008, -1.6052169799804688, 2.8795032501220703, 7.364223480224609, 11.848943710327148, 16.333663940429688, 20.818384170532227, 25.303104400634766, 29.787824630737305, 34.272544860839844, 38.75726318359375, 43.24198532104492, 47.726707458496094, 52.21142578125, 56.696144104003906, 61.18086624145508, 65.66558837890625, 70.15030670166016, 74.63502502441406, 79.1197509765625, 83.6044692993164, 88.08918762207031, 92.57390594482422, 97.05862426757812, 101.54335021972656, 106.02806854248047, 110.51278686523438, 114.99751281738281, 119.48223114013672, 123.96694946289062]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 7.0, 7.0, 11.0, 8.0, 13.0, 11.0, 21.0, 20.0, 22.0, 22.0, 20.0, 25.0, 30.0, 26.0, 26.0, 28.0, 37.0, 36.0, 43.0, 37.0, 32.0, 31.0, 41.0, 44.0, 44.0, 41.0, 35.0, 23.0, 30.0, 24.0, 22.0, 22.0, 21.0, 26.0, 20.0, 20.0, 16.0, 10.0, 10.0, 10.0, 5.0, 8.0, 5.0, 4.0, 3.0, 3.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.805999755859375, -49.17817687988281, -47.550350189208984, -45.922523498535156, -44.294700622558594, -42.66687774658203, -41.0390510559082, -39.411224365234375, -37.78340148925781, -36.15557861328125, -34.52775192260742, -32.899925231933594, -31.27210235595703, -29.644277572631836, -28.01645278930664, -26.388628005981445, -24.76080322265625, -23.132978439331055, -21.50515365600586, -19.877328872680664, -18.24950408935547, -16.621679306030273, -14.993854522705078, -13.366029739379883, -11.738204956054688, -10.110380172729492, -8.482555389404297, -6.854730606079102, -5.226905822753906, -3.599081039428711, -1.9712562561035156, -0.3434314727783203, 1.284393310546875, 2.9122180938720703, 4.540042877197266, 6.167867660522461, 7.795692443847656, 9.423517227172852, 11.051342010498047, 12.679166793823242, 14.306991577148438, 15.934816360473633, 17.562641143798828, 19.190465927124023, 20.81829071044922, 22.446115493774414, 24.07394027709961, 25.701765060424805, 27.32958984375, 28.957414627075195, 30.58523941040039, 32.21306610107422, 33.84088897705078, 35.468711853027344, 37.09653854370117, 38.724365234375, 40.35218811035156, 41.980010986328125, 43.60783767700195, 45.23566436767578, 46.863487243652344, 48.491310119628906, 50.119136810302734, 51.74696350097656, 53.374786376953125]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 9.0, 14.0, 10.0, 7.0, 17.0, 20.0, 16.0, 21.0, 19.0, 30.0, 25.0, 34.0, 29.0, 31.0, 39.0, 41.0, 36.0, 35.0, 46.0, 43.0, 48.0, 39.0, 37.0, 40.0, 32.0, 29.0, 37.0, 29.0, 35.0, 21.0, 23.0, 11.0, 15.0, 21.0, 9.0, 9.0, 12.0, 8.0, 7.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.68359375, -6.48138427734375, -6.2791748046875, -6.07696533203125, -5.874755859375, -5.67254638671875, -5.4703369140625, -5.26812744140625, -5.06591796875, -4.86370849609375, -4.6614990234375, -4.45928955078125, -4.257080078125, -4.05487060546875, -3.8526611328125, -3.65045166015625, -3.4482421875, -3.24603271484375, -3.0438232421875, -2.84161376953125, -2.639404296875, -2.43719482421875, -2.2349853515625, -2.03277587890625, -1.83056640625, -1.62835693359375, -1.4261474609375, -1.22393798828125, -1.021728515625, -0.81951904296875, -0.6173095703125, -0.41510009765625, -0.212890625, -0.01068115234375, 0.1915283203125, 0.39373779296875, 0.595947265625, 0.79815673828125, 1.0003662109375, 1.20257568359375, 1.40478515625, 1.60699462890625, 1.8092041015625, 2.01141357421875, 2.213623046875, 2.41583251953125, 2.6180419921875, 2.82025146484375, 3.0224609375, 3.22467041015625, 3.4268798828125, 3.62908935546875, 3.831298828125, 4.03350830078125, 4.2357177734375, 4.43792724609375, 4.64013671875, 4.84234619140625, 5.0445556640625, 5.24676513671875, 5.448974609375, 5.65118408203125, 5.8533935546875, 6.05560302734375, 6.2578125]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 6.0, 5.0, 12.0, 20.0, 25.0, 26.0, 43.0, 66.0, 100.0, 154.0, 188.0, 256.0, 410.0, 610.0, 863.0, 1221.0, 1764.0, 2702.0, 3810.0, 5770.0, 8495.0, 12696.0, 19409.0, 29798.0, 46139.0, 72337.0, 113949.0, 180878.0, 196869.0, 125031.0, 78774.0, 50229.0, 32163.0, 21011.0, 13904.0, 9401.0, 6178.0, 4119.0, 2787.0, 1977.0, 1382.0, 888.0, 647.0, 432.0, 324.0, 198.0, 159.0, 113.0, 78.0, 52.0, 32.0, 26.0, 11.0, 12.0, 7.0, 3.0, 2.0, 4.0, 3.0, 2.0], "bins": [-0.86572265625, -0.8387527465820312, -0.8117828369140625, -0.7848129272460938, -0.757843017578125, -0.7308731079101562, -0.7039031982421875, -0.6769332885742188, -0.64996337890625, -0.6229934692382812, -0.5960235595703125, -0.5690536499023438, -0.542083740234375, -0.5151138305664062, -0.4881439208984375, -0.46117401123046875, -0.4342041015625, -0.40723419189453125, -0.3802642822265625, -0.35329437255859375, -0.326324462890625, -0.29935455322265625, -0.2723846435546875, -0.24541473388671875, -0.21844482421875, -0.19147491455078125, -0.1645050048828125, -0.13753509521484375, -0.110565185546875, -0.08359527587890625, -0.0566253662109375, -0.02965545654296875, -0.002685546875, 0.02428436279296875, 0.0512542724609375, 0.07822418212890625, 0.105194091796875, 0.13216400146484375, 0.1591339111328125, 0.18610382080078125, 0.21307373046875, 0.24004364013671875, 0.2670135498046875, 0.29398345947265625, 0.320953369140625, 0.34792327880859375, 0.3748931884765625, 0.40186309814453125, 0.4288330078125, 0.45580291748046875, 0.4827728271484375, 0.5097427368164062, 0.536712646484375, 0.5636825561523438, 0.5906524658203125, 0.6176223754882812, 0.64459228515625, 0.6715621948242188, 0.6985321044921875, 0.7255020141601562, 0.752471923828125, 0.7794418334960938, 0.8064117431640625, 0.8333816528320312, 0.8603515625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 0.0, 0.0, 5.0, 4.0, 6.0, 4.0, 5.0, 6.0, 12.0, 5.0, 7.0, 13.0, 20.0, 18.0, 29.0, 24.0, 31.0, 15.0, 33.0, 31.0, 42.0, 35.0, 33.0, 36.0, 49.0, 36.0, 1065.0, 45.0, 43.0, 43.0, 36.0, 29.0, 31.0, 20.0, 32.0, 28.0, 26.0, 19.0, 17.0, 16.0, 17.0, 14.0, 9.0, 13.0, 10.0, 7.0, 5.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.140625, -4.021087646484375, -3.90155029296875, -3.782012939453125, -3.6624755859375, -3.542938232421875, -3.42340087890625, -3.303863525390625, -3.184326171875, -3.064788818359375, -2.94525146484375, -2.825714111328125, -2.7061767578125, -2.586639404296875, -2.46710205078125, -2.347564697265625, -2.22802734375, -2.108489990234375, -1.98895263671875, -1.869415283203125, -1.7498779296875, -1.630340576171875, -1.51080322265625, -1.391265869140625, -1.271728515625, -1.152191162109375, -1.03265380859375, -0.913116455078125, -0.7935791015625, -0.674041748046875, -0.55450439453125, -0.434967041015625, -0.3154296875, -0.195892333984375, -0.07635498046875, 0.043182373046875, 0.1627197265625, 0.282257080078125, 0.40179443359375, 0.521331787109375, 0.640869140625, 0.760406494140625, 0.87994384765625, 0.999481201171875, 1.1190185546875, 1.238555908203125, 1.35809326171875, 1.477630615234375, 1.59716796875, 1.716705322265625, 1.83624267578125, 1.955780029296875, 2.0753173828125, 2.194854736328125, 2.31439208984375, 2.433929443359375, 2.553466796875, 2.673004150390625, 2.79254150390625, 2.912078857421875, 3.0316162109375, 3.151153564453125, 3.27069091796875, 3.390228271484375, 3.509765625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 3.0, 8.0, 13.0, 11.0, 11.0, 24.0, 42.0, 55.0, 91.0, 147.0, 190.0, 298.0, 419.0, 592.0, 951.0, 1467.0, 2134.0, 3223.0, 4615.0, 6981.0, 10335.0, 15839.0, 24434.0, 37499.0, 57957.0, 89813.0, 139460.0, 1247682.0, 159945.0, 102280.0, 66171.0, 43212.0, 27602.0, 17958.0, 11736.0, 7930.0, 5350.0, 3445.0, 2356.0, 1576.0, 1069.0, 741.0, 485.0, 319.0, 216.0, 173.0, 99.0, 70.0, 34.0, 31.0, 23.0, 13.0, 8.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.77490234375, -0.7504196166992188, -0.7259368896484375, -0.7014541625976562, -0.676971435546875, -0.6524887084960938, -0.6280059814453125, -0.6035232543945312, -0.57904052734375, -0.5545578002929688, -0.5300750732421875, -0.5055923461914062, -0.481109619140625, -0.45662689208984375, -0.4321441650390625, -0.40766143798828125, -0.3831787109375, -0.35869598388671875, -0.3342132568359375, -0.30973052978515625, -0.285247802734375, -0.26076507568359375, -0.2362823486328125, -0.21179962158203125, -0.18731689453125, -0.16283416748046875, -0.1383514404296875, -0.11386871337890625, -0.089385986328125, -0.06490325927734375, -0.0404205322265625, -0.01593780517578125, 0.008544921875, 0.03302764892578125, 0.0575103759765625, 0.08199310302734375, 0.106475830078125, 0.13095855712890625, 0.1554412841796875, 0.17992401123046875, 0.20440673828125, 0.22888946533203125, 0.2533721923828125, 0.27785491943359375, 0.302337646484375, 0.32682037353515625, 0.3513031005859375, 0.37578582763671875, 0.4002685546875, 0.42475128173828125, 0.4492340087890625, 0.47371673583984375, 0.498199462890625, 0.5226821899414062, 0.5471649169921875, 0.5716476440429688, 0.59613037109375, 0.6206130981445312, 0.6450958251953125, 0.6695785522460938, 0.694061279296875, 0.7185440063476562, 0.7430267333984375, 0.7675094604492188, 0.7919921875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 7.0, 9.0, 7.0, 8.0, 12.0, 12.0, 11.0, 15.0, 20.0, 20.0, 27.0, 34.0, 42.0, 47.0, 61.0, 63.0, 68.0, 93.0, 74.0, 62.0, 59.0, 42.0, 27.0, 36.0, 24.0, 28.0, 25.0, 17.0, 14.0, 6.0, 8.0, 9.0, 3.0, 0.0, 6.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.0018682479858398438, -0.0018110424280166626, -0.0017538368701934814, -0.0016966313123703003, -0.0016394257545471191, -0.001582220196723938, -0.0015250146389007568, -0.0014678090810775757, -0.0014106035232543945, -0.0013533979654312134, -0.0012961924076080322, -0.001238986849784851, -0.00118178129196167, -0.0011245757341384888, -0.0010673701763153076, -0.0010101646184921265, -0.0009529590606689453, -0.0008957535028457642, -0.000838547945022583, -0.0007813423871994019, -0.0007241368293762207, -0.0006669312715530396, -0.0006097257137298584, -0.0005525201559066772, -0.0004953145980834961, -0.00043810904026031494, -0.0003809034824371338, -0.00032369792461395264, -0.0002664923667907715, -0.00020928680896759033, -0.00015208125114440918, -9.487569332122803e-05, -3.7670135498046875e-05, 1.9535422325134277e-05, 7.674098014831543e-05, 0.00013394653797149658, 0.00019115209579467773, 0.0002483576536178589, 0.00030556321144104004, 0.0003627687692642212, 0.00041997432708740234, 0.0004771798849105835, 0.0005343854427337646, 0.0005915910005569458, 0.000648796558380127, 0.0007060021162033081, 0.0007632076740264893, 0.0008204132318496704, 0.0008776187896728516, 0.0009348243474960327, 0.0009920299053192139, 0.001049235463142395, 0.0011064410209655762, 0.0011636465787887573, 0.0012208521366119385, 0.0012780576944351196, 0.0013352632522583008, 0.001392468810081482, 0.001449674367904663, 0.0015068799257278442, 0.0015640854835510254, 0.0016212910413742065, 0.0016784965991973877, 0.0017357021570205688, 0.00179290771484375]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 4.0, 8.0, 11.0, 4.0, 13.0, 9.0, 23.0, 18.0, 32.0, 45.0, 60.0, 95.0, 160.0, 281.0, 647.0, 28193.0, 1016093.0, 1786.0, 430.0, 205.0, 125.0, 74.0, 43.0, 32.0, 30.0, 23.0, 21.0, 19.0, 12.0, 9.0, 8.0, 10.0, 6.0, 5.0, 4.0, 2.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0372314453125, -0.035913944244384766, -0.03459644317626953, -0.0332789421081543, -0.03196144104003906, -0.030643939971923828, -0.029326438903808594, -0.02800893783569336, -0.026691436767578125, -0.02537393569946289, -0.024056434631347656, -0.022738933563232422, -0.021421432495117188, -0.020103931427001953, -0.01878643035888672, -0.017468929290771484, -0.01615142822265625, -0.014833927154541016, -0.013516426086425781, -0.012198925018310547, -0.010881423950195312, -0.009563922882080078, -0.008246421813964844, -0.006928920745849609, -0.005611419677734375, -0.004293918609619141, -0.0029764175415039062, -0.0016589164733886719, -0.0003414154052734375, 0.0009760856628417969, 0.0022935867309570312, 0.0036110877990722656, 0.0049285888671875, 0.006246089935302734, 0.007563591003417969, 0.008881092071533203, 0.010198593139648438, 0.011516094207763672, 0.012833595275878906, 0.01415109634399414, 0.015468597412109375, 0.01678609848022461, 0.018103599548339844, 0.019421100616455078, 0.020738601684570312, 0.022056102752685547, 0.02337360382080078, 0.024691104888916016, 0.02600860595703125, 0.027326107025146484, 0.02864360809326172, 0.029961109161376953, 0.03127861022949219, 0.03259611129760742, 0.033913612365722656, 0.03523111343383789, 0.036548614501953125, 0.03786611557006836, 0.039183616638183594, 0.04050111770629883, 0.04181861877441406, 0.0431361198425293, 0.04445362091064453, 0.045771121978759766, 0.047088623046875]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 53.0, 427.0, 449.0, 75.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0084548844024539, -0.008292448706924915, -0.008130013011395931, -0.007967577315866947, -0.00780514208599925, -0.007642706390470266, -0.007480270694941282, -0.0073178354650735855, -0.0071553997695446014, -0.006992964074015617, -0.006830528378486633, -0.0066680931486189365, -0.0065056574530899525, -0.006343221757560968, -0.006180786062031984, -0.006018350832164288, -0.0058559151366353035, -0.005693479441106319, -0.005531043745577335, -0.005368608515709639, -0.0052061728201806545, -0.0050437371246516705, -0.004881301429122686, -0.00471886619925499, -0.004556430038064718, -0.004393994342535734, -0.00423155864700675, -0.004069123417139053, -0.003906687721610069, -0.003744252026081085, -0.003581816330552101, -0.0034193808678537607, -0.003256945637986064, -0.00309450994245708, -0.0029320744797587395, -0.0027696387842297554, -0.002607203321531415, -0.002444767626002431, -0.0022823321633040905, -0.0021198964677751064, -0.0019574607722461224, -0.0017950251931324601, -0.0016325896140187979, -0.0014701539184898138, -0.0013077184557914734, -0.0011452827602624893, -0.000982847181148827, -0.0008204116020351648, -0.0006579761393368244, -0.0004955405602231622, -0.0003331049520056695, -0.00017066934378817677, -8.233764674514532e-06, 0.0001542018144391477, 0.00031663745176047087, 0.0004790730308741331, 0.0006415086099877954, 0.0008039441891014576, 0.0009663797682151198, 0.001128815347328782, 0.0012912510428577662, 0.0014536865055561066, 0.0016161222010850906, 0.0017785577801987529, 0.0019409933593124151]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 9.0, 6.0, 1.0, 5.0, 9.0, 5.0, 10.0, 22.0, 19.0, 24.0, 21.0, 25.0, 32.0, 31.0, 30.0, 30.0, 34.0, 30.0, 41.0, 36.0, 45.0, 43.0, 47.0, 28.0, 29.0, 46.0, 47.0, 35.0, 33.0, 31.0, 20.0, 23.0, 29.0, 21.0, 28.0, 17.0, 14.0, 11.0, 8.0, 11.0, 7.0, 1.0, 2.0, 6.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0009077787399291992, -0.0008791247382760048, -0.0008504707366228104, -0.0008218167349696159, -0.0007931627333164215, -0.0007645087316632271, -0.0007358547300100327, -0.0007072007283568382, -0.0006785467267036438, -0.0006498927250504494, -0.0006212387233972549, -0.0005925847217440605, -0.0005639307200908661, -0.0005352767184376717, -0.0005066227167844772, -0.0004779687151312828, -0.0004493147134780884, -0.00042066071182489395, -0.0003920067101716995, -0.0003633527085185051, -0.00033469870686531067, -0.00030604470521211624, -0.0002773907035589218, -0.0002487367019057274, -0.00022008270025253296, -0.00019142869859933853, -0.0001627746969461441, -0.00013412069529294968, -0.00010546669363975525, -7.681269198656082e-05, -4.8158690333366394e-05, -1.9504688680171967e-05, 9.149312973022461e-06, 3.780331462621689e-05, 6.645731627941132e-05, 9.511131793260574e-05, 0.00012376531958580017, 0.0001524193212389946, 0.00018107332289218903, 0.00020972732454538345, 0.00023838132619857788, 0.0002670353278517723, 0.00029568932950496674, 0.00032434333115816116, 0.0003529973328113556, 0.00038165133446455, 0.00041030533611774445, 0.0004389593377709389, 0.0004676133394241333, 0.0004962673410773277, 0.0005249213427305222, 0.0005535753443837166, 0.000582229346036911, 0.0006108833476901054, 0.0006395373493432999, 0.0006681913509964943, 0.0006968453526496887, 0.0007254993543028831, 0.0007541533559560776, 0.000782807357609272, 0.0008114613592624664, 0.0008401153609156609, 0.0008687693625688553, 0.0008974233642220497, 0.0009260773658752441]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 9.0, 14.0, 10.0, 7.0, 17.0, 20.0, 16.0, 21.0, 19.0, 30.0, 25.0, 34.0, 29.0, 31.0, 39.0, 41.0, 36.0, 35.0, 46.0, 43.0, 48.0, 39.0, 37.0, 40.0, 32.0, 29.0, 37.0, 29.0, 35.0, 21.0, 23.0, 11.0, 15.0, 21.0, 9.0, 9.0, 13.0, 7.0, 7.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.68359375, -6.48138427734375, -6.2791748046875, -6.07696533203125, -5.874755859375, -5.67254638671875, -5.4703369140625, -5.26812744140625, -5.06591796875, -4.86370849609375, -4.6614990234375, -4.45928955078125, -4.257080078125, -4.05487060546875, -3.8526611328125, -3.65045166015625, -3.4482421875, -3.24603271484375, -3.0438232421875, -2.84161376953125, -2.639404296875, -2.43719482421875, -2.2349853515625, -2.03277587890625, -1.83056640625, -1.62835693359375, -1.4261474609375, -1.22393798828125, -1.021728515625, -0.81951904296875, -0.6173095703125, -0.41510009765625, -0.212890625, -0.01068115234375, 0.1915283203125, 0.39373779296875, 0.595947265625, 0.79815673828125, 1.0003662109375, 1.20257568359375, 1.40478515625, 1.60699462890625, 1.8092041015625, 2.01141357421875, 2.213623046875, 2.41583251953125, 2.6180419921875, 2.82025146484375, 3.0224609375, 3.22467041015625, 3.4268798828125, 3.62908935546875, 3.831298828125, 4.03350830078125, 4.2357177734375, 4.43792724609375, 4.64013671875, 4.84234619140625, 5.0445556640625, 5.24676513671875, 5.448974609375, 5.65118408203125, 5.8533935546875, 6.05560302734375, 6.2578125]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 3.0, 4.0, 9.0, 11.0, 17.0, 33.0, 39.0, 67.0, 84.0, 111.0, 182.0, 260.0, 384.0, 609.0, 851.0, 1277.0, 1856.0, 2898.0, 4496.0, 7324.0, 12885.0, 26989.0, 73030.0, 301512.0, 442315.0, 99486.0, 33646.0, 15385.0, 8154.0, 5000.0, 3213.0, 2102.0, 1374.0, 934.0, 647.0, 424.0, 313.0, 183.0, 137.0, 92.0, 77.0, 42.0, 35.0, 18.0, 18.0, 10.0, 3.0, 10.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.23046875, -5.07257080078125, -4.9146728515625, -4.75677490234375, -4.598876953125, -4.44097900390625, -4.2830810546875, -4.12518310546875, -3.96728515625, -3.80938720703125, -3.6514892578125, -3.49359130859375, -3.335693359375, -3.17779541015625, -3.0198974609375, -2.86199951171875, -2.7041015625, -2.54620361328125, -2.3883056640625, -2.23040771484375, -2.072509765625, -1.91461181640625, -1.7567138671875, -1.59881591796875, -1.44091796875, -1.28302001953125, -1.1251220703125, -0.96722412109375, -0.809326171875, -0.65142822265625, -0.4935302734375, -0.33563232421875, -0.177734375, -0.01983642578125, 0.1380615234375, 0.29595947265625, 0.453857421875, 0.61175537109375, 0.7696533203125, 0.92755126953125, 1.08544921875, 1.24334716796875, 1.4012451171875, 1.55914306640625, 1.717041015625, 1.87493896484375, 2.0328369140625, 2.19073486328125, 2.3486328125, 2.50653076171875, 2.6644287109375, 2.82232666015625, 2.980224609375, 3.13812255859375, 3.2960205078125, 3.45391845703125, 3.61181640625, 3.76971435546875, 3.9276123046875, 4.08551025390625, 4.243408203125, 4.40130615234375, 4.5592041015625, 4.71710205078125, 4.875]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 11.0, 3.0, 5.0, 6.0, 13.0, 10.0, 20.0, 15.0, 17.0, 22.0, 25.0, 38.0, 30.0, 38.0, 33.0, 35.0, 47.0, 52.0, 76.0, 222.0, 1708.0, 160.0, 65.0, 38.0, 37.0, 47.0, 36.0, 34.0, 34.0, 24.0, 28.0, 26.0, 20.0, 15.0, 13.0, 20.0, 4.0, 7.0, 4.0, 8.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-27.734375, -26.991455078125, -26.24853515625, -25.505615234375, -24.7626953125, -24.019775390625, -23.27685546875, -22.533935546875, -21.791015625, -21.048095703125, -20.30517578125, -19.562255859375, -18.8193359375, -18.076416015625, -17.33349609375, -16.590576171875, -15.84765625, -15.104736328125, -14.36181640625, -13.618896484375, -12.8759765625, -12.133056640625, -11.39013671875, -10.647216796875, -9.904296875, -9.161376953125, -8.41845703125, -7.675537109375, -6.9326171875, -6.189697265625, -5.44677734375, -4.703857421875, -3.9609375, -3.218017578125, -2.47509765625, -1.732177734375, -0.9892578125, -0.246337890625, 0.49658203125, 1.239501953125, 1.982421875, 2.725341796875, 3.46826171875, 4.211181640625, 4.9541015625, 5.697021484375, 6.43994140625, 7.182861328125, 7.92578125, 8.668701171875, 9.41162109375, 10.154541015625, 10.8974609375, 11.640380859375, 12.38330078125, 13.126220703125, 13.869140625, 14.612060546875, 15.35498046875, 16.097900390625, 16.8408203125, 17.583740234375, 18.32666015625, 19.069580078125, 19.8125]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 1.0, 5.0, 3.0, 9.0, 6.0, 8.0, 14.0, 19.0, 21.0, 39.0, 35.0, 37.0, 54.0, 90.0, 136.0, 211.0, 309.0, 880.0, 7277.0, 2919289.0, 212619.0, 3169.0, 592.0, 271.0, 181.0, 115.0, 71.0, 66.0, 46.0, 25.0, 29.0, 21.0, 17.0, 13.0, 7.0, 4.0, 10.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-47.375, -45.7880859375, -44.201171875, -42.6142578125, -41.02734375, -39.4404296875, -37.853515625, -36.2666015625, -34.6796875, -33.0927734375, -31.505859375, -29.9189453125, -28.33203125, -26.7451171875, -25.158203125, -23.5712890625, -21.984375, -20.3974609375, -18.810546875, -17.2236328125, -15.63671875, -14.0498046875, -12.462890625, -10.8759765625, -9.2890625, -7.7021484375, -6.115234375, -4.5283203125, -2.94140625, -1.3544921875, 0.232421875, 1.8193359375, 3.40625, 4.9931640625, 6.580078125, 8.1669921875, 9.75390625, 11.3408203125, 12.927734375, 14.5146484375, 16.1015625, 17.6884765625, 19.275390625, 20.8623046875, 22.44921875, 24.0361328125, 25.623046875, 27.2099609375, 28.796875, 30.3837890625, 31.970703125, 33.5576171875, 35.14453125, 36.7314453125, 38.318359375, 39.9052734375, 41.4921875, 43.0791015625, 44.666015625, 46.2529296875, 47.83984375, 49.4267578125, 51.013671875, 52.6005859375, 54.1875]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 11.0, 111.0, 324.0, 400.0, 127.0, 30.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.56564712524414, -19.198305130004883, -16.830963134765625, -14.463619232177734, -12.096277236938477, -9.728935241699219, -7.3615922927856445, -4.99424934387207, -2.6269073486328125, -0.2595648765563965, 2.1077775955200195, 4.4751200675964355, 6.842462539672852, 9.20980453491211, 11.577147483825684, 13.944490432739258, 16.311832427978516, 18.679174423217773, 21.04651641845703, 23.413860321044922, 25.78120231628418, 28.148544311523438, 30.515888214111328, 32.88323211669922, 35.250572204589844, 37.617916107177734, 39.98525619506836, 42.35260009765625, 44.719940185546875, 47.087284088134766, 49.454627990722656, 51.82196807861328, 54.18931579589844, 56.55665969848633, 58.92399978637695, 61.291343688964844, 63.65868377685547, 66.02603149414062, 68.39337158203125, 70.76071166992188, 73.1280517578125, 75.49539184570312, 77.86273956298828, 80.2300796508789, 82.59741973876953, 84.96476745605469, 87.33210754394531, 89.69944763183594, 92.0667953491211, 94.43413543701172, 96.80148315429688, 99.1688232421875, 101.53616333007812, 103.90350341796875, 106.2708511352539, 108.63819122314453, 111.00553894042969, 113.37287902832031, 115.74022674560547, 118.1075668334961, 120.47490692138672, 122.84225463867188, 125.2095947265625, 127.57693481445312, 129.94427490234375]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 7.0, 3.0, 5.0, 5.0, 6.0, 7.0, 17.0, 21.0, 20.0, 19.0, 28.0, 18.0, 34.0, 25.0, 27.0, 35.0, 35.0, 28.0, 37.0, 49.0, 44.0, 41.0, 32.0, 34.0, 39.0, 34.0, 36.0, 31.0, 32.0, 35.0, 31.0, 28.0, 25.0, 19.0, 11.0, 24.0, 14.0, 8.0, 9.0, 8.0, 11.0, 11.0, 7.0, 2.0, 4.0, 4.0, 1.0, 4.0, 1.0, 0.0, 2.0], "bins": [-73.367431640625, -71.26718139648438, -69.16693115234375, -67.06668090820312, -64.9664306640625, -62.866180419921875, -60.765933990478516, -58.66568374633789, -56.565433502197266, -54.46518325805664, -52.364933013916016, -50.26468276977539, -48.16443634033203, -46.064186096191406, -43.96393585205078, -41.863685607910156, -39.76343536376953, -37.663185119628906, -35.56293487548828, -33.462684631347656, -31.362436294555664, -29.26218605041504, -27.161937713623047, -25.061687469482422, -22.961437225341797, -20.861186981201172, -18.760936737060547, -16.660688400268555, -14.56043815612793, -12.460187911987305, -10.359938621520996, -8.259689331054688, -6.159431457519531, -4.0591816902160645, -1.9589319229125977, 0.14131784439086914, 2.241567611694336, 4.341817855834961, 6.4420671463012695, 8.542316436767578, 10.642566680908203, 12.742816925048828, 14.843066215515137, 16.943315505981445, 19.04356575012207, 21.143815994262695, 23.244064331054688, 25.344314575195312, 27.444564819335938, 29.544815063476562, 31.645065307617188, 33.74531555175781, 35.84556579589844, 37.94581604003906, 40.04606246948242, 42.14631271362305, 44.24656295776367, 46.3468132019043, 48.44706344604492, 50.54731369018555, 52.647560119628906, 54.74781036376953, 56.848060607910156, 58.94831085205078, 61.048561096191406]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 5.0, 7.0, 8.0, 14.0, 9.0, 20.0, 13.0, 10.0, 20.0, 12.0, 28.0, 28.0, 33.0, 30.0, 31.0, 32.0, 38.0, 33.0, 41.0, 32.0, 41.0, 54.0, 37.0, 34.0, 41.0, 36.0, 32.0, 29.0, 30.0, 28.0, 35.0, 21.0, 17.0, 23.0, 16.0, 14.0, 16.0, 9.0, 10.0, 8.0, 9.0, 4.0, 6.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0], "bins": [-6.7421875, -6.54388427734375, -6.3455810546875, -6.14727783203125, -5.948974609375, -5.75067138671875, -5.5523681640625, -5.35406494140625, -5.15576171875, -4.95745849609375, -4.7591552734375, -4.56085205078125, -4.362548828125, -4.16424560546875, -3.9659423828125, -3.76763916015625, -3.5693359375, -3.37103271484375, -3.1727294921875, -2.97442626953125, -2.776123046875, -2.57781982421875, -2.3795166015625, -2.18121337890625, -1.98291015625, -1.78460693359375, -1.5863037109375, -1.38800048828125, -1.189697265625, -0.99139404296875, -0.7930908203125, -0.59478759765625, -0.396484375, -0.19818115234375, 0.0001220703125, 0.19842529296875, 0.396728515625, 0.59503173828125, 0.7933349609375, 0.99163818359375, 1.18994140625, 1.38824462890625, 1.5865478515625, 1.78485107421875, 1.983154296875, 2.18145751953125, 2.3797607421875, 2.57806396484375, 2.7763671875, 2.97467041015625, 3.1729736328125, 3.37127685546875, 3.569580078125, 3.76788330078125, 3.9661865234375, 4.16448974609375, 4.36279296875, 4.56109619140625, 4.7593994140625, 4.95770263671875, 5.156005859375, 5.35430908203125, 5.5526123046875, 5.75091552734375, 5.94921875]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 6.0, 1.0, 4.0, 12.0, 17.0, 18.0, 22.0, 39.0, 55.0, 72.0, 100.0, 145.0, 258.0, 425.0, 739.0, 1381.0, 2491.0, 5022.0, 10919.0, 27431.0, 81999.0, 297956.0, 943012.0, 1503351.0, 904241.0, 289908.0, 77680.0, 26095.0, 10496.0, 4789.0, 2444.0, 1284.0, 709.0, 446.0, 245.0, 144.0, 90.0, 64.0, 38.0, 46.0, 30.0, 21.0, 13.0, 12.0, 6.0, 4.0, 5.0, 4.0, 5.0, 0.0, 0.0, 1.0], "bins": [-8.0625, -7.83526611328125, -7.6080322265625, -7.38079833984375, -7.153564453125, -6.92633056640625, -6.6990966796875, -6.47186279296875, -6.24462890625, -6.01739501953125, -5.7901611328125, -5.56292724609375, -5.335693359375, -5.10845947265625, -4.8812255859375, -4.65399169921875, -4.4267578125, -4.19952392578125, -3.9722900390625, -3.74505615234375, -3.517822265625, -3.29058837890625, -3.0633544921875, -2.83612060546875, -2.60888671875, -2.38165283203125, -2.1544189453125, -1.92718505859375, -1.699951171875, -1.47271728515625, -1.2454833984375, -1.01824951171875, -0.791015625, -0.56378173828125, -0.3365478515625, -0.10931396484375, 0.117919921875, 0.34515380859375, 0.5723876953125, 0.79962158203125, 1.02685546875, 1.25408935546875, 1.4813232421875, 1.70855712890625, 1.935791015625, 2.16302490234375, 2.3902587890625, 2.61749267578125, 2.8447265625, 3.07196044921875, 3.2991943359375, 3.52642822265625, 3.753662109375, 3.98089599609375, 4.2081298828125, 4.43536376953125, 4.66259765625, 4.88983154296875, 5.1170654296875, 5.34429931640625, 5.571533203125, 5.79876708984375, 6.0260009765625, 6.25323486328125, 6.48046875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 4.0, 2.0, 5.0, 11.0, 17.0, 17.0, 25.0, 41.0, 43.0, 50.0, 54.0, 82.0, 78.0, 122.0, 146.0, 209.0, 253.0, 281.0, 379.0, 396.0, 364.0, 312.0, 267.0, 202.0, 160.0, 118.0, 87.0, 75.0, 41.0, 61.0, 39.0, 31.0, 26.0, 21.0, 14.0, 6.0, 6.0, 12.0, 3.0, 2.0, 0.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.015625, -14.5924072265625, -14.169189453125, -13.7459716796875, -13.32275390625, -12.8995361328125, -12.476318359375, -12.0531005859375, -11.6298828125, -11.2066650390625, -10.783447265625, -10.3602294921875, -9.93701171875, -9.5137939453125, -9.090576171875, -8.6673583984375, -8.244140625, -7.8209228515625, -7.397705078125, -6.9744873046875, -6.55126953125, -6.1280517578125, -5.704833984375, -5.2816162109375, -4.8583984375, -4.4351806640625, -4.011962890625, -3.5887451171875, -3.16552734375, -2.7423095703125, -2.319091796875, -1.8958740234375, -1.47265625, -1.0494384765625, -0.626220703125, -0.2030029296875, 0.22021484375, 0.6434326171875, 1.066650390625, 1.4898681640625, 1.9130859375, 2.3363037109375, 2.759521484375, 3.1827392578125, 3.60595703125, 4.0291748046875, 4.452392578125, 4.8756103515625, 5.298828125, 5.7220458984375, 6.145263671875, 6.5684814453125, 6.99169921875, 7.4149169921875, 7.838134765625, 8.2613525390625, 8.6845703125, 9.1077880859375, 9.531005859375, 9.9542236328125, 10.37744140625, 10.8006591796875, 11.223876953125, 11.6470947265625, 12.0703125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 9.0, 13.0, 11.0, 29.0, 29.0, 32.0, 49.0, 66.0, 101.0, 138.0, 211.0, 388.0, 1128.0, 23521.0, 4022601.0, 142538.0, 2150.0, 490.0, 262.0, 154.0, 101.0, 52.0, 49.0, 46.0, 33.0, 20.0, 16.0, 13.0, 9.0, 10.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.34375, -56.06982421875, -53.7958984375, -51.52197265625, -49.248046875, -46.97412109375, -44.7001953125, -42.42626953125, -40.15234375, -37.87841796875, -35.6044921875, -33.33056640625, -31.056640625, -28.78271484375, -26.5087890625, -24.23486328125, -21.9609375, -19.68701171875, -17.4130859375, -15.13916015625, -12.865234375, -10.59130859375, -8.3173828125, -6.04345703125, -3.76953125, -1.49560546875, 0.7783203125, 3.05224609375, 5.326171875, 7.60009765625, 9.8740234375, 12.14794921875, 14.421875, 16.69580078125, 18.9697265625, 21.24365234375, 23.517578125, 25.79150390625, 28.0654296875, 30.33935546875, 32.61328125, 34.88720703125, 37.1611328125, 39.43505859375, 41.708984375, 43.98291015625, 46.2568359375, 48.53076171875, 50.8046875, 53.07861328125, 55.3525390625, 57.62646484375, 59.900390625, 62.17431640625, 64.4482421875, 66.72216796875, 68.99609375, 71.27001953125, 73.5439453125, 75.81787109375, 78.091796875, 80.36572265625, 82.6396484375, 84.91357421875, 87.1875]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 19.0, 30.0, 66.0, 103.0, 140.0, 195.0, 163.0, 125.0, 83.0, 47.0, 17.0, 11.0, 3.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-136.95057678222656, -133.8875274658203, -130.824462890625, -127.76141357421875, -124.69835662841797, -121.63529968261719, -118.5722427368164, -115.50918579101562, -112.44612884521484, -109.38307189941406, -106.32001495361328, -103.2569580078125, -100.19390869140625, -97.13085174560547, -94.06779479980469, -91.0047378540039, -87.94168090820312, -84.87862396240234, -81.81556701660156, -78.75251770019531, -75.68946075439453, -72.62640380859375, -69.56334686279297, -66.50028991699219, -63.43724060058594, -60.374183654785156, -57.31113052368164, -54.24807357788086, -51.18501663208008, -48.12196350097656, -45.05890655517578, -41.995849609375, -38.932796478271484, -35.8697395324707, -32.80668640136719, -29.743629455566406, -26.680572509765625, -23.617517471313477, -20.554462432861328, -17.491405487060547, -14.428350448608398, -11.365294456481934, -8.302238464355469, -5.23918342590332, -2.1761274337768555, 0.8869285583496094, 3.949983596801758, 7.013040542602539, 10.076095581054688, 13.139151573181152, 16.202207565307617, 19.265262603759766, 22.328319549560547, 25.391374588012695, 28.454429626464844, 31.517486572265625, 34.580543518066406, 37.64360046386719, 40.7066535949707, 43.769710540771484, 46.832767486572266, 49.89582061767578, 52.95887756347656, 56.021934509277344, 59.08498764038086]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 8.0, 5.0, 12.0, 8.0, 12.0, 17.0, 17.0, 14.0, 14.0, 19.0, 32.0, 25.0, 27.0, 21.0, 29.0, 30.0, 30.0, 32.0, 42.0, 40.0, 33.0, 38.0, 35.0, 42.0, 42.0, 37.0, 29.0, 32.0, 29.0, 31.0, 25.0, 16.0, 21.0, 15.0, 18.0, 19.0, 14.0, 15.0, 5.0, 11.0, 12.0, 14.0, 2.0, 5.0, 5.0, 4.0, 3.0, 3.0, 4.0, 1.0, 1.0], "bins": [-51.87261962890625, -50.37895202636719, -48.88528823852539, -47.391624450683594, -45.89795684814453, -44.40428924560547, -42.91062545776367, -41.416961669921875, -39.92329406738281, -38.42962646484375, -36.93596267700195, -35.442298889160156, -33.948631286621094, -32.45496368408203, -30.961299896240234, -29.467634201049805, -27.973968505859375, -26.480302810668945, -24.986637115478516, -23.492971420288086, -21.999305725097656, -20.505640029907227, -19.011974334716797, -17.518308639526367, -16.024642944335938, -14.530977249145508, -13.037311553955078, -11.543645858764648, -10.049980163574219, -8.556314468383789, -7.062648773193359, -5.56898307800293, -4.0753173828125, -2.5816516876220703, -1.0879859924316406, 0.40567970275878906, 1.8993453979492188, 3.3930110931396484, 4.886676788330078, 6.380342483520508, 7.8740081787109375, 9.367673873901367, 10.861339569091797, 12.355005264282227, 13.848670959472656, 15.342336654663086, 16.836002349853516, 18.329668045043945, 19.823333740234375, 21.316999435424805, 22.810665130615234, 24.304330825805664, 25.797996520996094, 27.291662216186523, 28.785327911376953, 30.278993606567383, 31.772659301757812, 33.266326904296875, 34.75999069213867, 36.25365447998047, 37.74732208251953, 39.240989685058594, 40.73465347290039, 42.22831726074219, 43.72198486328125]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 6.0, 8.0, 15.0, 12.0, 13.0, 11.0, 11.0, 16.0, 19.0, 27.0, 33.0, 30.0, 39.0, 29.0, 32.0, 37.0, 49.0, 36.0, 32.0, 28.0, 39.0, 47.0, 37.0, 36.0, 35.0, 40.0, 33.0, 35.0, 29.0, 22.0, 19.0, 27.0, 18.0, 17.0, 14.0, 9.0, 12.0, 12.0, 7.0, 7.0, 7.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.70703125, -6.5042724609375, -6.301513671875, -6.0987548828125, -5.89599609375, -5.6932373046875, -5.490478515625, -5.2877197265625, -5.0849609375, -4.8822021484375, -4.679443359375, -4.4766845703125, -4.27392578125, -4.0711669921875, -3.868408203125, -3.6656494140625, -3.462890625, -3.2601318359375, -3.057373046875, -2.8546142578125, -2.65185546875, -2.4490966796875, -2.246337890625, -2.0435791015625, -1.8408203125, -1.6380615234375, -1.435302734375, -1.2325439453125, -1.02978515625, -0.8270263671875, -0.624267578125, -0.4215087890625, -0.21875, -0.0159912109375, 0.186767578125, 0.3895263671875, 0.59228515625, 0.7950439453125, 0.997802734375, 1.2005615234375, 1.4033203125, 1.6060791015625, 1.808837890625, 2.0115966796875, 2.21435546875, 2.4171142578125, 2.619873046875, 2.8226318359375, 3.025390625, 3.2281494140625, 3.430908203125, 3.6336669921875, 3.83642578125, 4.0391845703125, 4.241943359375, 4.4447021484375, 4.6474609375, 4.8502197265625, 5.052978515625, 5.2557373046875, 5.45849609375, 5.6612548828125, 5.864013671875, 6.0667724609375, 6.26953125]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 11.0, 4.0, 20.0, 40.0, 37.0, 48.0, 77.0, 101.0, 153.0, 233.0, 341.0, 466.0, 654.0, 1014.0, 1497.0, 2048.0, 3012.0, 4218.0, 6172.0, 8682.0, 12628.0, 17771.0, 26541.0, 38487.0, 56806.0, 83962.0, 124107.0, 173788.0, 155264.0, 104948.0, 71257.0, 47931.0, 33047.0, 22203.0, 15215.0, 10780.0, 7659.0, 5198.0, 3748.0, 2582.0, 1738.0, 1191.0, 855.0, 616.0, 447.0, 328.0, 188.0, 148.0, 110.0, 75.0, 39.0, 29.0, 20.0, 7.0, 8.0, 8.0, 5.0, 3.0, 4.0], "bins": [-0.80078125, -0.7763595581054688, -0.7519378662109375, -0.7275161743164062, -0.703094482421875, -0.6786727905273438, -0.6542510986328125, -0.6298294067382812, -0.60540771484375, -0.5809860229492188, -0.5565643310546875, -0.5321426391601562, -0.507720947265625, -0.48329925537109375, -0.4588775634765625, -0.43445587158203125, -0.4100341796875, -0.38561248779296875, -0.3611907958984375, -0.33676910400390625, -0.312347412109375, -0.28792572021484375, -0.2635040283203125, -0.23908233642578125, -0.21466064453125, -0.19023895263671875, -0.1658172607421875, -0.14139556884765625, -0.116973876953125, -0.09255218505859375, -0.0681304931640625, -0.04370880126953125, -0.019287109375, 0.00513458251953125, 0.0295562744140625, 0.05397796630859375, 0.078399658203125, 0.10282135009765625, 0.1272430419921875, 0.15166473388671875, 0.17608642578125, 0.20050811767578125, 0.2249298095703125, 0.24935150146484375, 0.273773193359375, 0.29819488525390625, 0.3226165771484375, 0.34703826904296875, 0.3714599609375, 0.39588165283203125, 0.4203033447265625, 0.44472503662109375, 0.469146728515625, 0.49356842041015625, 0.5179901123046875, 0.5424118041992188, 0.56683349609375, 0.5912551879882812, 0.6156768798828125, 0.6400985717773438, 0.664520263671875, 0.6889419555664062, 0.7133636474609375, 0.7377853393554688, 0.76220703125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 4.0, 5.0, 6.0, 8.0, 5.0, 9.0, 14.0, 11.0, 13.0, 16.0, 15.0, 18.0, 20.0, 33.0, 32.0, 30.0, 33.0, 44.0, 35.0, 31.0, 39.0, 30.0, 1067.0, 44.0, 43.0, 40.0, 42.0, 32.0, 28.0, 29.0, 29.0, 29.0, 29.0, 22.0, 27.0, 24.0, 18.0, 11.0, 12.0, 10.0, 10.0, 11.0, 8.0, 7.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.21875, -4.09466552734375, -3.9705810546875, -3.84649658203125, -3.722412109375, -3.59832763671875, -3.4742431640625, -3.35015869140625, -3.22607421875, -3.10198974609375, -2.9779052734375, -2.85382080078125, -2.729736328125, -2.60565185546875, -2.4815673828125, -2.35748291015625, -2.2333984375, -2.10931396484375, -1.9852294921875, -1.86114501953125, -1.737060546875, -1.61297607421875, -1.4888916015625, -1.36480712890625, -1.24072265625, -1.11663818359375, -0.9925537109375, -0.86846923828125, -0.744384765625, -0.62030029296875, -0.4962158203125, -0.37213134765625, -0.248046875, -0.12396240234375, 0.0001220703125, 0.12420654296875, 0.248291015625, 0.37237548828125, 0.4964599609375, 0.62054443359375, 0.74462890625, 0.86871337890625, 0.9927978515625, 1.11688232421875, 1.240966796875, 1.36505126953125, 1.4891357421875, 1.61322021484375, 1.7373046875, 1.86138916015625, 1.9854736328125, 2.10955810546875, 2.233642578125, 2.35772705078125, 2.4818115234375, 2.60589599609375, 2.72998046875, 2.85406494140625, 2.9781494140625, 3.10223388671875, 3.226318359375, 3.35040283203125, 3.4744873046875, 3.59857177734375, 3.72265625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 5.0, 2.0, 11.0, 13.0, 18.0, 31.0, 29.0, 43.0, 67.0, 120.0, 159.0, 289.0, 413.0, 707.0, 987.0, 1595.0, 2362.0, 3672.0, 6031.0, 9601.0, 15319.0, 24954.0, 40471.0, 66298.0, 107691.0, 173559.0, 1263729.0, 144575.0, 89822.0, 55249.0, 34149.0, 20543.0, 12711.0, 7922.0, 5064.0, 3121.0, 2055.0, 1247.0, 884.0, 574.0, 372.0, 204.0, 156.0, 114.0, 71.0, 52.0, 25.0, 20.0, 14.0, 7.0, 6.0, 3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0], "bins": [-0.8642578125, -0.8375091552734375, -0.810760498046875, -0.7840118408203125, -0.75726318359375, -0.7305145263671875, -0.703765869140625, -0.6770172119140625, -0.6502685546875, -0.6235198974609375, -0.596771240234375, -0.5700225830078125, -0.54327392578125, -0.5165252685546875, -0.489776611328125, -0.4630279541015625, -0.436279296875, -0.4095306396484375, -0.382781982421875, -0.3560333251953125, -0.32928466796875, -0.3025360107421875, -0.275787353515625, -0.2490386962890625, -0.2222900390625, -0.1955413818359375, -0.168792724609375, -0.1420440673828125, -0.11529541015625, -0.0885467529296875, -0.061798095703125, -0.0350494384765625, -0.00830078125, 0.0184478759765625, 0.045196533203125, 0.0719451904296875, 0.09869384765625, 0.1254425048828125, 0.152191162109375, 0.1789398193359375, 0.2056884765625, 0.2324371337890625, 0.259185791015625, 0.2859344482421875, 0.31268310546875, 0.3394317626953125, 0.366180419921875, 0.3929290771484375, 0.419677734375, 0.4464263916015625, 0.473175048828125, 0.4999237060546875, 0.52667236328125, 0.5534210205078125, 0.580169677734375, 0.6069183349609375, 0.6336669921875, 0.6604156494140625, 0.687164306640625, 0.7139129638671875, 0.74066162109375, 0.7674102783203125, 0.794158935546875, 0.8209075927734375, 0.84765625]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 6.0, 8.0, 11.0, 14.0, 7.0, 10.0, 16.0, 18.0, 19.0, 30.0, 34.0, 41.0, 38.0, 49.0, 50.0, 45.0, 58.0, 53.0, 55.0, 41.0, 32.0, 50.0, 51.0, 33.0, 32.0, 33.0, 27.0, 16.0, 30.0, 20.0, 14.0, 15.0, 12.0, 5.0, 3.0, 3.0, 5.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015764236450195312, -0.0015301108360290527, -0.0014837980270385742, -0.0014374852180480957, -0.0013911724090576172, -0.0013448596000671387, -0.0012985467910766602, -0.0012522339820861816, -0.0012059211730957031, -0.0011596083641052246, -0.001113295555114746, -0.0010669827461242676, -0.001020669937133789, -0.0009743571281433105, -0.000928044319152832, -0.0008817315101623535, -0.000835418701171875, -0.0007891058921813965, -0.000742793083190918, -0.0006964802742004395, -0.0006501674652099609, -0.0006038546562194824, -0.0005575418472290039, -0.0005112290382385254, -0.0004649162292480469, -0.00041860342025756836, -0.00037229061126708984, -0.00032597780227661133, -0.0002796649932861328, -0.0002333521842956543, -0.00018703937530517578, -0.00014072656631469727, -9.441375732421875e-05, -4.8100948333740234e-05, -1.7881393432617188e-06, 4.45246696472168e-05, 9.083747863769531e-05, 0.00013715028762817383, 0.00018346309661865234, 0.00022977590560913086, 0.0002760887145996094, 0.0003224015235900879, 0.0003687143325805664, 0.0004150271415710449, 0.00046133995056152344, 0.000507652759552002, 0.0005539655685424805, 0.000600278377532959, 0.0006465911865234375, 0.000692903995513916, 0.0007392168045043945, 0.000785529613494873, 0.0008318424224853516, 0.0008781552314758301, 0.0009244680404663086, 0.0009707808494567871, 0.0010170936584472656, 0.0010634064674377441, 0.0011097192764282227, 0.0011560320854187012, 0.0012023448944091797, 0.0012486577033996582, 0.0012949705123901367, 0.0013412833213806152, 0.0013875961303710938]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 6.0, 2.0, 8.0, 2.0, 11.0, 6.0, 5.0, 12.0, 20.0, 25.0, 18.0, 22.0, 24.0, 46.0, 55.0, 74.0, 139.0, 258.0, 485.0, 1601.0, 974583.0, 69334.0, 835.0, 370.0, 201.0, 121.0, 71.0, 45.0, 39.0, 23.0, 23.0, 23.0, 11.0, 11.0, 9.0, 9.0, 9.0, 4.0, 4.0, 6.0, 5.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033905029296875, -0.03272819519042969, -0.031551361083984375, -0.030374526977539062, -0.02919769287109375, -0.028020858764648438, -0.026844024658203125, -0.025667190551757812, -0.0244903564453125, -0.023313522338867188, -0.022136688232421875, -0.020959854125976562, -0.01978302001953125, -0.018606185913085938, -0.017429351806640625, -0.016252517700195312, -0.01507568359375, -0.013898849487304688, -0.012722015380859375, -0.011545181274414062, -0.01036834716796875, -0.009191513061523438, -0.008014678955078125, -0.0068378448486328125, -0.0056610107421875, -0.0044841766357421875, -0.003307342529296875, -0.0021305084228515625, -0.00095367431640625, 0.0002231597900390625, 0.001399993896484375, 0.0025768280029296875, 0.003753662109375, 0.0049304962158203125, 0.006107330322265625, 0.0072841644287109375, 0.00846099853515625, 0.009637832641601562, 0.010814666748046875, 0.011991500854492188, 0.0131683349609375, 0.014345169067382812, 0.015522003173828125, 0.016698837280273438, 0.01787567138671875, 0.019052505493164062, 0.020229339599609375, 0.021406173706054688, 0.0225830078125, 0.023759841918945312, 0.024936676025390625, 0.026113510131835938, 0.02729034423828125, 0.028467178344726562, 0.029644012451171875, 0.030820846557617188, 0.0319976806640625, 0.03317451477050781, 0.034351348876953125, 0.03552818298339844, 0.03670501708984375, 0.03788185119628906, 0.039058685302734375, 0.04023551940917969, 0.041412353515625]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 21.0, 145.0, 488.0, 298.0, 55.0, 8.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0024785022251307964, -0.0023590559139847755, -0.0022396096028387547, -0.0021201632916927338, -0.002000716980546713, -0.001881270669400692, -0.001761824358254671, -0.0016423780471086502, -0.0015229317359626293, -0.0014034854248166084, -0.0012840391136705875, -0.0011645928025245667, -0.0010451464913785458, -0.0009257001802325249, -0.000806253869086504, -0.0006868075579404831, -0.0005673612467944622, -0.0004479149356484413, -0.0003284686245024204, -0.00020902231335639954, -8.957600221037865e-05, 2.9870308935642242e-05, 0.00014931662008166313, 0.000268762931227684, 0.0003882092423737049, 0.0005076555535197258, 0.0006271018646657467, 0.0007465481758117676, 0.0008659944869577885, 0.0009854407981038094, 0.0011048871092498302, 0.0012243334203958511, 0.001343779731541872, 0.001463226042687893, 0.0015826723538339138, 0.0017021186649799347, 0.0018215649761259556, 0.0019410112872719765, 0.0020604575984179974, 0.0021799039095640182, 0.002299350220710039, 0.00241879653185606, 0.002538242843002081, 0.002657689154148102, 0.0027771354652941227, 0.0028965817764401436, 0.0030160280875861645, 0.0031354743987321854, 0.0032549207098782063, 0.003374367021024227, 0.003493813332170248, 0.003613259643316269, 0.00373270595446229, 0.0038521522656083107, 0.003971598576754332, 0.0040910448879003525, 0.004210491199046373, 0.004329937510192394, 0.004449383821338415, 0.004568830132484436, 0.004688276443630457, 0.004807722754776478, 0.004927169065922499, 0.00504661537706852, 0.0051660616882145405]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 4.0, 1.0, 4.0, 2.0, 4.0, 4.0, 9.0, 8.0, 5.0, 13.0, 11.0, 14.0, 19.0, 18.0, 16.0, 23.0, 26.0, 18.0, 25.0, 33.0, 30.0, 27.0, 39.0, 26.0, 34.0, 34.0, 32.0, 45.0, 36.0, 46.0, 33.0, 35.0, 33.0, 26.0, 32.0, 23.0, 25.0, 26.0, 26.0, 21.0, 20.0, 14.0, 10.0, 14.0, 9.0, 12.0, 6.0, 9.0, 3.0, 10.0, 5.0, 4.0, 1.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.0006586909294128418, -0.0006370516493916512, -0.0006154123693704605, -0.0005937730893492699, -0.0005721338093280792, -0.0005504945293068886, -0.0005288552492856979, -0.0005072159692645073, -0.00048557668924331665, -0.000463937409222126, -0.00044229812920093536, -0.0004206588491797447, -0.0003990195691585541, -0.00037738028913736343, -0.0003557410091161728, -0.00033410172909498215, -0.0003124624490737915, -0.00029082316905260086, -0.0002691838890314102, -0.0002475446090102196, -0.00022590532898902893, -0.0002042660489678383, -0.00018262676894664764, -0.000160987488925457, -0.00013934820890426636, -0.00011770892888307571, -9.606964886188507e-05, -7.443036884069443e-05, -5.2791088819503784e-05, -3.115180879831314e-05, -9.512528777122498e-06, 1.2126751244068146e-05, 3.376603126525879e-05, 5.540531128644943e-05, 7.704459130764008e-05, 9.868387132883072e-05, 0.00012032315135002136, 0.000141962431371212, 0.00016360171139240265, 0.0001852409914135933, 0.00020688027143478394, 0.00022851955145597458, 0.0002501588314771652, 0.00027179811149835587, 0.0002934373915195465, 0.00031507667154073715, 0.0003367159515619278, 0.00035835523158311844, 0.0003799945116043091, 0.0004016337916254997, 0.00042327307164669037, 0.000444912351667881, 0.00046655163168907166, 0.0004881909117102623, 0.0005098301917314529, 0.0005314694717526436, 0.0005531087517738342, 0.0005747480317950249, 0.0005963873118162155, 0.0006180265918374062, 0.0006396658718585968, 0.0006613051518797874, 0.0006829444319009781, 0.0007045837119221687, 0.0007262229919433594]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 6.0, 8.0, 15.0, 12.0, 13.0, 11.0, 11.0, 16.0, 19.0, 27.0, 33.0, 30.0, 39.0, 29.0, 32.0, 37.0, 49.0, 36.0, 32.0, 28.0, 39.0, 47.0, 37.0, 36.0, 35.0, 40.0, 33.0, 35.0, 29.0, 22.0, 19.0, 27.0, 18.0, 17.0, 14.0, 9.0, 12.0, 12.0, 7.0, 7.0, 7.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.70703125, -6.5042724609375, -6.301513671875, -6.0987548828125, -5.89599609375, -5.6932373046875, -5.490478515625, -5.2877197265625, -5.0849609375, -4.8822021484375, -4.679443359375, -4.4766845703125, -4.27392578125, -4.0711669921875, -3.868408203125, -3.6656494140625, -3.462890625, -3.2601318359375, -3.057373046875, -2.8546142578125, -2.65185546875, -2.4490966796875, -2.246337890625, -2.0435791015625, -1.8408203125, -1.6380615234375, -1.435302734375, -1.2325439453125, -1.02978515625, -0.8270263671875, -0.624267578125, -0.4215087890625, -0.21875, -0.0159912109375, 0.186767578125, 0.3895263671875, 0.59228515625, 0.7950439453125, 0.997802734375, 1.2005615234375, 1.4033203125, 1.6060791015625, 1.808837890625, 2.0115966796875, 2.21435546875, 2.4171142578125, 2.619873046875, 2.8226318359375, 3.025390625, 3.2281494140625, 3.430908203125, 3.6336669921875, 3.83642578125, 4.0391845703125, 4.241943359375, 4.4447021484375, 4.6474609375, 4.8502197265625, 5.052978515625, 5.2557373046875, 5.45849609375, 5.6612548828125, 5.864013671875, 6.0667724609375, 6.26953125]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 2.0, 8.0, 2.0, 15.0, 8.0, 28.0, 27.0, 36.0, 47.0, 62.0, 105.0, 158.0, 262.0, 386.0, 556.0, 848.0, 1326.0, 2264.0, 4325.0, 8776.0, 20464.0, 54509.0, 180705.0, 461629.0, 207498.0, 61177.0, 22498.0, 9685.0, 4663.0, 2459.0, 1408.0, 871.0, 571.0, 388.0, 229.0, 180.0, 104.0, 83.0, 52.0, 36.0, 28.0, 23.0, 11.0, 10.0, 9.0, 5.0, 4.0, 6.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.66015625, -4.50762939453125, -4.3551025390625, -4.20257568359375, -4.050048828125, -3.89752197265625, -3.7449951171875, -3.59246826171875, -3.43994140625, -3.28741455078125, -3.1348876953125, -2.98236083984375, -2.829833984375, -2.67730712890625, -2.5247802734375, -2.37225341796875, -2.2197265625, -2.06719970703125, -1.9146728515625, -1.76214599609375, -1.609619140625, -1.45709228515625, -1.3045654296875, -1.15203857421875, -0.99951171875, -0.84698486328125, -0.6944580078125, -0.54193115234375, -0.389404296875, -0.23687744140625, -0.0843505859375, 0.06817626953125, 0.220703125, 0.37322998046875, 0.5257568359375, 0.67828369140625, 0.830810546875, 0.98333740234375, 1.1358642578125, 1.28839111328125, 1.44091796875, 1.59344482421875, 1.7459716796875, 1.89849853515625, 2.051025390625, 2.20355224609375, 2.3560791015625, 2.50860595703125, 2.6611328125, 2.81365966796875, 2.9661865234375, 3.11871337890625, 3.271240234375, 3.42376708984375, 3.5762939453125, 3.72882080078125, 3.88134765625, 4.03387451171875, 4.1864013671875, 4.33892822265625, 4.491455078125, 4.64398193359375, 4.7965087890625, 4.94903564453125, 5.1015625]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 3.0, 5.0, 5.0, 3.0, 5.0, 5.0, 5.0, 9.0, 20.0, 22.0, 20.0, 18.0, 23.0, 34.0, 31.0, 47.0, 42.0, 43.0, 57.0, 69.0, 175.0, 1774.0, 157.0, 70.0, 65.0, 48.0, 45.0, 31.0, 40.0, 22.0, 32.0, 21.0, 20.0, 16.0, 14.0, 11.0, 11.0, 11.0, 5.0, 5.0, 6.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.375, -25.562744140625, -24.75048828125, -23.938232421875, -23.1259765625, -22.313720703125, -21.50146484375, -20.689208984375, -19.876953125, -19.064697265625, -18.25244140625, -17.440185546875, -16.6279296875, -15.815673828125, -15.00341796875, -14.191162109375, -13.37890625, -12.566650390625, -11.75439453125, -10.942138671875, -10.1298828125, -9.317626953125, -8.50537109375, -7.693115234375, -6.880859375, -6.068603515625, -5.25634765625, -4.444091796875, -3.6318359375, -2.819580078125, -2.00732421875, -1.195068359375, -0.3828125, 0.429443359375, 1.24169921875, 2.053955078125, 2.8662109375, 3.678466796875, 4.49072265625, 5.302978515625, 6.115234375, 6.927490234375, 7.73974609375, 8.552001953125, 9.3642578125, 10.176513671875, 10.98876953125, 11.801025390625, 12.61328125, 13.425537109375, 14.23779296875, 15.050048828125, 15.8623046875, 16.674560546875, 17.48681640625, 18.299072265625, 19.111328125, 19.923583984375, 20.73583984375, 21.548095703125, 22.3603515625, 23.172607421875, 23.98486328125, 24.797119140625, 25.609375]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 6.0, 7.0, 12.0, 9.0, 14.0, 16.0, 16.0, 33.0, 23.0, 49.0, 47.0, 77.0, 92.0, 151.0, 173.0, 278.0, 569.0, 3793.0, 2950023.0, 187259.0, 1693.0, 448.0, 249.0, 190.0, 110.0, 73.0, 79.0, 40.0, 36.0, 31.0, 29.0, 20.0, 13.0, 9.0, 5.0, 10.0, 5.0, 7.0, 4.0, 1.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.15625, -49.49853515625, -47.8408203125, -46.18310546875, -44.525390625, -42.86767578125, -41.2099609375, -39.55224609375, -37.89453125, -36.23681640625, -34.5791015625, -32.92138671875, -31.263671875, -29.60595703125, -27.9482421875, -26.29052734375, -24.6328125, -22.97509765625, -21.3173828125, -19.65966796875, -18.001953125, -16.34423828125, -14.6865234375, -13.02880859375, -11.37109375, -9.71337890625, -8.0556640625, -6.39794921875, -4.740234375, -3.08251953125, -1.4248046875, 0.23291015625, 1.890625, 3.54833984375, 5.2060546875, 6.86376953125, 8.521484375, 10.17919921875, 11.8369140625, 13.49462890625, 15.15234375, 16.81005859375, 18.4677734375, 20.12548828125, 21.783203125, 23.44091796875, 25.0986328125, 26.75634765625, 28.4140625, 30.07177734375, 31.7294921875, 33.38720703125, 35.044921875, 36.70263671875, 38.3603515625, 40.01806640625, 41.67578125, 43.33349609375, 44.9912109375, 46.64892578125, 48.306640625, 49.96435546875, 51.6220703125, 53.27978515625, 54.9375]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [344.0, 666.0, 6.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9185028076171875, -0.8384151458740234, 5.241672515869141, 11.321760177612305, 17.40184783935547, 23.481935501098633, 29.562023162841797, 35.642112731933594, 41.722198486328125, 47.802284240722656, 53.88237380981445, 59.96246337890625, 66.04254913330078, 72.12263488769531, 78.20272827148438, 84.2828140258789, 90.36289978027344, 96.44298553466797, 102.5230712890625, 108.60316467285156, 114.6832504272461, 120.76333618164062, 126.84342956542969, 132.92352294921875, 139.00360107421875, 145.0836944580078, 151.1637725830078, 157.24386596679688, 163.32394409179688, 169.40403747558594, 175.484130859375, 181.564208984375, 187.64431762695312, 193.7244110107422, 199.8044891357422, 205.88458251953125, 211.96466064453125, 218.0447540283203, 224.12484741210938, 230.20492553710938, 236.28501892089844, 242.3651123046875, 248.4451904296875, 254.52528381347656, 260.6053771972656, 266.6854553222656, 272.7655334472656, 278.84564208984375, 284.92572021484375, 291.00579833984375, 297.0859069824219, 303.1659851074219, 309.2460632324219, 315.326171875, 321.40625, 327.486328125, 333.56640625, 339.646484375, 345.7265930175781, 351.8066711425781, 357.8867492675781, 363.96685791015625, 370.04693603515625, 376.12701416015625, 382.2071228027344]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 5.0, 8.0, 14.0, 5.0, 10.0, 11.0, 8.0, 8.0, 12.0, 13.0, 16.0, 21.0, 32.0, 35.0, 20.0, 27.0, 35.0, 24.0, 34.0, 24.0, 39.0, 39.0, 40.0, 33.0, 33.0, 36.0, 34.0, 38.0, 35.0, 30.0, 34.0, 31.0, 39.0, 19.0, 22.0, 19.0, 18.0, 17.0, 20.0, 9.0, 13.0, 9.0, 8.0, 6.0, 1.0, 5.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0], "bins": [-59.544830322265625, -57.8148307800293, -56.08483123779297, -54.35483169555664, -52.62483215332031, -50.894832611083984, -49.164833068847656, -47.43482971191406, -45.704833984375, -43.97483444213867, -42.244834899902344, -40.514835357666016, -38.78483581542969, -37.05483627319336, -35.32483673095703, -33.59483337402344, -31.86483383178711, -30.13483428955078, -28.404834747314453, -26.674835205078125, -24.944835662841797, -23.21483612060547, -21.484834671020508, -19.75483512878418, -18.02483558654785, -16.294836044311523, -14.564836502075195, -12.83483600616455, -11.104836463928223, -9.374836921691895, -7.64483642578125, -5.914836883544922, -4.184833526611328, -2.454833745956421, -0.7248339653015137, 1.0051660537719727, 2.735165596008301, 4.465165138244629, 6.195165634155273, 7.925165176391602, 9.65516471862793, 11.385164260864258, 13.115163803100586, 14.84516429901123, 16.575164794921875, 18.305164337158203, 20.03516387939453, 21.76516342163086, 23.495162963867188, 25.225162506103516, 26.955162048339844, 28.685161590576172, 30.4151611328125, 32.14516067504883, 33.875160217285156, 35.60516357421875, 37.33515930175781, 39.06515884399414, 40.79515838623047, 42.5251579284668, 44.255157470703125, 45.98515701293945, 47.71515655517578, 49.445159912109375, 51.1751594543457]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 5.0, 4.0, 3.0, 14.0, 9.0, 10.0, 14.0, 15.0, 12.0, 19.0, 19.0, 22.0, 37.0, 34.0, 26.0, 23.0, 58.0, 37.0, 38.0, 36.0, 36.0, 42.0, 28.0, 43.0, 44.0, 32.0, 41.0, 30.0, 36.0, 27.0, 29.0, 24.0, 21.0, 28.0, 15.0, 19.0, 13.0, 9.0, 13.0, 6.0, 8.0, 11.0, 2.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.0390625, -6.831298828125, -6.62353515625, -6.415771484375, -6.2080078125, -6.000244140625, -5.79248046875, -5.584716796875, -5.376953125, -5.169189453125, -4.96142578125, -4.753662109375, -4.5458984375, -4.338134765625, -4.13037109375, -3.922607421875, -3.71484375, -3.507080078125, -3.29931640625, -3.091552734375, -2.8837890625, -2.676025390625, -2.46826171875, -2.260498046875, -2.052734375, -1.844970703125, -1.63720703125, -1.429443359375, -1.2216796875, -1.013916015625, -0.80615234375, -0.598388671875, -0.390625, -0.182861328125, 0.02490234375, 0.232666015625, 0.4404296875, 0.648193359375, 0.85595703125, 1.063720703125, 1.271484375, 1.479248046875, 1.68701171875, 1.894775390625, 2.1025390625, 2.310302734375, 2.51806640625, 2.725830078125, 2.93359375, 3.141357421875, 3.34912109375, 3.556884765625, 3.7646484375, 3.972412109375, 4.18017578125, 4.387939453125, 4.595703125, 4.803466796875, 5.01123046875, 5.218994140625, 5.4267578125, 5.634521484375, 5.84228515625, 6.050048828125, 6.2578125]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 6.0, 4.0, 8.0, 14.0, 13.0, 15.0, 23.0, 8.0, 14.0, 29.0, 36.0, 20.0, 41.0, 56.0, 61.0, 102.0, 139.0, 493.0, 4409.0, 328102.0, 3801132.0, 56746.0, 1938.0, 327.0, 124.0, 70.0, 58.0, 57.0, 37.0, 25.0, 26.0, 31.0, 20.0, 12.0, 15.0, 13.0, 13.0, 8.0, 11.0, 3.0, 7.0, 3.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0], "bins": [-40.4375, -39.29345703125, -38.1494140625, -37.00537109375, -35.861328125, -34.71728515625, -33.5732421875, -32.42919921875, -31.28515625, -30.14111328125, -28.9970703125, -27.85302734375, -26.708984375, -25.56494140625, -24.4208984375, -23.27685546875, -22.1328125, -20.98876953125, -19.8447265625, -18.70068359375, -17.556640625, -16.41259765625, -15.2685546875, -14.12451171875, -12.98046875, -11.83642578125, -10.6923828125, -9.54833984375, -8.404296875, -7.26025390625, -6.1162109375, -4.97216796875, -3.828125, -2.68408203125, -1.5400390625, -0.39599609375, 0.748046875, 1.89208984375, 3.0361328125, 4.18017578125, 5.32421875, 6.46826171875, 7.6123046875, 8.75634765625, 9.900390625, 11.04443359375, 12.1884765625, 13.33251953125, 14.4765625, 15.62060546875, 16.7646484375, 17.90869140625, 19.052734375, 20.19677734375, 21.3408203125, 22.48486328125, 23.62890625, 24.77294921875, 25.9169921875, 27.06103515625, 28.205078125, 29.34912109375, 30.4931640625, 31.63720703125, 32.78125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 2.0, 4.0, 7.0, 12.0, 14.0, 12.0, 20.0, 30.0, 48.0, 49.0, 60.0, 88.0, 113.0, 179.0, 225.0, 290.0, 397.0, 413.0, 427.0, 390.0, 331.0, 245.0, 214.0, 131.0, 99.0, 78.0, 46.0, 29.0, 31.0, 21.0, 17.0, 15.0, 12.0, 9.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.59375, -11.13134765625, -10.6689453125, -10.20654296875, -9.744140625, -9.28173828125, -8.8193359375, -8.35693359375, -7.89453125, -7.43212890625, -6.9697265625, -6.50732421875, -6.044921875, -5.58251953125, -5.1201171875, -4.65771484375, -4.1953125, -3.73291015625, -3.2705078125, -2.80810546875, -2.345703125, -1.88330078125, -1.4208984375, -0.95849609375, -0.49609375, -0.03369140625, 0.4287109375, 0.89111328125, 1.353515625, 1.81591796875, 2.2783203125, 2.74072265625, 3.203125, 3.66552734375, 4.1279296875, 4.59033203125, 5.052734375, 5.51513671875, 5.9775390625, 6.43994140625, 6.90234375, 7.36474609375, 7.8271484375, 8.28955078125, 8.751953125, 9.21435546875, 9.6767578125, 10.13916015625, 10.6015625, 11.06396484375, 11.5263671875, 11.98876953125, 12.451171875, 12.91357421875, 13.3759765625, 13.83837890625, 14.30078125, 14.76318359375, 15.2255859375, 15.68798828125, 16.150390625, 16.61279296875, 17.0751953125, 17.53759765625, 18.0]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 4.0, 9.0, 5.0, 11.0, 6.0, 18.0, 22.0, 26.0, 32.0, 43.0, 68.0, 80.0, 87.0, 151.0, 203.0, 304.0, 528.0, 1497.0, 43787.0, 4030168.0, 113346.0, 2149.0, 614.0, 340.0, 206.0, 134.0, 105.0, 75.0, 75.0, 42.0, 28.0, 29.0, 25.0, 13.0, 15.0, 11.0, 4.0, 6.0, 5.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-55.78125, -53.75927734375, -51.7373046875, -49.71533203125, -47.693359375, -45.67138671875, -43.6494140625, -41.62744140625, -39.60546875, -37.58349609375, -35.5615234375, -33.53955078125, -31.517578125, -29.49560546875, -27.4736328125, -25.45166015625, -23.4296875, -21.40771484375, -19.3857421875, -17.36376953125, -15.341796875, -13.31982421875, -11.2978515625, -9.27587890625, -7.25390625, -5.23193359375, -3.2099609375, -1.18798828125, 0.833984375, 2.85595703125, 4.8779296875, 6.89990234375, 8.921875, 10.94384765625, 12.9658203125, 14.98779296875, 17.009765625, 19.03173828125, 21.0537109375, 23.07568359375, 25.09765625, 27.11962890625, 29.1416015625, 31.16357421875, 33.185546875, 35.20751953125, 37.2294921875, 39.25146484375, 41.2734375, 43.29541015625, 45.3173828125, 47.33935546875, 49.361328125, 51.38330078125, 53.4052734375, 55.42724609375, 57.44921875, 59.47119140625, 61.4931640625, 63.51513671875, 65.537109375, 67.55908203125, 69.5810546875, 71.60302734375, 73.625]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 8.0, 50.0, 146.0, 259.0, 297.0, 161.0, 70.0, 18.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-262.4325866699219, -257.2919006347656, -252.15122985839844, -247.01055908203125, -241.869873046875, -236.72918701171875, -231.58851623535156, -226.44784545898438, -221.30715942382812, -216.16647338867188, -211.0258026123047, -205.8851318359375, -200.74444580078125, -195.603759765625, -190.4630889892578, -185.32241821289062, -180.18173217773438, -175.04104614257812, -169.90037536621094, -164.75970458984375, -159.6190185546875, -154.47833251953125, -149.33766174316406, -144.19699096679688, -139.05630493164062, -133.91561889648438, -128.7749481201172, -123.63426971435547, -118.49359130859375, -113.35291290283203, -108.21223449707031, -103.0715560913086, -97.9308853149414, -92.79020690917969, -87.64952850341797, -82.50885009765625, -77.36817169189453, -72.22749328613281, -67.0868148803711, -61.946136474609375, -56.805458068847656, -51.66477966308594, -46.52410125732422, -41.3834228515625, -36.24274444580078, -31.102066040039062, -25.961387634277344, -20.820709228515625, -15.680030822753906, -10.539352416992188, -5.398674011230469, -0.25799560546875, 4.882682800292969, 10.023361206054688, 15.164039611816406, 20.304718017578125, 25.445396423339844, 30.586074829101562, 35.72675323486328, 40.867431640625, 46.00811004638672, 51.14878845214844, 56.289466857910156, 61.430145263671875, 66.5708236694336]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 3.0, 5.0, 6.0, 9.0, 11.0, 12.0, 15.0, 11.0, 18.0, 15.0, 26.0, 17.0, 18.0, 23.0, 23.0, 29.0, 40.0, 41.0, 29.0, 49.0, 34.0, 36.0, 35.0, 39.0, 34.0, 26.0, 41.0, 39.0, 35.0, 32.0, 24.0, 26.0, 25.0, 25.0, 21.0, 16.0, 23.0, 19.0, 12.0, 16.0, 5.0, 7.0, 12.0, 5.0, 5.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-43.546993255615234, -42.135963439941406, -40.724937438964844, -39.313907623291016, -37.90287780761719, -36.49184799194336, -35.08081817626953, -33.66979217529297, -32.25876235961914, -30.847732543945312, -29.436704635620117, -28.025676727294922, -26.614646911621094, -25.203617095947266, -23.79258918762207, -22.381561279296875, -20.970531463623047, -19.55950164794922, -18.148473739624023, -16.737445831298828, -15.326416015625, -13.915387153625488, -12.504358291625977, -11.093329429626465, -9.682300567626953, -8.271271705627441, -6.86024284362793, -5.449213981628418, -4.038185119628906, -2.6271562576293945, -1.2161273956298828, 0.1949014663696289, 1.605926513671875, 3.0169553756713867, 4.427984237670898, 5.83901309967041, 7.250041961669922, 8.661070823669434, 10.072099685668945, 11.483128547668457, 12.894157409667969, 14.30518627166748, 15.716215133666992, 17.127243041992188, 18.538272857666016, 19.949302673339844, 21.36033058166504, 22.771358489990234, 24.182388305664062, 25.59341812133789, 27.004446029663086, 28.41547393798828, 29.82650375366211, 31.237533569335938, 32.6485595703125, 34.05958938598633, 35.470619201660156, 36.881649017333984, 38.29267883300781, 39.703704833984375, 41.1147346496582, 42.52576446533203, 43.936790466308594, 45.34782028198242, 46.75885009765625]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 7.0, 5.0, 11.0, 7.0, 7.0, 13.0, 9.0, 9.0, 16.0, 17.0, 21.0, 25.0, 21.0, 28.0, 33.0, 27.0, 33.0, 38.0, 39.0, 35.0, 44.0, 28.0, 33.0, 35.0, 40.0, 34.0, 31.0, 33.0, 34.0, 30.0, 29.0, 18.0, 28.0, 24.0, 25.0, 21.0, 16.0, 19.0, 15.0, 14.0, 16.0, 3.0, 6.0, 5.0, 5.0, 2.0, 3.0, 3.0, 4.0, 3.0, 5.0, 0.0, 2.0, 1.0, 2.0], "bins": [-6.26171875, -6.06634521484375, -5.8709716796875, -5.67559814453125, -5.480224609375, -5.28485107421875, -5.0894775390625, -4.89410400390625, -4.69873046875, -4.50335693359375, -4.3079833984375, -4.11260986328125, -3.917236328125, -3.72186279296875, -3.5264892578125, -3.33111572265625, -3.1357421875, -2.94036865234375, -2.7449951171875, -2.54962158203125, -2.354248046875, -2.15887451171875, -1.9635009765625, -1.76812744140625, -1.57275390625, -1.37738037109375, -1.1820068359375, -0.98663330078125, -0.791259765625, -0.59588623046875, -0.4005126953125, -0.20513916015625, -0.009765625, 0.18560791015625, 0.3809814453125, 0.57635498046875, 0.771728515625, 0.96710205078125, 1.1624755859375, 1.35784912109375, 1.55322265625, 1.74859619140625, 1.9439697265625, 2.13934326171875, 2.334716796875, 2.53009033203125, 2.7254638671875, 2.92083740234375, 3.1162109375, 3.31158447265625, 3.5069580078125, 3.70233154296875, 3.897705078125, 4.09307861328125, 4.2884521484375, 4.48382568359375, 4.67919921875, 4.87457275390625, 5.0699462890625, 5.26531982421875, 5.460693359375, 5.65606689453125, 5.8514404296875, 6.04681396484375, 6.2421875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 9.0, 16.0, 21.0, 25.0, 34.0, 71.0, 86.0, 158.0, 234.0, 265.0, 438.0, 621.0, 952.0, 1322.0, 2068.0, 2981.0, 4435.0, 6624.0, 9956.0, 14815.0, 22238.0, 34247.0, 52210.0, 80934.0, 125483.0, 186072.0, 173130.0, 114869.0, 73524.0, 47701.0, 31196.0, 20445.0, 13579.0, 8929.0, 6116.0, 4165.0, 2720.0, 1880.0, 1231.0, 883.0, 612.0, 419.0, 275.0, 187.0, 134.0, 84.0, 68.0, 32.0, 30.0, 14.0, 11.0, 5.0, 3.0, 6.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.87939453125, -0.8509292602539062, -0.8224639892578125, -0.7939987182617188, -0.765533447265625, -0.7370681762695312, -0.7086029052734375, -0.6801376342773438, -0.65167236328125, -0.6232070922851562, -0.5947418212890625, -0.5662765502929688, -0.537811279296875, -0.5093460083007812, -0.4808807373046875, -0.45241546630859375, -0.4239501953125, -0.39548492431640625, -0.3670196533203125, -0.33855438232421875, -0.310089111328125, -0.28162384033203125, -0.2531585693359375, -0.22469329833984375, -0.19622802734375, -0.16776275634765625, -0.1392974853515625, -0.11083221435546875, -0.082366943359375, -0.05390167236328125, -0.0254364013671875, 0.00302886962890625, 0.031494140625, 0.05995941162109375, 0.0884246826171875, 0.11688995361328125, 0.145355224609375, 0.17382049560546875, 0.2022857666015625, 0.23075103759765625, 0.25921630859375, 0.28768157958984375, 0.3161468505859375, 0.34461212158203125, 0.373077392578125, 0.40154266357421875, 0.4300079345703125, 0.45847320556640625, 0.4869384765625, 0.5154037475585938, 0.5438690185546875, 0.5723342895507812, 0.600799560546875, 0.6292648315429688, 0.6577301025390625, 0.6861953735351562, 0.71466064453125, 0.7431259155273438, 0.7715911865234375, 0.8000564575195312, 0.828521728515625, 0.8569869995117188, 0.8854522705078125, 0.9139175415039062, 0.9423828125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 6.0, 7.0, 10.0, 8.0, 13.0, 12.0, 12.0, 14.0, 22.0, 21.0, 28.0, 29.0, 30.0, 21.0, 34.0, 32.0, 39.0, 46.0, 44.0, 45.0, 1055.0, 49.0, 51.0, 39.0, 45.0, 36.0, 36.0, 36.0, 32.0, 31.0, 20.0, 19.0, 19.0, 16.0, 15.0, 10.0, 10.0, 9.0, 6.0, 6.0, 4.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.5625, -4.41912841796875, -4.2757568359375, -4.13238525390625, -3.989013671875, -3.84564208984375, -3.7022705078125, -3.55889892578125, -3.41552734375, -3.27215576171875, -3.1287841796875, -2.98541259765625, -2.842041015625, -2.69866943359375, -2.5552978515625, -2.41192626953125, -2.2685546875, -2.12518310546875, -1.9818115234375, -1.83843994140625, -1.695068359375, -1.55169677734375, -1.4083251953125, -1.26495361328125, -1.12158203125, -0.97821044921875, -0.8348388671875, -0.69146728515625, -0.548095703125, -0.40472412109375, -0.2613525390625, -0.11798095703125, 0.025390625, 0.16876220703125, 0.3121337890625, 0.45550537109375, 0.598876953125, 0.74224853515625, 0.8856201171875, 1.02899169921875, 1.17236328125, 1.31573486328125, 1.4591064453125, 1.60247802734375, 1.745849609375, 1.88922119140625, 2.0325927734375, 2.17596435546875, 2.3193359375, 2.46270751953125, 2.6060791015625, 2.74945068359375, 2.892822265625, 3.03619384765625, 3.1795654296875, 3.32293701171875, 3.46630859375, 3.60968017578125, 3.7530517578125, 3.89642333984375, 4.039794921875, 4.18316650390625, 4.3265380859375, 4.46990966796875, 4.61328125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 4.0, 16.0, 17.0, 22.0, 41.0, 44.0, 73.0, 112.0, 197.0, 272.0, 383.0, 587.0, 954.0, 1421.0, 2154.0, 3202.0, 5005.0, 7637.0, 11823.0, 18295.0, 28566.0, 45317.0, 71421.0, 113664.0, 182420.0, 1248983.0, 130481.0, 81607.0, 51209.0, 32301.0, 20482.0, 13379.0, 8519.0, 5644.0, 3660.0, 2477.0, 1594.0, 1040.0, 727.0, 480.0, 286.0, 233.0, 110.0, 94.0, 68.0, 39.0, 29.0, 19.0, 11.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.8896484375, -0.861968994140625, -0.83428955078125, -0.806610107421875, -0.7789306640625, -0.751251220703125, -0.72357177734375, -0.695892333984375, -0.668212890625, -0.640533447265625, -0.61285400390625, -0.585174560546875, -0.5574951171875, -0.529815673828125, -0.50213623046875, -0.474456787109375, -0.44677734375, -0.419097900390625, -0.39141845703125, -0.363739013671875, -0.3360595703125, -0.308380126953125, -0.28070068359375, -0.253021240234375, -0.225341796875, -0.197662353515625, -0.16998291015625, -0.142303466796875, -0.1146240234375, -0.086944580078125, -0.05926513671875, -0.031585693359375, -0.00390625, 0.023773193359375, 0.05145263671875, 0.079132080078125, 0.1068115234375, 0.134490966796875, 0.16217041015625, 0.189849853515625, 0.217529296875, 0.245208740234375, 0.27288818359375, 0.300567626953125, 0.3282470703125, 0.355926513671875, 0.38360595703125, 0.411285400390625, 0.43896484375, 0.466644287109375, 0.49432373046875, 0.522003173828125, 0.5496826171875, 0.577362060546875, 0.60504150390625, 0.632720947265625, 0.660400390625, 0.688079833984375, 0.71575927734375, 0.743438720703125, 0.7711181640625, 0.798797607421875, 0.82647705078125, 0.854156494140625, 0.8818359375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 3.0, 6.0, 16.0, 10.0, 10.0, 23.0, 24.0, 24.0, 30.0, 39.0, 38.0, 41.0, 54.0, 56.0, 68.0, 70.0, 67.0, 42.0, 59.0, 55.0, 41.0, 45.0, 32.0, 29.0, 18.0, 17.0, 24.0, 11.0, 8.0, 8.0, 12.0, 7.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00154876708984375, -0.0014983564615249634, -0.0014479458332061768, -0.0013975352048873901, -0.0013471245765686035, -0.001296713948249817, -0.0012463033199310303, -0.0011958926916122437, -0.001145482063293457, -0.0010950714349746704, -0.0010446608066558838, -0.0009942501783370972, -0.0009438395500183105, -0.0008934289216995239, -0.0008430182933807373, -0.0007926076650619507, -0.0007421970367431641, -0.0006917864084243774, -0.0006413757801055908, -0.0005909651517868042, -0.0005405545234680176, -0.000490143895149231, -0.00043973326683044434, -0.0003893226385116577, -0.0003389120101928711, -0.00028850138187408447, -0.00023809075355529785, -0.00018768012523651123, -0.0001372694969177246, -8.685886859893799e-05, -3.644824028015137e-05, 1.3962388038635254e-05, 6.437301635742188e-05, 0.0001147836446762085, 0.00016519427299499512, 0.00021560490131378174, 0.00026601552963256836, 0.000316426157951355, 0.0003668367862701416, 0.0004172474145889282, 0.00046765804290771484, 0.0005180686712265015, 0.0005684792995452881, 0.0006188899278640747, 0.0006693005561828613, 0.000719711184501648, 0.0007701218128204346, 0.0008205324411392212, 0.0008709430694580078, 0.0009213536977767944, 0.0009717643260955811, 0.0010221749544143677, 0.0010725855827331543, 0.001122996211051941, 0.0011734068393707275, 0.0012238174676895142, 0.0012742280960083008, 0.0013246387243270874, 0.001375049352645874, 0.0014254599809646606, 0.0014758706092834473, 0.0015262812376022339, 0.0015766918659210205, 0.0016271024942398071, 0.0016775131225585938]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 9.0, 11.0, 8.0, 14.0, 20.0, 15.0, 22.0, 37.0, 44.0, 59.0, 87.0, 126.0, 208.0, 517.0, 2968.0, 1025286.0, 17589.0, 743.0, 291.0, 153.0, 95.0, 60.0, 47.0, 33.0, 28.0, 23.0, 15.0, 11.0, 6.0, 6.0, 1.0, 8.0, 10.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039093017578125, -0.03789567947387695, -0.036698341369628906, -0.03550100326538086, -0.03430366516113281, -0.033106327056884766, -0.03190898895263672, -0.030711650848388672, -0.029514312744140625, -0.028316974639892578, -0.02711963653564453, -0.025922298431396484, -0.024724960327148438, -0.02352762222290039, -0.022330284118652344, -0.021132946014404297, -0.01993560791015625, -0.018738269805908203, -0.017540931701660156, -0.01634359359741211, -0.015146255493164062, -0.013948917388916016, -0.012751579284667969, -0.011554241180419922, -0.010356903076171875, -0.009159564971923828, -0.007962226867675781, -0.006764888763427734, -0.0055675506591796875, -0.004370212554931641, -0.0031728744506835938, -0.001975536346435547, -0.0007781982421875, 0.0004191398620605469, 0.0016164779663085938, 0.0028138160705566406, 0.0040111541748046875, 0.005208492279052734, 0.006405830383300781, 0.007603168487548828, 0.008800506591796875, 0.009997844696044922, 0.011195182800292969, 0.012392520904541016, 0.013589859008789062, 0.01478719711303711, 0.015984535217285156, 0.017181873321533203, 0.01837921142578125, 0.019576549530029297, 0.020773887634277344, 0.02197122573852539, 0.023168563842773438, 0.024365901947021484, 0.02556324005126953, 0.026760578155517578, 0.027957916259765625, 0.029155254364013672, 0.03035259246826172, 0.031549930572509766, 0.03274726867675781, 0.03394460678100586, 0.035141944885253906, 0.03633928298950195, 0.03753662109375]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 4.0, 16.0, 42.0, 106.0, 184.0, 210.0, 199.0, 127.0, 69.0, 29.0, 17.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0020032308530062437, -0.0019485864322632551, -0.0018939421279355884, -0.0018392977071925998, -0.0017846532864496112, -0.0017300089821219444, -0.0016753645613789558, -0.0016207201406359673, -0.0015660757198929787, -0.00151143129914999, -0.0014567869948223233, -0.0014021425740793347, -0.0013474981533363461, -0.0012928538490086794, -0.0012382094282656908, -0.0011835650075227022, -0.0011289207031950355, -0.0010742762824520469, -0.0010196319781243801, -0.0009649875573813915, -0.0009103431366384029, -0.0008556987741030753, -0.0008010544115677476, -0.000746409990824759, -0.0006917656282894313, -0.0006371212657541037, -0.0005824768450111151, -0.0005278324824757874, -0.00047318809083662927, -0.00041854369919747114, -0.00036389933666214347, -0.00030925494502298534, -0.0002546104369685054, -0.00019996604532934725, -0.00014532166824210435, -9.067729115486145e-05, -3.603289951570332e-05, 1.861149212345481e-05, 7.325585465878248e-05, 0.0001279002462979406, 0.00018254463793709874, 0.00023718902957625687, 0.000291833421215415, 0.0003464777837507427, 0.0004011221753899008, 0.00045576656702905893, 0.0005104109295643866, 0.0005650552920997143, 0.0006196997128427029, 0.0006743440753780305, 0.0007289884961210191, 0.0007836328586563468, 0.0008382772793993354, 0.0008929216419346631, 0.0009475660044699907, 0.0010022104252129793, 0.001056854845955968, 0.0011114992666989565, 0.0011661435710266232, 0.0012207879917696118, 0.0012754324125126004, 0.0013300767168402672, 0.0013847211375832558, 0.0014393655583262444, 0.0014940098626539111]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 1.0, 3.0, 9.0, 4.0, 6.0, 13.0, 14.0, 22.0, 11.0, 18.0, 26.0, 23.0, 32.0, 28.0, 29.0, 29.0, 42.0, 32.0, 34.0, 37.0, 41.0, 41.0, 43.0, 40.0, 40.0, 35.0, 32.0, 28.0, 32.0, 29.0, 28.0, 26.0, 31.0, 19.0, 14.0, 13.0, 19.0, 18.0, 11.0, 13.0, 9.0, 7.0, 4.0, 1.0, 6.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0007635951042175293, -0.0007400056347250938, -0.0007164161652326584, -0.0006928266957402229, -0.0006692372262477875, -0.000645647756755352, -0.0006220582872629166, -0.0005984688177704811, -0.0005748793482780457, -0.0005512898787856102, -0.0005277004092931747, -0.0005041109398007393, -0.00048052147030830383, -0.0004569320008158684, -0.0004333425313234329, -0.00040975306183099747, -0.000386163592338562, -0.00036257412284612656, -0.0003389846533536911, -0.00031539518386125565, -0.0002918057143688202, -0.00026821624487638474, -0.0002446267753839493, -0.00022103730589151382, -0.00019744783639907837, -0.00017385836690664291, -0.00015026889741420746, -0.000126679427921772, -0.00010308995842933655, -7.950048893690109e-05, -5.591101944446564e-05, -3.232154995203018e-05, -8.732080459594727e-06, 1.4857389032840729e-05, 3.8446858525276184e-05, 6.203632801771164e-05, 8.56257975101471e-05, 0.00010921526700258255, 0.000132804736495018, 0.00015639420598745346, 0.00017998367547988892, 0.00020357314497232437, 0.00022716261446475983, 0.0002507520839571953, 0.00027434155344963074, 0.0002979310229420662, 0.00032152049243450165, 0.0003451099619269371, 0.00036869943141937256, 0.000392288900911808, 0.00041587837040424347, 0.0004394678398966789, 0.0004630573093891144, 0.00048664677888154984, 0.0005102362483739853, 0.0005338257178664207, 0.0005574151873588562, 0.0005810046568512917, 0.0006045941263437271, 0.0006281835958361626, 0.000651773065328598, 0.0006753625348210335, 0.0006989520043134689, 0.0007225414738059044, 0.0007461309432983398]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 7.0, 5.0, 11.0, 7.0, 7.0, 13.0, 9.0, 9.0, 15.0, 18.0, 21.0, 25.0, 21.0, 28.0, 32.0, 28.0, 33.0, 37.0, 39.0, 34.0, 46.0, 28.0, 32.0, 36.0, 39.0, 34.0, 32.0, 32.0, 34.0, 31.0, 29.0, 17.0, 29.0, 24.0, 23.0, 23.0, 16.0, 18.0, 16.0, 13.0, 17.0, 3.0, 6.0, 5.0, 5.0, 2.0, 3.0, 3.0, 4.0, 3.0, 5.0, 0.0, 2.0, 1.0, 2.0], "bins": [-6.26171875, -6.06640625, -5.87109375, -5.67578125, -5.48046875, -5.28515625, -5.08984375, -4.89453125, -4.69921875, -4.50390625, -4.30859375, -4.11328125, -3.91796875, -3.72265625, -3.52734375, -3.33203125, -3.13671875, -2.94140625, -2.74609375, -2.55078125, -2.35546875, -2.16015625, -1.96484375, -1.76953125, -1.57421875, -1.37890625, -1.18359375, -0.98828125, -0.79296875, -0.59765625, -0.40234375, -0.20703125, -0.01171875, 0.18359375, 0.37890625, 0.57421875, 0.76953125, 0.96484375, 1.16015625, 1.35546875, 1.55078125, 1.74609375, 1.94140625, 2.13671875, 2.33203125, 2.52734375, 2.72265625, 2.91796875, 3.11328125, 3.30859375, 3.50390625, 3.69921875, 3.89453125, 4.08984375, 4.28515625, 4.48046875, 4.67578125, 4.87109375, 5.06640625, 5.26171875, 5.45703125, 5.65234375, 5.84765625, 6.04296875, 6.23828125]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 8.0, 5.0, 2.0, 7.0, 11.0, 17.0, 25.0, 35.0, 52.0, 80.0, 113.0, 178.0, 248.0, 381.0, 577.0, 864.0, 1256.0, 1840.0, 2951.0, 4765.0, 7662.0, 12692.0, 22361.0, 43130.0, 93370.0, 236044.0, 347861.0, 139205.0, 60609.0, 29932.0, 16184.0, 9658.0, 5766.0, 3681.0, 2399.0, 1565.0, 1006.0, 654.0, 417.0, 297.0, 191.0, 145.0, 95.0, 65.0, 46.0, 37.0, 23.0, 20.0, 10.0, 7.0, 8.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.3828125, -3.281005859375, -3.17919921875, -3.077392578125, -2.9755859375, -2.873779296875, -2.77197265625, -2.670166015625, -2.568359375, -2.466552734375, -2.36474609375, -2.262939453125, -2.1611328125, -2.059326171875, -1.95751953125, -1.855712890625, -1.75390625, -1.652099609375, -1.55029296875, -1.448486328125, -1.3466796875, -1.244873046875, -1.14306640625, -1.041259765625, -0.939453125, -0.837646484375, -0.73583984375, -0.634033203125, -0.5322265625, -0.430419921875, -0.32861328125, -0.226806640625, -0.125, -0.023193359375, 0.07861328125, 0.180419921875, 0.2822265625, 0.384033203125, 0.48583984375, 0.587646484375, 0.689453125, 0.791259765625, 0.89306640625, 0.994873046875, 1.0966796875, 1.198486328125, 1.30029296875, 1.402099609375, 1.50390625, 1.605712890625, 1.70751953125, 1.809326171875, 1.9111328125, 2.012939453125, 2.11474609375, 2.216552734375, 2.318359375, 2.420166015625, 2.52197265625, 2.623779296875, 2.7255859375, 2.827392578125, 2.92919921875, 3.031005859375, 3.1328125]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 6.0, 6.0, 7.0, 15.0, 14.0, 10.0, 8.0, 20.0, 15.0, 23.0, 27.0, 39.0, 53.0, 46.0, 33.0, 44.0, 62.0, 149.0, 1739.0, 219.0, 72.0, 53.0, 52.0, 42.0, 43.0, 24.0, 34.0, 30.0, 21.0, 28.0, 27.0, 13.0, 13.0, 9.0, 15.0, 9.0, 8.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.328125, -21.51904296875, -20.7099609375, -19.90087890625, -19.091796875, -18.28271484375, -17.4736328125, -16.66455078125, -15.85546875, -15.04638671875, -14.2373046875, -13.42822265625, -12.619140625, -11.81005859375, -11.0009765625, -10.19189453125, -9.3828125, -8.57373046875, -7.7646484375, -6.95556640625, -6.146484375, -5.33740234375, -4.5283203125, -3.71923828125, -2.91015625, -2.10107421875, -1.2919921875, -0.48291015625, 0.326171875, 1.13525390625, 1.9443359375, 2.75341796875, 3.5625, 4.37158203125, 5.1806640625, 5.98974609375, 6.798828125, 7.60791015625, 8.4169921875, 9.22607421875, 10.03515625, 10.84423828125, 11.6533203125, 12.46240234375, 13.271484375, 14.08056640625, 14.8896484375, 15.69873046875, 16.5078125, 17.31689453125, 18.1259765625, 18.93505859375, 19.744140625, 20.55322265625, 21.3623046875, 22.17138671875, 22.98046875, 23.78955078125, 24.5986328125, 25.40771484375, 26.216796875, 27.02587890625, 27.8349609375, 28.64404296875, 29.453125]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 5.0, 8.0, 6.0, 9.0, 16.0, 35.0, 23.0, 34.0, 58.0, 55.0, 88.0, 116.0, 182.0, 354.0, 681.0, 4077.0, 3034288.0, 102925.0, 1499.0, 464.0, 260.0, 180.0, 109.0, 60.0, 39.0, 20.0, 29.0, 25.0, 17.0, 11.0, 12.0, 7.0, 4.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-78.5625, -76.484375, -74.40625, -72.328125, -70.25, -68.171875, -66.09375, -64.015625, -61.9375, -59.859375, -57.78125, -55.703125, -53.625, -51.546875, -49.46875, -47.390625, -45.3125, -43.234375, -41.15625, -39.078125, -37.0, -34.921875, -32.84375, -30.765625, -28.6875, -26.609375, -24.53125, -22.453125, -20.375, -18.296875, -16.21875, -14.140625, -12.0625, -9.984375, -7.90625, -5.828125, -3.75, -1.671875, 0.40625, 2.484375, 4.5625, 6.640625, 8.71875, 10.796875, 12.875, 14.953125, 17.03125, 19.109375, 21.1875, 23.265625, 25.34375, 27.421875, 29.5, 31.578125, 33.65625, 35.734375, 37.8125, 39.890625, 41.96875, 44.046875, 46.125, 48.203125, 50.28125, 52.359375, 54.4375]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 8.0, 13.0, 33.0, 93.0, 176.0, 213.0, 219.0, 140.0, 76.0, 27.0, 7.0, 3.0, 1.0, 1.0, 2.0], "bins": [-77.00790405273438, -75.60250854492188, -74.1971206665039, -72.79173278808594, -71.38633728027344, -69.98094177246094, -68.57555389404297, -67.170166015625, -65.7647705078125, -64.359375, -62.95398712158203, -61.5485954284668, -60.14320373535156, -58.73781204223633, -57.332420349121094, -55.92702865600586, -54.521636962890625, -53.11624526977539, -51.710853576660156, -50.30546188354492, -48.90007019042969, -47.49467849731445, -46.08928680419922, -44.683895111083984, -43.27850341796875, -41.873111724853516, -40.46772003173828, -39.06232833862305, -37.65693664550781, -36.25154495239258, -34.846153259277344, -33.44076156616211, -32.035369873046875, -30.62997817993164, -29.224586486816406, -27.819194793701172, -26.413803100585938, -25.008411407470703, -23.60301971435547, -22.197628021240234, -20.792236328125, -19.386844635009766, -17.98145294189453, -16.576061248779297, -15.170669555664062, -13.765277862548828, -12.359886169433594, -10.95449447631836, -9.549103736877441, -8.143712043762207, -6.738320350646973, -5.332928657531738, -3.927536964416504, -2.5221452713012695, -1.1167535781860352, 0.2886381149291992, 1.6940298080444336, 3.099421501159668, 4.504813194274902, 5.910204887390137, 7.315596580505371, 8.720988273620605, 10.12637996673584, 11.531771659851074, 12.937163352966309]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 8.0, 4.0, 2.0, 7.0, 7.0, 9.0, 7.0, 13.0, 10.0, 22.0, 29.0, 24.0, 29.0, 20.0, 33.0, 29.0, 39.0, 26.0, 32.0, 51.0, 52.0, 35.0, 43.0, 43.0, 38.0, 39.0, 41.0, 32.0, 31.0, 31.0, 34.0, 24.0, 24.0, 26.0, 22.0, 8.0, 18.0, 21.0, 8.0, 6.0, 12.0, 2.0, 6.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-63.31575012207031, -61.22175598144531, -59.12776184082031, -57.03377151489258, -54.93977737426758, -52.84578323364258, -50.751792907714844, -48.657798767089844, -46.563804626464844, -44.469810485839844, -42.375816345214844, -40.28182601928711, -38.18783187866211, -36.09383773803711, -33.999847412109375, -31.905853271484375, -29.811859130859375, -27.717864990234375, -25.623872756958008, -23.52988052368164, -21.43588638305664, -19.34189224243164, -17.247900009155273, -15.15390682220459, -13.059913635253906, -10.965920448303223, -8.871927261352539, -6.7779340744018555, -4.683940887451172, -2.5899477005004883, -0.4959545135498047, 1.598038673400879, 3.6920394897460938, 5.786032676696777, 7.880025863647461, 9.974019050598145, 12.068012237548828, 14.162005424499512, 16.255998611450195, 18.349990844726562, 20.443984985351562, 22.537979125976562, 24.63197135925293, 26.725963592529297, 28.819957733154297, 30.913951873779297, 33.00794219970703, 35.10193634033203, 37.19593048095703, 39.28992462158203, 41.38391876220703, 43.477909088134766, 45.571903228759766, 47.665897369384766, 49.7598876953125, 51.8538818359375, 53.9478759765625, 56.0418701171875, 58.1358642578125, 60.229854583740234, 62.323848724365234, 64.41783905029297, 66.51183319091797, 68.60582733154297, 70.69982147216797]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 8.0, 9.0, 5.0, 10.0, 12.0, 5.0, 16.0, 9.0, 22.0, 13.0, 22.0, 19.0, 30.0, 32.0, 27.0, 25.0, 23.0, 44.0, 33.0, 34.0, 34.0, 30.0, 35.0, 32.0, 33.0, 33.0, 33.0, 36.0, 32.0, 35.0, 21.0, 23.0, 28.0, 18.0, 22.0, 20.0, 16.0, 19.0, 16.0, 21.0, 9.0, 13.0, 6.0, 7.0, 6.0, 2.0, 3.0, 5.0, 3.0, 3.0, 3.0, 6.0, 2.0, 1.0, 1.0, 3.0], "bins": [-5.97265625, -5.781494140625, -5.59033203125, -5.399169921875, -5.2080078125, -5.016845703125, -4.82568359375, -4.634521484375, -4.443359375, -4.252197265625, -4.06103515625, -3.869873046875, -3.6787109375, -3.487548828125, -3.29638671875, -3.105224609375, -2.9140625, -2.722900390625, -2.53173828125, -2.340576171875, -2.1494140625, -1.958251953125, -1.76708984375, -1.575927734375, -1.384765625, -1.193603515625, -1.00244140625, -0.811279296875, -0.6201171875, -0.428955078125, -0.23779296875, -0.046630859375, 0.14453125, 0.335693359375, 0.52685546875, 0.718017578125, 0.9091796875, 1.100341796875, 1.29150390625, 1.482666015625, 1.673828125, 1.864990234375, 2.05615234375, 2.247314453125, 2.4384765625, 2.629638671875, 2.82080078125, 3.011962890625, 3.203125, 3.394287109375, 3.58544921875, 3.776611328125, 3.9677734375, 4.158935546875, 4.35009765625, 4.541259765625, 4.732421875, 4.923583984375, 5.11474609375, 5.305908203125, 5.4970703125, 5.688232421875, 5.87939453125, 6.070556640625, 6.26171875]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 7.0, 13.0, 15.0, 18.0, 28.0, 43.0, 53.0, 73.0, 104.0, 136.0, 231.0, 347.0, 610.0, 1163.0, 2351.0, 5673.0, 16109.0, 66709.0, 369911.0, 1421316.0, 1677084.0, 513443.0, 86435.0, 19875.0, 6569.0, 2761.0, 1344.0, 662.0, 398.0, 234.0, 165.0, 96.0, 74.0, 64.0, 49.0, 40.0, 26.0, 16.0, 12.0, 13.0, 10.0, 4.0, 2.0, 2.0, 3.0], "bins": [-12.4375, -12.119384765625, -11.80126953125, -11.483154296875, -11.1650390625, -10.846923828125, -10.52880859375, -10.210693359375, -9.892578125, -9.574462890625, -9.25634765625, -8.938232421875, -8.6201171875, -8.302001953125, -7.98388671875, -7.665771484375, -7.34765625, -7.029541015625, -6.71142578125, -6.393310546875, -6.0751953125, -5.757080078125, -5.43896484375, -5.120849609375, -4.802734375, -4.484619140625, -4.16650390625, -3.848388671875, -3.5302734375, -3.212158203125, -2.89404296875, -2.575927734375, -2.2578125, -1.939697265625, -1.62158203125, -1.303466796875, -0.9853515625, -0.667236328125, -0.34912109375, -0.031005859375, 0.287109375, 0.605224609375, 0.92333984375, 1.241455078125, 1.5595703125, 1.877685546875, 2.19580078125, 2.513916015625, 2.83203125, 3.150146484375, 3.46826171875, 3.786376953125, 4.1044921875, 4.422607421875, 4.74072265625, 5.058837890625, 5.376953125, 5.695068359375, 6.01318359375, 6.331298828125, 6.6494140625, 6.967529296875, 7.28564453125, 7.603759765625, 7.921875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 5.0, 1.0, 3.0, 1.0, 9.0, 9.0, 8.0, 9.0, 10.0, 12.0, 13.0, 18.0, 20.0, 29.0, 42.0, 57.0, 69.0, 85.0, 102.0, 161.0, 176.0, 241.0, 291.0, 335.0, 366.0, 383.0, 319.0, 281.0, 227.0, 176.0, 123.0, 113.0, 78.0, 76.0, 58.0, 39.0, 37.0, 22.0, 23.0, 19.0, 19.0, 8.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.4375, -10.0361328125, -9.634765625, -9.2333984375, -8.83203125, -8.4306640625, -8.029296875, -7.6279296875, -7.2265625, -6.8251953125, -6.423828125, -6.0224609375, -5.62109375, -5.2197265625, -4.818359375, -4.4169921875, -4.015625, -3.6142578125, -3.212890625, -2.8115234375, -2.41015625, -2.0087890625, -1.607421875, -1.2060546875, -0.8046875, -0.4033203125, -0.001953125, 0.3994140625, 0.80078125, 1.2021484375, 1.603515625, 2.0048828125, 2.40625, 2.8076171875, 3.208984375, 3.6103515625, 4.01171875, 4.4130859375, 4.814453125, 5.2158203125, 5.6171875, 6.0185546875, 6.419921875, 6.8212890625, 7.22265625, 7.6240234375, 8.025390625, 8.4267578125, 8.828125, 9.2294921875, 9.630859375, 10.0322265625, 10.43359375, 10.8349609375, 11.236328125, 11.6376953125, 12.0390625, 12.4404296875, 12.841796875, 13.2431640625, 13.64453125, 14.0458984375, 14.447265625, 14.8486328125, 15.25]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 6.0, 0.0, 4.0, 5.0, 10.0, 14.0, 12.0, 23.0, 20.0, 15.0, 40.0, 27.0, 54.0, 73.0, 80.0, 108.0, 152.0, 245.0, 389.0, 1067.0, 14258.0, 3378750.0, 791433.0, 5569.0, 775.0, 321.0, 221.0, 149.0, 100.0, 70.0, 59.0, 46.0, 50.0, 29.0, 24.0, 17.0, 20.0, 8.0, 6.0, 13.0, 3.0, 6.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0], "bins": [-65.9375, -64.04638671875, -62.1552734375, -60.26416015625, -58.373046875, -56.48193359375, -54.5908203125, -52.69970703125, -50.80859375, -48.91748046875, -47.0263671875, -45.13525390625, -43.244140625, -41.35302734375, -39.4619140625, -37.57080078125, -35.6796875, -33.78857421875, -31.8974609375, -30.00634765625, -28.115234375, -26.22412109375, -24.3330078125, -22.44189453125, -20.55078125, -18.65966796875, -16.7685546875, -14.87744140625, -12.986328125, -11.09521484375, -9.2041015625, -7.31298828125, -5.421875, -3.53076171875, -1.6396484375, 0.25146484375, 2.142578125, 4.03369140625, 5.9248046875, 7.81591796875, 9.70703125, 11.59814453125, 13.4892578125, 15.38037109375, 17.271484375, 19.16259765625, 21.0537109375, 22.94482421875, 24.8359375, 26.72705078125, 28.6181640625, 30.50927734375, 32.400390625, 34.29150390625, 36.1826171875, 38.07373046875, 39.96484375, 41.85595703125, 43.7470703125, 45.63818359375, 47.529296875, 49.42041015625, 51.3115234375, 53.20263671875, 55.09375]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 7.0, 11.0, 10.0, 14.0, 16.0, 19.0, 26.0, 50.0, 42.0, 58.0, 63.0, 74.0, 82.0, 82.0, 89.0, 91.0, 58.0, 59.0, 38.0, 33.0, 28.0, 19.0, 14.0, 11.0, 9.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.831884384155273, -21.42334747314453, -20.014812469482422, -18.60627555847168, -17.19774055480957, -15.789203643798828, -14.380667686462402, -12.972131729125977, -11.56359577178955, -10.155059814453125, -8.7465238571167, -7.337987422943115, -5.9294514656066895, -4.520915508270264, -3.1123790740966797, -1.703843116760254, -0.2953071594238281, 1.1132289171218872, 2.5217649936676025, 3.9303011894226074, 5.338837146759033, 6.747373104095459, 8.155909538269043, 9.564445495605469, 10.972981452941895, 12.38151741027832, 13.790053367614746, 15.198589324951172, 16.607126235961914, 18.015661239624023, 19.424198150634766, 20.832733154296875, 22.241268157958984, 23.649805068969727, 25.058340072631836, 26.466876983642578, 27.875411987304688, 29.28394889831543, 30.692485809326172, 32.10102081298828, 33.50955581665039, 34.9180908203125, 36.326629638671875, 37.735164642333984, 39.143699645996094, 40.5522346496582, 41.96077346801758, 43.36930847167969, 44.77784729003906, 46.18638229370117, 47.59492111206055, 49.003456115722656, 50.411991119384766, 51.820526123046875, 53.22906494140625, 54.63759994506836, 56.04613494873047, 57.45466995239258, 58.86320877075195, 60.27174377441406, 61.68027877807617, 63.08881378173828, 64.49735260009766, 65.9058837890625, 67.31442260742188]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 12.0, 7.0, 7.0, 6.0, 12.0, 16.0, 19.0, 27.0, 22.0, 27.0, 31.0, 35.0, 39.0, 44.0, 39.0, 30.0, 36.0, 49.0, 46.0, 37.0, 39.0, 33.0, 43.0, 35.0, 31.0, 30.0, 29.0, 26.0, 24.0, 29.0, 27.0, 20.0, 15.0, 13.0, 9.0, 15.0, 11.0, 6.0, 8.0, 2.0, 8.0, 3.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0], "bins": [-53.66212463378906, -52.12750244140625, -50.59288024902344, -49.058258056640625, -47.52363204956055, -45.989009857177734, -44.45438766479492, -42.91976547241211, -41.3851432800293, -39.850521087646484, -38.31589889526367, -36.781272888183594, -35.24665069580078, -33.71202850341797, -32.177406311035156, -30.642784118652344, -29.1081600189209, -27.573537826538086, -26.03891372680664, -24.504291534423828, -22.969669342041016, -21.435047149658203, -19.900423049926758, -18.365800857543945, -16.8311767578125, -15.296553611755371, -13.761931419372559, -12.22730827331543, -10.692686080932617, -9.158062934875488, -7.623439788818359, -6.088817596435547, -4.554195404052734, -3.0195727348327637, -1.4849498271942139, 0.04967308044433594, 1.5842957496643066, 3.1189184188842773, 4.653541564941406, 6.188163757324219, 7.722786903381348, 9.257410049438477, 10.792032241821289, 12.326655387878418, 13.861278533935547, 15.39590072631836, 16.930522918701172, 18.465145111083984, 19.99976921081543, 21.534391403198242, 23.069015502929688, 24.6036376953125, 26.138259887695312, 27.672882080078125, 29.20750617980957, 30.742128372192383, 32.27675247192383, 33.81137466430664, 35.34599685668945, 36.88062286376953, 38.415245056152344, 39.949867248535156, 41.48448944091797, 43.01911163330078, 44.553733825683594]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 9.0, 13.0, 10.0, 11.0, 19.0, 12.0, 18.0, 16.0, 20.0, 18.0, 21.0, 14.0, 39.0, 41.0, 32.0, 40.0, 40.0, 21.0, 29.0, 44.0, 41.0, 34.0, 33.0, 38.0, 34.0, 27.0, 29.0, 30.0, 32.0, 28.0, 23.0, 23.0, 21.0, 21.0, 20.0, 24.0, 6.0, 8.0, 15.0, 7.0, 8.0, 1.0, 6.0, 8.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 3.0, 4.0, 0.0, 1.0], "bins": [-6.0703125, -5.87359619140625, -5.6768798828125, -5.48016357421875, -5.283447265625, -5.08673095703125, -4.8900146484375, -4.69329833984375, -4.49658203125, -4.29986572265625, -4.1031494140625, -3.90643310546875, -3.709716796875, -3.51300048828125, -3.3162841796875, -3.11956787109375, -2.9228515625, -2.72613525390625, -2.5294189453125, -2.33270263671875, -2.135986328125, -1.93927001953125, -1.7425537109375, -1.54583740234375, -1.34912109375, -1.15240478515625, -0.9556884765625, -0.75897216796875, -0.562255859375, -0.36553955078125, -0.1688232421875, 0.02789306640625, 0.224609375, 0.42132568359375, 0.6180419921875, 0.81475830078125, 1.011474609375, 1.20819091796875, 1.4049072265625, 1.60162353515625, 1.79833984375, 1.99505615234375, 2.1917724609375, 2.38848876953125, 2.585205078125, 2.78192138671875, 2.9786376953125, 3.17535400390625, 3.3720703125, 3.56878662109375, 3.7655029296875, 3.96221923828125, 4.158935546875, 4.35565185546875, 4.5523681640625, 4.74908447265625, 4.94580078125, 5.14251708984375, 5.3392333984375, 5.53594970703125, 5.732666015625, 5.92938232421875, 6.1260986328125, 6.32281494140625, 6.51953125]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 6.0, 1.0, 3.0, 7.0, 8.0, 10.0, 30.0, 32.0, 39.0, 70.0, 98.0, 123.0, 213.0, 329.0, 491.0, 771.0, 1147.0, 1708.0, 2510.0, 3928.0, 5996.0, 8971.0, 13847.0, 20933.0, 32373.0, 50135.0, 77998.0, 125635.0, 199954.0, 184197.0, 113842.0, 71252.0, 45859.0, 29566.0, 19456.0, 12794.0, 8237.0, 5389.0, 3506.0, 2369.0, 1569.0, 982.0, 745.0, 490.0, 296.0, 227.0, 156.0, 96.0, 52.0, 47.0, 27.0, 12.0, 10.0, 11.0, 10.0, 2.0, 4.0, 1.0, 1.0, 3.0], "bins": [-1.0263671875, -0.9951705932617188, -0.9639739990234375, -0.9327774047851562, -0.901580810546875, -0.8703842163085938, -0.8391876220703125, -0.8079910278320312, -0.77679443359375, -0.7455978393554688, -0.7144012451171875, -0.6832046508789062, -0.652008056640625, -0.6208114624023438, -0.5896148681640625, -0.5584182739257812, -0.5272216796875, -0.49602508544921875, -0.4648284912109375, -0.43363189697265625, -0.402435302734375, -0.37123870849609375, -0.3400421142578125, -0.30884552001953125, -0.27764892578125, -0.24645233154296875, -0.2152557373046875, -0.18405914306640625, -0.152862548828125, -0.12166595458984375, -0.0904693603515625, -0.05927276611328125, -0.028076171875, 0.00312042236328125, 0.0343170166015625, 0.06551361083984375, 0.096710205078125, 0.12790679931640625, 0.1591033935546875, 0.19029998779296875, 0.22149658203125, 0.25269317626953125, 0.2838897705078125, 0.31508636474609375, 0.346282958984375, 0.37747955322265625, 0.4086761474609375, 0.43987274169921875, 0.4710693359375, 0.5022659301757812, 0.5334625244140625, 0.5646591186523438, 0.595855712890625, 0.6270523071289062, 0.6582489013671875, 0.6894454956054688, 0.72064208984375, 0.7518386840820312, 0.7830352783203125, 0.8142318725585938, 0.845428466796875, 0.8766250610351562, 0.9078216552734375, 0.9390182495117188, 0.97021484375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 4.0, 6.0, 4.0, 4.0, 4.0, 6.0, 10.0, 8.0, 15.0, 8.0, 13.0, 17.0, 20.0, 20.0, 20.0, 32.0, 31.0, 33.0, 29.0, 39.0, 47.0, 52.0, 45.0, 1064.0, 42.0, 35.0, 40.0, 41.0, 37.0, 39.0, 33.0, 39.0, 28.0, 25.0, 23.0, 26.0, 21.0, 16.0, 10.0, 10.0, 10.0, 9.0, 6.0, 8.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.00390625, -3.860107421875, -3.71630859375, -3.572509765625, -3.4287109375, -3.284912109375, -3.14111328125, -2.997314453125, -2.853515625, -2.709716796875, -2.56591796875, -2.422119140625, -2.2783203125, -2.134521484375, -1.99072265625, -1.846923828125, -1.703125, -1.559326171875, -1.41552734375, -1.271728515625, -1.1279296875, -0.984130859375, -0.84033203125, -0.696533203125, -0.552734375, -0.408935546875, -0.26513671875, -0.121337890625, 0.0224609375, 0.166259765625, 0.31005859375, 0.453857421875, 0.59765625, 0.741455078125, 0.88525390625, 1.029052734375, 1.1728515625, 1.316650390625, 1.46044921875, 1.604248046875, 1.748046875, 1.891845703125, 2.03564453125, 2.179443359375, 2.3232421875, 2.467041015625, 2.61083984375, 2.754638671875, 2.8984375, 3.042236328125, 3.18603515625, 3.329833984375, 3.4736328125, 3.617431640625, 3.76123046875, 3.905029296875, 4.048828125, 4.192626953125, 4.33642578125, 4.480224609375, 4.6240234375, 4.767822265625, 4.91162109375, 5.055419921875, 5.19921875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 3.0, 3.0, 12.0, 16.0, 17.0, 26.0, 45.0, 61.0, 94.0, 116.0, 184.0, 288.0, 442.0, 630.0, 995.0, 1431.0, 2174.0, 3116.0, 4750.0, 7234.0, 10626.0, 15837.0, 24025.0, 35958.0, 54169.0, 81564.0, 124827.0, 1231444.0, 167791.0, 111383.0, 72680.0, 48415.0, 32446.0, 21393.0, 14114.0, 9551.0, 6264.0, 4183.0, 2925.0, 1925.0, 1298.0, 848.0, 635.0, 383.0, 273.0, 189.0, 122.0, 86.0, 58.0, 36.0, 27.0, 10.0, 7.0, 3.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.78857421875, -0.7630233764648438, -0.7374725341796875, -0.7119216918945312, -0.686370849609375, -0.6608200073242188, -0.6352691650390625, -0.6097183227539062, -0.58416748046875, -0.5586166381835938, -0.5330657958984375, -0.5075149536132812, -0.481964111328125, -0.45641326904296875, -0.4308624267578125, -0.40531158447265625, -0.3797607421875, -0.35420989990234375, -0.3286590576171875, -0.30310821533203125, -0.277557373046875, -0.25200653076171875, -0.2264556884765625, -0.20090484619140625, -0.17535400390625, -0.14980316162109375, -0.1242523193359375, -0.09870147705078125, -0.073150634765625, -0.04759979248046875, -0.0220489501953125, 0.00350189208984375, 0.029052734375, 0.05460357666015625, 0.0801544189453125, 0.10570526123046875, 0.131256103515625, 0.15680694580078125, 0.1823577880859375, 0.20790863037109375, 0.23345947265625, 0.25901031494140625, 0.2845611572265625, 0.31011199951171875, 0.335662841796875, 0.36121368408203125, 0.3867645263671875, 0.41231536865234375, 0.4378662109375, 0.46341705322265625, 0.4889678955078125, 0.5145187377929688, 0.540069580078125, 0.5656204223632812, 0.5911712646484375, 0.6167221069335938, 0.64227294921875, 0.6678237915039062, 0.6933746337890625, 0.7189254760742188, 0.744476318359375, 0.7700271606445312, 0.7955780029296875, 0.8211288452148438, 0.8466796875]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 7.0, 5.0, 7.0, 7.0, 10.0, 7.0, 16.0, 20.0, 31.0, 41.0, 36.0, 42.0, 67.0, 98.0, 82.0, 72.0, 59.0, 52.0, 71.0, 53.0, 39.0, 30.0, 31.0, 32.0, 20.0, 15.0, 4.0, 7.0, 9.0, 7.0, 5.0, 4.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019407272338867188, -0.0018734186887741089, -0.001806110143661499, -0.0017388015985488892, -0.0016714930534362793, -0.0016041845083236694, -0.0015368759632110596, -0.0014695674180984497, -0.0014022588729858398, -0.00133495032787323, -0.0012676417827606201, -0.0012003332376480103, -0.0011330246925354004, -0.0010657161474227905, -0.0009984076023101807, -0.0009310990571975708, -0.0008637905120849609, -0.0007964819669723511, -0.0007291734218597412, -0.0006618648767471313, -0.0005945563316345215, -0.0005272477865219116, -0.00045993924140930176, -0.0003926306962966919, -0.00032532215118408203, -0.00025801360607147217, -0.0001907050609588623, -0.00012339651584625244, -5.608797073364258e-05, 1.1220574378967285e-05, 7.852911949157715e-05, 0.000145837664604187, 0.00021314620971679688, 0.00028045475482940674, 0.0003477632999420166, 0.00041507184505462646, 0.00048238039016723633, 0.0005496889352798462, 0.0006169974803924561, 0.0006843060255050659, 0.0007516145706176758, 0.0008189231157302856, 0.0008862316608428955, 0.0009535402059555054, 0.0010208487510681152, 0.001088157296180725, 0.001155465841293335, 0.0012227743864059448, 0.0012900829315185547, 0.0013573914766311646, 0.0014247000217437744, 0.0014920085668563843, 0.0015593171119689941, 0.001626625657081604, 0.0016939342021942139, 0.0017612427473068237, 0.0018285512924194336, 0.0018958598375320435, 0.0019631683826446533, 0.002030476927757263, 0.002097785472869873, 0.002165094017982483, 0.0022324025630950928, 0.0022997111082077026, 0.0023670196533203125]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 5.0, 5.0, 8.0, 8.0, 12.0, 9.0, 15.0, 23.0, 30.0, 41.0, 51.0, 70.0, 91.0, 201.0, 578.0, 3636.0, 1034777.0, 7668.0, 626.0, 253.0, 136.0, 81.0, 53.0, 37.0, 25.0, 36.0, 13.0, 8.0, 8.0, 11.0, 10.0, 5.0, 3.0, 4.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.05267333984375, -0.051192283630371094, -0.04971122741699219, -0.04823017120361328, -0.046749114990234375, -0.04526805877685547, -0.04378700256347656, -0.042305946350097656, -0.04082489013671875, -0.039343833923339844, -0.03786277770996094, -0.03638172149658203, -0.034900665283203125, -0.03341960906982422, -0.03193855285644531, -0.030457496643066406, -0.0289764404296875, -0.027495384216308594, -0.026014328002929688, -0.02453327178955078, -0.023052215576171875, -0.02157115936279297, -0.020090103149414062, -0.018609046936035156, -0.01712799072265625, -0.015646934509277344, -0.014165878295898438, -0.012684822082519531, -0.011203765869140625, -0.009722709655761719, -0.008241653442382812, -0.006760597229003906, -0.005279541015625, -0.0037984848022460938, -0.0023174285888671875, -0.0008363723754882812, 0.000644683837890625, 0.0021257400512695312, 0.0036067962646484375, 0.005087852478027344, 0.00656890869140625, 0.008049964904785156, 0.009531021118164062, 0.011012077331542969, 0.012493133544921875, 0.013974189758300781, 0.015455245971679688, 0.016936302185058594, 0.0184173583984375, 0.019898414611816406, 0.021379470825195312, 0.02286052703857422, 0.024341583251953125, 0.02582263946533203, 0.027303695678710938, 0.028784751892089844, 0.03026580810546875, 0.031746864318847656, 0.03322792053222656, 0.03470897674560547, 0.036190032958984375, 0.03767108917236328, 0.03915214538574219, 0.040633201599121094, 0.0421142578125]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 9.0, 94.0, 419.0, 408.0, 77.0, 10.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002539523644372821, -0.002380147809162736, -0.0022207722067832947, -0.0020613963715732098, -0.0019020205363631248, -0.00174264470115304, -0.0015832689823582768, -0.0014238932635635138, -0.0012645174283534288, -0.001105141593143344, -0.0009457658743485808, -0.0007863900973461568, -0.0006270143203437328, -0.00046763854334130883, -0.00030826276633888483, -0.00014888704754412174, 1.0488787665963173e-05, 0.00016986456466838717, 0.0003292403416708112, 0.0004886161186732352, 0.0006479918956756592, 0.0008073676726780832, 0.0009667434496805072, 0.0011261191684752703, 0.0012854950036853552, 0.00144487083889544, 0.0016042465576902032, 0.0017636222764849663, 0.0019229981116950512, 0.002082373946905136, 0.002241749782115221, 0.0024011253844946623, 0.002560501452535391, 0.0027198772877454758, 0.0028792531229555607, 0.003038628725335002, 0.003198004560545087, 0.0033573803957551718, 0.003516755998134613, 0.003676131833344698, 0.003835507668554783, 0.003994883503764868, 0.004154259338974953, 0.004313635174185038, 0.0044730110093951225, 0.00463238637894392, 0.004791762214154005, 0.00495113804936409, 0.005110513884574175, 0.00526988971978426, 0.005429265554994345, 0.00558864139020443, 0.005748016759753227, 0.005907392594963312, 0.006066768430173397, 0.006226144265383482, 0.006385520100593567, 0.006544895935803652, 0.006704271771013737, 0.006863647606223822, 0.0070230234414339066, 0.007182398810982704, 0.007341774646192789, 0.007501150481402874, 0.007660526316612959]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 5.0, 3.0, 1.0, 7.0, 5.0, 6.0, 11.0, 13.0, 16.0, 15.0, 16.0, 25.0, 20.0, 22.0, 36.0, 25.0, 25.0, 39.0, 29.0, 26.0, 33.0, 30.0, 37.0, 33.0, 44.0, 46.0, 32.0, 36.0, 34.0, 38.0, 29.0, 26.0, 18.0, 27.0, 23.0, 26.0, 26.0, 18.0, 13.0, 19.0, 17.0, 9.0, 10.0, 6.0, 6.0, 5.0, 6.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0009249448776245117, -0.0008970508351922035, -0.0008691567927598953, -0.0008412627503275871, -0.0008133687078952789, -0.0007854746654629707, -0.0007575806230306625, -0.0007296865805983543, -0.0007017925381660461, -0.0006738984957337379, -0.0006460044533014297, -0.0006181104108691216, -0.0005902163684368134, -0.0005623223260045052, -0.000534428283572197, -0.0005065342411398888, -0.00047864019870758057, -0.00045074615627527237, -0.00042285211384296417, -0.000394958071410656, -0.0003670640289783478, -0.0003391699865460396, -0.0003112759441137314, -0.0002833819016814232, -0.000255487859249115, -0.0002275938168168068, -0.0001996997743844986, -0.0001718057319521904, -0.0001439116895198822, -0.000116017647087574, -8.812360465526581e-05, -6.022956222295761e-05, -3.2335519790649414e-05, -4.441477358341217e-06, 2.345256507396698e-05, 5.134660750627518e-05, 7.924064993858337e-05, 0.00010713469237089157, 0.00013502873480319977, 0.00016292277723550797, 0.00019081681966781616, 0.00021871086210012436, 0.00024660490453243256, 0.00027449894696474075, 0.00030239298939704895, 0.00033028703182935715, 0.00035818107426166534, 0.00038607511669397354, 0.00041396915912628174, 0.00044186320155858994, 0.00046975724399089813, 0.0004976512864232063, 0.0005255453288555145, 0.0005534393712878227, 0.0005813334137201309, 0.0006092274561524391, 0.0006371214985847473, 0.0006650155410170555, 0.0006929095834493637, 0.0007208036258816719, 0.0007486976683139801, 0.0007765917107462883, 0.0008044857531785965, 0.0008323797956109047, 0.0008602738380432129]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 9.0, 13.0, 10.0, 11.0, 19.0, 12.0, 18.0, 16.0, 20.0, 18.0, 21.0, 14.0, 39.0, 41.0, 32.0, 40.0, 40.0, 21.0, 29.0, 44.0, 41.0, 34.0, 33.0, 38.0, 34.0, 27.0, 29.0, 30.0, 32.0, 28.0, 23.0, 23.0, 21.0, 21.0, 20.0, 24.0, 6.0, 8.0, 15.0, 7.0, 8.0, 1.0, 6.0, 8.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 3.0, 4.0, 0.0, 1.0], "bins": [-6.0703125, -5.87359619140625, -5.6768798828125, -5.48016357421875, -5.283447265625, -5.08673095703125, -4.8900146484375, -4.69329833984375, -4.49658203125, -4.29986572265625, -4.1031494140625, -3.90643310546875, -3.709716796875, -3.51300048828125, -3.3162841796875, -3.11956787109375, -2.9228515625, -2.72613525390625, -2.5294189453125, -2.33270263671875, -2.135986328125, -1.93927001953125, -1.7425537109375, -1.54583740234375, -1.34912109375, -1.15240478515625, -0.9556884765625, -0.75897216796875, -0.562255859375, -0.36553955078125, -0.1688232421875, 0.02789306640625, 0.224609375, 0.42132568359375, 0.6180419921875, 0.81475830078125, 1.011474609375, 1.20819091796875, 1.4049072265625, 1.60162353515625, 1.79833984375, 1.99505615234375, 2.1917724609375, 2.38848876953125, 2.585205078125, 2.78192138671875, 2.9786376953125, 3.17535400390625, 3.3720703125, 3.56878662109375, 3.7655029296875, 3.96221923828125, 4.158935546875, 4.35565185546875, 4.5523681640625, 4.74908447265625, 4.94580078125, 5.14251708984375, 5.3392333984375, 5.53594970703125, 5.732666015625, 5.92938232421875, 6.1260986328125, 6.32281494140625, 6.51953125]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 8.0, 3.0, 5.0, 5.0, 23.0, 18.0, 27.0, 48.0, 79.0, 91.0, 148.0, 187.0, 300.0, 422.0, 739.0, 1142.0, 2050.0, 3930.0, 7369.0, 15137.0, 31468.0, 68924.0, 164716.0, 380561.0, 211066.0, 84144.0, 38463.0, 17927.0, 8831.0, 4436.0, 2449.0, 1406.0, 859.0, 499.0, 334.0, 223.0, 152.0, 105.0, 92.0, 48.0, 30.0, 24.0, 19.0, 16.0, 8.0, 9.0, 8.0, 7.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.39453125, -4.25103759765625, -4.1075439453125, -3.96405029296875, -3.820556640625, -3.67706298828125, -3.5335693359375, -3.39007568359375, -3.24658203125, -3.10308837890625, -2.9595947265625, -2.81610107421875, -2.672607421875, -2.52911376953125, -2.3856201171875, -2.24212646484375, -2.0986328125, -1.95513916015625, -1.8116455078125, -1.66815185546875, -1.524658203125, -1.38116455078125, -1.2376708984375, -1.09417724609375, -0.95068359375, -0.80718994140625, -0.6636962890625, -0.52020263671875, -0.376708984375, -0.23321533203125, -0.0897216796875, 0.05377197265625, 0.197265625, 0.34075927734375, 0.4842529296875, 0.62774658203125, 0.771240234375, 0.91473388671875, 1.0582275390625, 1.20172119140625, 1.34521484375, 1.48870849609375, 1.6322021484375, 1.77569580078125, 1.919189453125, 2.06268310546875, 2.2061767578125, 2.34967041015625, 2.4931640625, 2.63665771484375, 2.7801513671875, 2.92364501953125, 3.067138671875, 3.21063232421875, 3.3541259765625, 3.49761962890625, 3.64111328125, 3.78460693359375, 3.9281005859375, 4.07159423828125, 4.215087890625, 4.35858154296875, 4.5020751953125, 4.64556884765625, 4.7890625]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 7.0, 6.0, 3.0, 7.0, 14.0, 16.0, 17.0, 23.0, 27.0, 26.0, 35.0, 39.0, 32.0, 59.0, 57.0, 80.0, 151.0, 1691.0, 277.0, 82.0, 59.0, 55.0, 44.0, 38.0, 28.0, 22.0, 25.0, 24.0, 29.0, 16.0, 15.0, 11.0, 7.0, 9.0, 9.0, 0.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-34.4375, -33.50048828125, -32.5634765625, -31.62646484375, -30.689453125, -29.75244140625, -28.8154296875, -27.87841796875, -26.94140625, -26.00439453125, -25.0673828125, -24.13037109375, -23.193359375, -22.25634765625, -21.3193359375, -20.38232421875, -19.4453125, -18.50830078125, -17.5712890625, -16.63427734375, -15.697265625, -14.76025390625, -13.8232421875, -12.88623046875, -11.94921875, -11.01220703125, -10.0751953125, -9.13818359375, -8.201171875, -7.26416015625, -6.3271484375, -5.39013671875, -4.453125, -3.51611328125, -2.5791015625, -1.64208984375, -0.705078125, 0.23193359375, 1.1689453125, 2.10595703125, 3.04296875, 3.97998046875, 4.9169921875, 5.85400390625, 6.791015625, 7.72802734375, 8.6650390625, 9.60205078125, 10.5390625, 11.47607421875, 12.4130859375, 13.35009765625, 14.287109375, 15.22412109375, 16.1611328125, 17.09814453125, 18.03515625, 18.97216796875, 19.9091796875, 20.84619140625, 21.783203125, 22.72021484375, 23.6572265625, 24.59423828125, 25.53125]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 12.0, 4.0, 13.0, 22.0, 19.0, 20.0, 38.0, 40.0, 55.0, 63.0, 105.0, 126.0, 175.0, 247.0, 450.0, 1498.0, 171382.0, 2966596.0, 3136.0, 596.0, 332.0, 233.0, 138.0, 97.0, 74.0, 50.0, 51.0, 31.0, 30.0, 16.0, 14.0, 8.0, 5.0, 12.0, 3.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.46875, -55.35205078125, -53.2353515625, -51.11865234375, -49.001953125, -46.88525390625, -44.7685546875, -42.65185546875, -40.53515625, -38.41845703125, -36.3017578125, -34.18505859375, -32.068359375, -29.95166015625, -27.8349609375, -25.71826171875, -23.6015625, -21.48486328125, -19.3681640625, -17.25146484375, -15.134765625, -13.01806640625, -10.9013671875, -8.78466796875, -6.66796875, -4.55126953125, -2.4345703125, -0.31787109375, 1.798828125, 3.91552734375, 6.0322265625, 8.14892578125, 10.265625, 12.38232421875, 14.4990234375, 16.61572265625, 18.732421875, 20.84912109375, 22.9658203125, 25.08251953125, 27.19921875, 29.31591796875, 31.4326171875, 33.54931640625, 35.666015625, 37.78271484375, 39.8994140625, 42.01611328125, 44.1328125, 46.24951171875, 48.3662109375, 50.48291015625, 52.599609375, 54.71630859375, 56.8330078125, 58.94970703125, 61.06640625, 63.18310546875, 65.2998046875, 67.41650390625, 69.533203125, 71.64990234375, 73.7666015625, 75.88330078125, 78.0]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 15.0, 166.0, 460.0, 319.0, 48.0, 3.0, 4.0, 2.0], "bins": [-185.8696746826172, -182.70724487304688, -179.5447998046875, -176.3823699951172, -173.21994018554688, -170.0574951171875, -166.8950653076172, -163.73263549804688, -160.5701904296875, -157.4077606201172, -154.2453155517578, -151.0828857421875, -147.9204559326172, -144.7580108642578, -141.5955810546875, -138.43313598632812, -135.2707061767578, -132.1082763671875, -128.94583129882812, -125.78340148925781, -122.62096405029297, -119.45852661132812, -116.29609680175781, -113.13365936279297, -109.97122955322266, -106.80879211425781, -103.6463623046875, -100.48392486572266, -97.32148742675781, -94.15904998779297, -90.99662017822266, -87.83418273925781, -84.67174530029297, -81.50930786132812, -78.34687805175781, -75.18444061279297, -72.02200317382812, -68.85956573486328, -65.69713592529297, -62.534698486328125, -59.37226104736328, -56.2098274230957, -53.04738998413086, -49.88495635986328, -46.72251892089844, -43.56008529663086, -40.39765167236328, -37.23521423339844, -34.07278060913086, -30.91034507751465, -27.747909545898438, -24.58547592163086, -21.423038482666016, -18.260604858398438, -15.098169326782227, -11.935733795166016, -8.773298263549805, -5.610862731933594, -2.448427677154541, 0.7140073776245117, 3.8764429092407227, 7.038878440856934, 10.201313018798828, 13.363748550415039, 16.52618408203125]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 7.0, 3.0, 3.0, 3.0, 6.0, 4.0, 5.0, 17.0, 8.0, 11.0, 19.0, 17.0, 24.0, 17.0, 33.0, 31.0, 26.0, 35.0, 37.0, 38.0, 41.0, 37.0, 34.0, 36.0, 34.0, 49.0, 41.0, 35.0, 47.0, 39.0, 33.0, 23.0, 30.0, 27.0, 34.0, 17.0, 18.0, 16.0, 9.0, 12.0, 17.0, 2.0, 6.0, 6.0, 6.0, 5.0, 3.0, 2.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-54.16265869140625, -52.25460433959961, -50.34654998779297, -48.43849563598633, -46.53044128417969, -44.62238693237305, -42.714332580566406, -40.806278228759766, -38.898223876953125, -36.990169525146484, -35.082115173339844, -33.1740608215332, -31.266006469726562, -29.357952117919922, -27.44989776611328, -25.54184341430664, -23.6337890625, -21.72573471069336, -19.81768035888672, -17.909626007080078, -16.001571655273438, -14.093517303466797, -12.185462951660156, -10.277408599853516, -8.369354248046875, -6.461299896240234, -4.553245544433594, -2.645191192626953, -0.7371368408203125, 1.1709175109863281, 3.0789718627929688, 4.987026214599609, 6.89508056640625, 8.80313491821289, 10.711189270019531, 12.619243621826172, 14.527297973632812, 16.435352325439453, 18.343406677246094, 20.251461029052734, 22.159515380859375, 24.067569732666016, 25.975624084472656, 27.883678436279297, 29.791732788085938, 31.699787139892578, 33.60784149169922, 35.51589584350586, 37.4239501953125, 39.33200454711914, 41.24005889892578, 43.14811325073242, 45.05616760253906, 46.9642219543457, 48.872276306152344, 50.780330657958984, 52.688385009765625, 54.596439361572266, 56.504493713378906, 58.41254806518555, 60.32060241699219, 62.22865676879883, 64.13671112060547, 66.04476928710938, 67.95281982421875]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 9.0, 7.0, 8.0, 9.0, 11.0, 18.0, 12.0, 13.0, 15.0, 18.0, 19.0, 22.0, 14.0, 31.0, 30.0, 35.0, 53.0, 34.0, 33.0, 23.0, 37.0, 44.0, 33.0, 36.0, 31.0, 31.0, 35.0, 41.0, 33.0, 25.0, 26.0, 25.0, 16.0, 25.0, 19.0, 26.0, 14.0, 18.0, 12.0, 12.0, 6.0, 11.0, 6.0, 4.0, 3.0, 6.0, 4.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 3.0, 3.0], "bins": [-6.3984375, -6.19512939453125, -5.9918212890625, -5.78851318359375, -5.585205078125, -5.38189697265625, -5.1785888671875, -4.97528076171875, -4.77197265625, -4.56866455078125, -4.3653564453125, -4.16204833984375, -3.958740234375, -3.75543212890625, -3.5521240234375, -3.34881591796875, -3.1455078125, -2.94219970703125, -2.7388916015625, -2.53558349609375, -2.332275390625, -2.12896728515625, -1.9256591796875, -1.72235107421875, -1.51904296875, -1.31573486328125, -1.1124267578125, -0.90911865234375, -0.705810546875, -0.50250244140625, -0.2991943359375, -0.09588623046875, 0.107421875, 0.31072998046875, 0.5140380859375, 0.71734619140625, 0.920654296875, 1.12396240234375, 1.3272705078125, 1.53057861328125, 1.73388671875, 1.93719482421875, 2.1405029296875, 2.34381103515625, 2.547119140625, 2.75042724609375, 2.9537353515625, 3.15704345703125, 3.3603515625, 3.56365966796875, 3.7669677734375, 3.97027587890625, 4.173583984375, 4.37689208984375, 4.5802001953125, 4.78350830078125, 4.98681640625, 5.19012451171875, 5.3934326171875, 5.59674072265625, 5.800048828125, 6.00335693359375, 6.2066650390625, 6.40997314453125, 6.61328125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 7.0, 6.0, 7.0, 13.0, 10.0, 17.0, 9.0, 17.0, 20.0, 18.0, 15.0, 19.0, 24.0, 22.0, 44.0, 36.0, 73.0, 162.0, 548.0, 2917.0, 31630.0, 1675492.0, 2428421.0, 49747.0, 3740.0, 677.0, 201.0, 76.0, 47.0, 39.0, 25.0, 24.0, 24.0, 13.0, 16.0, 25.0, 20.0, 15.0, 14.0, 9.0, 6.0, 3.0, 9.0, 5.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0], "bins": [-26.140625, -25.29931640625, -24.4580078125, -23.61669921875, -22.775390625, -21.93408203125, -21.0927734375, -20.25146484375, -19.41015625, -18.56884765625, -17.7275390625, -16.88623046875, -16.044921875, -15.20361328125, -14.3623046875, -13.52099609375, -12.6796875, -11.83837890625, -10.9970703125, -10.15576171875, -9.314453125, -8.47314453125, -7.6318359375, -6.79052734375, -5.94921875, -5.10791015625, -4.2666015625, -3.42529296875, -2.583984375, -1.74267578125, -0.9013671875, -0.06005859375, 0.78125, 1.62255859375, 2.4638671875, 3.30517578125, 4.146484375, 4.98779296875, 5.8291015625, 6.67041015625, 7.51171875, 8.35302734375, 9.1943359375, 10.03564453125, 10.876953125, 11.71826171875, 12.5595703125, 13.40087890625, 14.2421875, 15.08349609375, 15.9248046875, 16.76611328125, 17.607421875, 18.44873046875, 19.2900390625, 20.13134765625, 20.97265625, 21.81396484375, 22.6552734375, 23.49658203125, 24.337890625, 25.17919921875, 26.0205078125, 26.86181640625, 27.703125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 7.0, 8.0, 11.0, 14.0, 17.0, 34.0, 25.0, 25.0, 49.0, 67.0, 60.0, 85.0, 120.0, 148.0, 194.0, 244.0, 338.0, 379.0, 388.0, 384.0, 315.0, 269.0, 209.0, 162.0, 128.0, 86.0, 81.0, 57.0, 40.0, 27.0, 25.0, 17.0, 14.0, 12.0, 11.0, 4.0, 10.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 3.0], "bins": [-15.65625, -15.2490234375, -14.841796875, -14.4345703125, -14.02734375, -13.6201171875, -13.212890625, -12.8056640625, -12.3984375, -11.9912109375, -11.583984375, -11.1767578125, -10.76953125, -10.3623046875, -9.955078125, -9.5478515625, -9.140625, -8.7333984375, -8.326171875, -7.9189453125, -7.51171875, -7.1044921875, -6.697265625, -6.2900390625, -5.8828125, -5.4755859375, -5.068359375, -4.6611328125, -4.25390625, -3.8466796875, -3.439453125, -3.0322265625, -2.625, -2.2177734375, -1.810546875, -1.4033203125, -0.99609375, -0.5888671875, -0.181640625, 0.2255859375, 0.6328125, 1.0400390625, 1.447265625, 1.8544921875, 2.26171875, 2.6689453125, 3.076171875, 3.4833984375, 3.890625, 4.2978515625, 4.705078125, 5.1123046875, 5.51953125, 5.9267578125, 6.333984375, 6.7412109375, 7.1484375, 7.5556640625, 7.962890625, 8.3701171875, 8.77734375, 9.1845703125, 9.591796875, 9.9990234375, 10.40625]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 5.0, 7.0, 6.0, 8.0, 16.0, 16.0, 29.0, 33.0, 35.0, 49.0, 97.0, 99.0, 169.0, 256.0, 461.0, 1560.0, 175870.0, 4002877.0, 10867.0, 777.0, 347.0, 202.0, 141.0, 82.0, 69.0, 54.0, 25.0, 30.0, 19.0, 19.0, 13.0, 11.0, 8.0, 7.0, 5.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.25, -63.8212890625, -61.392578125, -58.9638671875, -56.53515625, -54.1064453125, -51.677734375, -49.2490234375, -46.8203125, -44.3916015625, -41.962890625, -39.5341796875, -37.10546875, -34.6767578125, -32.248046875, -29.8193359375, -27.390625, -24.9619140625, -22.533203125, -20.1044921875, -17.67578125, -15.2470703125, -12.818359375, -10.3896484375, -7.9609375, -5.5322265625, -3.103515625, -0.6748046875, 1.75390625, 4.1826171875, 6.611328125, 9.0400390625, 11.46875, 13.8974609375, 16.326171875, 18.7548828125, 21.18359375, 23.6123046875, 26.041015625, 28.4697265625, 30.8984375, 33.3271484375, 35.755859375, 38.1845703125, 40.61328125, 43.0419921875, 45.470703125, 47.8994140625, 50.328125, 52.7568359375, 55.185546875, 57.6142578125, 60.04296875, 62.4716796875, 64.900390625, 67.3291015625, 69.7578125, 72.1865234375, 74.615234375, 77.0439453125, 79.47265625, 81.9013671875, 84.330078125, 86.7587890625, 89.1875]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 10.0, 96.0, 292.0, 409.0, 176.0, 29.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-247.19850158691406, -240.38058471679688, -233.56268310546875, -226.74476623535156, -219.92684936523438, -213.1089324951172, -206.291015625, -199.47311401367188, -192.6551971435547, -185.8372802734375, -179.01937866210938, -172.2014617919922, -165.383544921875, -158.5656280517578, -151.74771118164062, -144.9298095703125, -138.1118927001953, -131.29397583007812, -124.47606658935547, -117.65815734863281, -110.84024047851562, -104.02232360839844, -97.20441436767578, -90.38650512695312, -83.56858825683594, -76.75067138671875, -69.9327621459961, -63.11484909057617, -56.29693603515625, -49.47902297973633, -42.661109924316406, -35.843196868896484, -29.025299072265625, -22.207386016845703, -15.389472961425781, -8.57155990600586, -1.7536468505859375, 5.064266204833984, 11.882179260253906, 18.700092315673828, 25.51800537109375, 32.33591842651367, 39.153831481933594, 45.971744537353516, 52.78965759277344, 59.60757064819336, 66.42548370361328, 73.24339294433594, 80.06130981445312, 86.87922668457031, 93.69713592529297, 100.51504516601562, 107.33296203613281, 114.15087890625, 120.96878814697266, 127.78669738769531, 134.6046142578125, 141.4225311279297, 148.24044799804688, 155.058349609375, 161.8762664794922, 168.69418334960938, 175.5120849609375, 182.3300018310547, 189.14791870117188]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 5.0, 8.0, 6.0, 8.0, 14.0, 20.0, 17.0, 19.0, 19.0, 25.0, 32.0, 30.0, 36.0, 35.0, 39.0, 44.0, 49.0, 48.0, 40.0, 34.0, 31.0, 49.0, 39.0, 39.0, 35.0, 21.0, 36.0, 29.0, 28.0, 24.0, 27.0, 20.0, 18.0, 11.0, 19.0, 9.0, 6.0, 9.0, 4.0, 3.0, 6.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-51.380706787109375, -49.83909606933594, -48.297489166259766, -46.75587844848633, -45.21426773071289, -43.67266082763672, -42.13105010986328, -40.589439392089844, -39.047828674316406, -37.50621795654297, -35.9646110534668, -34.42300033569336, -32.88138961791992, -31.339780807495117, -29.798171997070312, -28.256561279296875, -26.714954376220703, -25.1733455657959, -23.63173484802246, -22.090126037597656, -20.54851531982422, -19.006906509399414, -17.46529769897461, -15.923687934875488, -14.382078170776367, -12.840468406677246, -11.298858642578125, -9.75724983215332, -8.2156400680542, -6.674030303955078, -5.132421493530273, -3.5908117294311523, -2.0492019653320312, -0.5075924396514893, 1.0340170860290527, 2.5756263732910156, 4.117236137390137, 5.658845901489258, 7.2004547119140625, 8.742064476013184, 10.283674240112305, 11.825284004211426, 13.366893768310547, 14.908502578735352, 16.450111389160156, 17.991722106933594, 19.5333309173584, 21.074939727783203, 22.61655044555664, 24.158159255981445, 25.699769973754883, 27.241378784179688, 28.782989501953125, 30.32459831237793, 31.866207122802734, 33.40781784057617, 34.949424743652344, 36.49103546142578, 38.03264236450195, 39.57425308227539, 41.11586380004883, 42.657470703125, 44.19908142089844, 45.740692138671875, 47.28230285644531]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 5.0, 9.0, 5.0, 10.0, 14.0, 16.0, 16.0, 17.0, 23.0, 13.0, 21.0, 25.0, 23.0, 42.0, 29.0, 38.0, 38.0, 43.0, 37.0, 36.0, 39.0, 44.0, 30.0, 47.0, 40.0, 25.0, 41.0, 34.0, 30.0, 24.0, 26.0, 20.0, 22.0, 22.0, 22.0, 12.0, 11.0, 7.0, 16.0, 7.0, 5.0, 4.0, 1.0, 2.0, 5.0, 5.0, 1.0, 6.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.52734375, -6.30364990234375, -6.0799560546875, -5.85626220703125, -5.632568359375, -5.40887451171875, -5.1851806640625, -4.96148681640625, -4.73779296875, -4.51409912109375, -4.2904052734375, -4.06671142578125, -3.843017578125, -3.61932373046875, -3.3956298828125, -3.17193603515625, -2.9482421875, -2.72454833984375, -2.5008544921875, -2.27716064453125, -2.053466796875, -1.82977294921875, -1.6060791015625, -1.38238525390625, -1.15869140625, -0.93499755859375, -0.7113037109375, -0.48760986328125, -0.263916015625, -0.04022216796875, 0.1834716796875, 0.40716552734375, 0.630859375, 0.85455322265625, 1.0782470703125, 1.30194091796875, 1.525634765625, 1.74932861328125, 1.9730224609375, 2.19671630859375, 2.42041015625, 2.64410400390625, 2.8677978515625, 3.09149169921875, 3.315185546875, 3.53887939453125, 3.7625732421875, 3.98626708984375, 4.2099609375, 4.43365478515625, 4.6573486328125, 4.88104248046875, 5.104736328125, 5.32843017578125, 5.5521240234375, 5.77581787109375, 5.99951171875, 6.22320556640625, 6.4468994140625, 6.67059326171875, 6.894287109375, 7.11798095703125, 7.3416748046875, 7.56536865234375, 7.7890625]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 5.0, 10.0, 20.0, 23.0, 38.0, 62.0, 82.0, 114.0, 199.0, 249.0, 375.0, 547.0, 771.0, 1169.0, 1695.0, 2435.0, 3682.0, 5495.0, 8040.0, 12034.0, 18359.0, 26891.0, 40721.0, 61028.0, 94501.0, 148852.0, 200418.0, 146404.0, 92568.0, 60323.0, 39958.0, 26946.0, 17963.0, 11907.0, 7997.0, 5404.0, 3589.0, 2480.0, 1681.0, 1089.0, 799.0, 508.0, 360.0, 247.0, 187.0, 117.0, 71.0, 51.0, 39.0, 18.0, 22.0, 5.0, 7.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.94140625, -0.9105224609375, -0.879638671875, -0.8487548828125, -0.81787109375, -0.7869873046875, -0.756103515625, -0.7252197265625, -0.6943359375, -0.6634521484375, -0.632568359375, -0.6016845703125, -0.57080078125, -0.5399169921875, -0.509033203125, -0.4781494140625, -0.447265625, -0.4163818359375, -0.385498046875, -0.3546142578125, -0.32373046875, -0.2928466796875, -0.261962890625, -0.2310791015625, -0.2001953125, -0.1693115234375, -0.138427734375, -0.1075439453125, -0.07666015625, -0.0457763671875, -0.014892578125, 0.0159912109375, 0.046875, 0.0777587890625, 0.108642578125, 0.1395263671875, 0.17041015625, 0.2012939453125, 0.232177734375, 0.2630615234375, 0.2939453125, 0.3248291015625, 0.355712890625, 0.3865966796875, 0.41748046875, 0.4483642578125, 0.479248046875, 0.5101318359375, 0.541015625, 0.5718994140625, 0.602783203125, 0.6336669921875, 0.66455078125, 0.6954345703125, 0.726318359375, 0.7572021484375, 0.7880859375, 0.8189697265625, 0.849853515625, 0.8807373046875, 0.91162109375, 0.9425048828125, 0.973388671875, 1.0042724609375, 1.03515625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 11.0, 10.0, 9.0, 10.0, 12.0, 11.0, 15.0, 17.0, 17.0, 23.0, 19.0, 18.0, 25.0, 38.0, 40.0, 40.0, 49.0, 47.0, 40.0, 1070.0, 42.0, 38.0, 38.0, 41.0, 32.0, 52.0, 38.0, 31.0, 21.0, 21.0, 28.0, 20.0, 17.0, 19.0, 17.0, 6.0, 7.0, 5.0, 8.0, 8.0, 7.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.078125, -4.9241943359375, -4.770263671875, -4.6163330078125, -4.46240234375, -4.3084716796875, -4.154541015625, -4.0006103515625, -3.8466796875, -3.6927490234375, -3.538818359375, -3.3848876953125, -3.23095703125, -3.0770263671875, -2.923095703125, -2.7691650390625, -2.615234375, -2.4613037109375, -2.307373046875, -2.1534423828125, -1.99951171875, -1.8455810546875, -1.691650390625, -1.5377197265625, -1.3837890625, -1.2298583984375, -1.075927734375, -0.9219970703125, -0.76806640625, -0.6141357421875, -0.460205078125, -0.3062744140625, -0.15234375, 0.0015869140625, 0.155517578125, 0.3094482421875, 0.46337890625, 0.6173095703125, 0.771240234375, 0.9251708984375, 1.0791015625, 1.2330322265625, 1.386962890625, 1.5408935546875, 1.69482421875, 1.8487548828125, 2.002685546875, 2.1566162109375, 2.310546875, 2.4644775390625, 2.618408203125, 2.7723388671875, 2.92626953125, 3.0802001953125, 3.234130859375, 3.3880615234375, 3.5419921875, 3.6959228515625, 3.849853515625, 4.0037841796875, 4.15771484375, 4.3116455078125, 4.465576171875, 4.6195068359375, 4.7734375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 7.0, 9.0, 9.0, 19.0, 22.0, 35.0, 59.0, 82.0, 142.0, 253.0, 379.0, 538.0, 954.0, 1358.0, 2200.0, 3480.0, 5607.0, 8729.0, 13539.0, 21325.0, 33152.0, 53236.0, 88243.0, 149082.0, 1271338.0, 174569.0, 102753.0, 61545.0, 37790.0, 24353.0, 15070.0, 9953.0, 6226.0, 4059.0, 2515.0, 1637.0, 1091.0, 650.0, 426.0, 239.0, 156.0, 113.0, 68.0, 55.0, 26.0, 25.0, 10.0, 7.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96630859375, -0.9347763061523438, -0.9032440185546875, -0.8717117309570312, -0.840179443359375, -0.8086471557617188, -0.7771148681640625, -0.7455825805664062, -0.71405029296875, -0.6825180053710938, -0.6509857177734375, -0.6194534301757812, -0.587921142578125, -0.5563888549804688, -0.5248565673828125, -0.49332427978515625, -0.4617919921875, -0.43025970458984375, -0.3987274169921875, -0.36719512939453125, -0.335662841796875, -0.30413055419921875, -0.2725982666015625, -0.24106597900390625, -0.20953369140625, -0.17800140380859375, -0.1464691162109375, -0.11493682861328125, -0.083404541015625, -0.05187225341796875, -0.0203399658203125, 0.01119232177734375, 0.042724609375, 0.07425689697265625, 0.1057891845703125, 0.13732147216796875, 0.168853759765625, 0.20038604736328125, 0.2319183349609375, 0.26345062255859375, 0.29498291015625, 0.32651519775390625, 0.3580474853515625, 0.38957977294921875, 0.421112060546875, 0.45264434814453125, 0.4841766357421875, 0.5157089233398438, 0.5472412109375, 0.5787734985351562, 0.6103057861328125, 0.6418380737304688, 0.673370361328125, 0.7049026489257812, 0.7364349365234375, 0.7679672241210938, 0.79949951171875, 0.8310317993164062, 0.8625640869140625, 0.8940963745117188, 0.925628662109375, 0.9571609497070312, 0.9886932373046875, 1.0202255249023438, 1.0517578125]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 4.0, 6.0, 9.0, 10.0, 7.0, 11.0, 19.0, 19.0, 32.0, 56.0, 53.0, 73.0, 77.0, 88.0, 116.0, 93.0, 60.0, 51.0, 50.0, 39.0, 28.0, 27.0, 22.0, 14.0, 15.0, 4.0, 6.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0025882720947265625, -0.002512216567993164, -0.0024361610412597656, -0.002360105514526367, -0.0022840499877929688, -0.0022079944610595703, -0.002131938934326172, -0.0020558834075927734, -0.001979827880859375, -0.0019037723541259766, -0.0018277168273925781, -0.0017516613006591797, -0.0016756057739257812, -0.0015995502471923828, -0.0015234947204589844, -0.001447439193725586, -0.0013713836669921875, -0.001295328140258789, -0.0012192726135253906, -0.0011432170867919922, -0.0010671615600585938, -0.0009911060333251953, -0.0009150505065917969, -0.0008389949798583984, -0.000762939453125, -0.0006868839263916016, -0.0006108283996582031, -0.0005347728729248047, -0.00045871734619140625, -0.0003826618194580078, -0.0003066062927246094, -0.00023055076599121094, -0.0001544952392578125, -7.843971252441406e-05, -2.384185791015625e-06, 7.367134094238281e-05, 0.00014972686767578125, 0.0002257823944091797, 0.0003018379211425781, 0.00037789344787597656, 0.000453948974609375, 0.0005300045013427734, 0.0006060600280761719, 0.0006821155548095703, 0.0007581710815429688, 0.0008342266082763672, 0.0009102821350097656, 0.000986337661743164, 0.0010623931884765625, 0.001138448715209961, 0.0012145042419433594, 0.0012905597686767578, 0.0013666152954101562, 0.0014426708221435547, 0.0015187263488769531, 0.0015947818756103516, 0.00167083740234375, 0.0017468929290771484, 0.0018229484558105469, 0.0018990039825439453, 0.0019750595092773438, 0.002051115036010742, 0.0021271705627441406, 0.002203226089477539, 0.0022792816162109375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 3.0, 5.0, 5.0, 6.0, 14.0, 16.0, 11.0, 33.0, 37.0, 42.0, 55.0, 104.0, 225.0, 611.0, 28148.0, 1017358.0, 1222.0, 285.0, 144.0, 74.0, 44.0, 29.0, 23.0, 14.0, 7.0, 6.0, 9.0, 7.0, 11.0, 0.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.054473876953125, -0.05267000198364258, -0.050866127014160156, -0.049062252044677734, -0.04725837707519531, -0.04545450210571289, -0.04365062713623047, -0.04184675216674805, -0.040042877197265625, -0.0382390022277832, -0.03643512725830078, -0.03463125228881836, -0.03282737731933594, -0.031023502349853516, -0.029219627380371094, -0.027415752410888672, -0.02561187744140625, -0.023808002471923828, -0.022004127502441406, -0.020200252532958984, -0.018396377563476562, -0.01659250259399414, -0.014788627624511719, -0.012984752655029297, -0.011180877685546875, -0.009377002716064453, -0.007573127746582031, -0.005769252777099609, -0.0039653778076171875, -0.0021615028381347656, -0.00035762786865234375, 0.0014462471008300781, 0.0032501220703125, 0.005053997039794922, 0.006857872009277344, 0.008661746978759766, 0.010465621948242188, 0.01226949691772461, 0.014073371887207031, 0.015877246856689453, 0.017681121826171875, 0.019484996795654297, 0.02128887176513672, 0.02309274673461914, 0.024896621704101562, 0.026700496673583984, 0.028504371643066406, 0.030308246612548828, 0.03211212158203125, 0.03391599655151367, 0.035719871520996094, 0.037523746490478516, 0.03932762145996094, 0.04113149642944336, 0.04293537139892578, 0.0447392463684082, 0.046543121337890625, 0.04834699630737305, 0.05015087127685547, 0.05195474624633789, 0.05375862121582031, 0.055562496185302734, 0.057366371154785156, 0.05917024612426758, 0.06097412109375]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 14.0, 161.0, 499.0, 291.0, 41.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0025693662464618683, -0.0024316562339663506, -0.002293946221470833, -0.0021562364418059587, -0.002018526429310441, -0.0018808164168149233, -0.0017431065207347274, -0.0016053966246545315, -0.0014676866121590137, -0.001329976599663496, -0.0011922667035833001, -0.0010545568075031042, -0.0009168467950075865, -0.0007791368407197297, -0.0006414268864318728, -0.000503716932144016, -0.0003660069778561592, -0.0002282970235683024, -9.058706928044558e-05, 4.712288500741124e-05, 0.00018483283929526806, 0.0003225427935831249, 0.0004602527478709817, 0.0005979627021588385, 0.0007356726564466953, 0.0008733826107345521, 0.001011092565022409, 0.0011488024611026049, 0.0012865124735981226, 0.0014242224860936403, 0.0015619323821738362, 0.0016996422782540321, 0.0018373527564108372, 0.001975062768906355, 0.0021127727814018726, 0.0022504825610667467, 0.0023881925735622644, 0.002525902586057782, 0.0026636123657226562, 0.002801322378218174, 0.0029390323907136917, 0.0030767424032092094, 0.003214452415704727, 0.0033521621953696012, 0.003489872207865119, 0.0036275822203606367, 0.003765292000025511, 0.0039030020125210285, 0.004040712025016546, 0.004178422037512064, 0.004316132050007582, 0.0044538420625030994, 0.00459155160933733, 0.004729261621832848, 0.004866971634328365, 0.005004681646823883, 0.005142391659319401, 0.0052801016718149185, 0.005417811684310436, 0.005555521696805954, 0.005693231709301472, 0.005830941256135702, 0.00596865126863122, 0.006106361281126738, 0.006244071293622255]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 3.0, 4.0, 7.0, 7.0, 11.0, 10.0, 15.0, 24.0, 16.0, 28.0, 19.0, 18.0, 23.0, 27.0, 32.0, 26.0, 39.0, 32.0, 41.0, 30.0, 36.0, 40.0, 46.0, 30.0, 47.0, 38.0, 39.0, 34.0, 25.0, 26.0, 18.0, 29.0, 27.0, 29.0, 19.0, 19.0, 19.0, 14.0, 12.0, 7.0, 13.0, 8.0, 5.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0008105039596557617, -0.000783972442150116, -0.0007574409246444702, -0.0007309094071388245, -0.0007043778896331787, -0.000677846372127533, -0.0006513148546218872, -0.0006247833371162415, -0.0005982518196105957, -0.00057172030210495, -0.0005451887845993042, -0.0005186572670936584, -0.0004921257495880127, -0.00046559423208236694, -0.0004390627145767212, -0.00041253119707107544, -0.0003859996795654297, -0.00035946816205978394, -0.0003329366445541382, -0.00030640512704849243, -0.0002798736095428467, -0.00025334209203720093, -0.00022681057453155518, -0.00020027905702590942, -0.00017374753952026367, -0.00014721602201461792, -0.00012068450450897217, -9.415298700332642e-05, -6.762146949768066e-05, -4.108995199203491e-05, -1.455843448638916e-05, 1.1973083019256592e-05, 3.8504600524902344e-05, 6.50361180305481e-05, 9.156763553619385e-05, 0.0001180991530418396, 0.00014463067054748535, 0.0001711621880531311, 0.00019769370555877686, 0.0002242252230644226, 0.00025075674057006836, 0.0002772882580757141, 0.00030381977558135986, 0.0003303512930870056, 0.00035688281059265137, 0.0003834143280982971, 0.00040994584560394287, 0.0004364773631095886, 0.0004630088806152344, 0.0004895403981208801, 0.0005160719156265259, 0.0005426034331321716, 0.0005691349506378174, 0.0005956664681434631, 0.0006221979856491089, 0.0006487295031547546, 0.0006752610206604004, 0.0007017925381660461, 0.0007283240556716919, 0.0007548555731773376, 0.0007813870906829834, 0.0008079186081886292, 0.0008344501256942749, 0.0008609816431999207, 0.0008875131607055664]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 5.0, 9.0, 5.0, 10.0, 14.0, 16.0, 16.0, 17.0, 23.0, 13.0, 21.0, 25.0, 23.0, 42.0, 29.0, 38.0, 38.0, 43.0, 37.0, 36.0, 39.0, 44.0, 30.0, 47.0, 40.0, 25.0, 41.0, 34.0, 30.0, 24.0, 26.0, 20.0, 22.0, 22.0, 22.0, 12.0, 11.0, 7.0, 16.0, 7.0, 5.0, 4.0, 1.0, 2.0, 5.0, 5.0, 1.0, 6.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.52734375, -6.30364990234375, -6.0799560546875, -5.85626220703125, -5.632568359375, -5.40887451171875, -5.1851806640625, -4.96148681640625, -4.73779296875, -4.51409912109375, -4.2904052734375, -4.06671142578125, -3.843017578125, -3.61932373046875, -3.3956298828125, -3.17193603515625, -2.9482421875, -2.72454833984375, -2.5008544921875, -2.27716064453125, -2.053466796875, -1.82977294921875, -1.6060791015625, -1.38238525390625, -1.15869140625, -0.93499755859375, -0.7113037109375, -0.48760986328125, -0.263916015625, -0.04022216796875, 0.1834716796875, 0.40716552734375, 0.630859375, 0.85455322265625, 1.0782470703125, 1.30194091796875, 1.525634765625, 1.74932861328125, 1.9730224609375, 2.19671630859375, 2.42041015625, 2.64410400390625, 2.8677978515625, 3.09149169921875, 3.315185546875, 3.53887939453125, 3.7625732421875, 3.98626708984375, 4.2099609375, 4.43365478515625, 4.6573486328125, 4.88104248046875, 5.104736328125, 5.32843017578125, 5.5521240234375, 5.77581787109375, 5.99951171875, 6.22320556640625, 6.4468994140625, 6.67059326171875, 6.894287109375, 7.11798095703125, 7.3416748046875, 7.56536865234375, 7.7890625]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 8.0, 7.0, 8.0, 29.0, 20.0, 38.0, 51.0, 78.0, 112.0, 149.0, 202.0, 328.0, 466.0, 885.0, 1562.0, 2837.0, 5641.0, 12122.0, 29697.0, 81469.0, 252799.0, 439947.0, 137187.0, 47649.0, 18381.0, 8036.0, 3850.0, 2084.0, 1100.0, 654.0, 386.0, 242.0, 144.0, 112.0, 76.0, 57.0, 51.0, 22.0, 21.0, 23.0, 11.0, 8.0, 8.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.59375, -4.4117431640625, -4.229736328125, -4.0477294921875, -3.86572265625, -3.6837158203125, -3.501708984375, -3.3197021484375, -3.1376953125, -2.9556884765625, -2.773681640625, -2.5916748046875, -2.40966796875, -2.2276611328125, -2.045654296875, -1.8636474609375, -1.681640625, -1.4996337890625, -1.317626953125, -1.1356201171875, -0.95361328125, -0.7716064453125, -0.589599609375, -0.4075927734375, -0.2255859375, -0.0435791015625, 0.138427734375, 0.3204345703125, 0.50244140625, 0.6844482421875, 0.866455078125, 1.0484619140625, 1.23046875, 1.4124755859375, 1.594482421875, 1.7764892578125, 1.95849609375, 2.1405029296875, 2.322509765625, 2.5045166015625, 2.6865234375, 2.8685302734375, 3.050537109375, 3.2325439453125, 3.41455078125, 3.5965576171875, 3.778564453125, 3.9605712890625, 4.142578125, 4.3245849609375, 4.506591796875, 4.6885986328125, 4.87060546875, 5.0526123046875, 5.234619140625, 5.4166259765625, 5.5986328125, 5.7806396484375, 5.962646484375, 6.1446533203125, 6.32666015625, 6.5086669921875, 6.690673828125, 6.8726806640625, 7.0546875]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 5.0, 2.0, 6.0, 8.0, 4.0, 9.0, 23.0, 11.0, 20.0, 32.0, 15.0, 30.0, 28.0, 39.0, 39.0, 42.0, 59.0, 59.0, 66.0, 121.0, 1463.0, 404.0, 129.0, 63.0, 50.0, 45.0, 40.0, 30.0, 35.0, 33.0, 20.0, 23.0, 26.0, 23.0, 11.0, 9.0, 6.0, 5.0, 8.0, 3.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.171875, -22.34375, -21.515625, -20.6875, -19.859375, -19.03125, -18.203125, -17.375, -16.546875, -15.71875, -14.890625, -14.0625, -13.234375, -12.40625, -11.578125, -10.75, -9.921875, -9.09375, -8.265625, -7.4375, -6.609375, -5.78125, -4.953125, -4.125, -3.296875, -2.46875, -1.640625, -0.8125, 0.015625, 0.84375, 1.671875, 2.5, 3.328125, 4.15625, 4.984375, 5.8125, 6.640625, 7.46875, 8.296875, 9.125, 9.953125, 10.78125, 11.609375, 12.4375, 13.265625, 14.09375, 14.921875, 15.75, 16.578125, 17.40625, 18.234375, 19.0625, 19.890625, 20.71875, 21.546875, 22.375, 23.203125, 24.03125, 24.859375, 25.6875, 26.515625, 27.34375, 28.171875, 29.0, 29.828125]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 10.0, 15.0, 23.0, 38.0, 50.0, 68.0, 108.0, 161.0, 310.0, 581.0, 3460.0, 3129814.0, 9328.0, 791.0, 376.0, 191.0, 129.0, 76.0, 66.0, 41.0, 26.0, 16.0, 9.0, 7.0, 8.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-118.625, -115.3837890625, -112.142578125, -108.9013671875, -105.66015625, -102.4189453125, -99.177734375, -95.9365234375, -92.6953125, -89.4541015625, -86.212890625, -82.9716796875, -79.73046875, -76.4892578125, -73.248046875, -70.0068359375, -66.765625, -63.5244140625, -60.283203125, -57.0419921875, -53.80078125, -50.5595703125, -47.318359375, -44.0771484375, -40.8359375, -37.5947265625, -34.353515625, -31.1123046875, -27.87109375, -24.6298828125, -21.388671875, -18.1474609375, -14.90625, -11.6650390625, -8.423828125, -5.1826171875, -1.94140625, 1.2998046875, 4.541015625, 7.7822265625, 11.0234375, 14.2646484375, 17.505859375, 20.7470703125, 23.98828125, 27.2294921875, 30.470703125, 33.7119140625, 36.953125, 40.1943359375, 43.435546875, 46.6767578125, 49.91796875, 53.1591796875, 56.400390625, 59.6416015625, 62.8828125, 66.1240234375, 69.365234375, 72.6064453125, 75.84765625, 79.0888671875, 82.330078125, 85.5712890625, 88.8125]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 8.0, 608.0, 400.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-446.26690673828125, -437.6774597167969, -429.0880126953125, -420.49859619140625, -411.9091491699219, -403.3197021484375, -394.7302551269531, -386.14080810546875, -377.5513916015625, -368.9619445800781, -360.37249755859375, -351.7830810546875, -343.1936340332031, -334.60418701171875, -326.0147399902344, -317.42529296875, -308.83587646484375, -300.2464294433594, -291.656982421875, -283.06756591796875, -274.4781188964844, -265.888671875, -257.2992248535156, -248.7097930908203, -240.12033081054688, -231.5308837890625, -222.9414520263672, -214.3520050048828, -205.7625732421875, -197.17312622070312, -188.58367919921875, -179.99424743652344, -171.40481567382812, -162.81536865234375, -154.22593688964844, -145.63648986816406, -137.04705810546875, -128.45761108398438, -119.86817169189453, -111.27873229980469, -102.68930053710938, -94.09986114501953, -85.51042175292969, -76.92097473144531, -68.33154296875, -59.74209976196289, -51.15265655517578, -42.56321716308594, -33.973777770996094, -25.38433837890625, -16.794897079467773, -8.205455780029297, 0.3839836120605469, 8.97342300415039, 17.5628662109375, 26.152305603027344, 34.74174499511719, 43.33118438720703, 51.920623779296875, 60.510066986083984, 69.09950256347656, 77.68894958496094, 86.27838897705078, 94.86782836914062, 103.45726776123047]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 5.0, 4.0, 6.0, 6.0, 7.0, 10.0, 16.0, 17.0, 13.0, 21.0, 29.0, 25.0, 35.0, 37.0, 29.0, 36.0, 43.0, 33.0, 30.0, 51.0, 53.0, 45.0, 47.0, 41.0, 45.0, 33.0, 30.0, 39.0, 26.0, 31.0, 20.0, 29.0, 23.0, 14.0, 14.0, 6.0, 17.0, 8.0, 12.0, 5.0, 6.0, 1.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.63656616210938, -71.29840087890625, -68.96024322509766, -66.62207794189453, -64.2839126586914, -61.94575500488281, -59.60758972167969, -57.26942825317383, -54.93126678466797, -52.59310531616211, -50.254940032958984, -47.916778564453125, -45.578617095947266, -43.240455627441406, -40.90229034423828, -38.56412887573242, -36.2259635925293, -33.88780212402344, -31.549638748168945, -29.211475372314453, -26.873313903808594, -24.5351505279541, -22.19698715209961, -19.85882568359375, -17.520662307739258, -15.182499885559082, -12.844337463378906, -10.506174087524414, -8.168011665344238, -5.8298492431640625, -3.4916858673095703, -1.153524398803711, 1.1846389770507812, 3.522801637649536, 5.860964298248291, 8.199127197265625, 10.5372896194458, 12.875452041625977, 15.213615417480469, 17.551776885986328, 19.88994026184082, 22.228103637695312, 24.566265106201172, 26.904428482055664, 29.242591857910156, 31.580753326416016, 33.918914794921875, 36.257080078125, 38.59524154663086, 40.93340301513672, 43.271568298339844, 45.6097297668457, 47.94789123535156, 50.28605651855469, 52.62421798706055, 54.962379455566406, 57.30054473876953, 59.63870620727539, 61.976871490478516, 64.31503295898438, 66.6531982421875, 68.9913558959961, 71.32952117919922, 73.66767883300781, 76.00584411621094]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 7.0, 6.0, 8.0, 9.0, 13.0, 17.0, 18.0, 17.0, 19.0, 16.0, 24.0, 33.0, 39.0, 24.0, 45.0, 38.0, 32.0, 30.0, 42.0, 43.0, 41.0, 26.0, 39.0, 32.0, 27.0, 44.0, 31.0, 27.0, 34.0, 25.0, 21.0, 27.0, 16.0, 30.0, 14.0, 15.0, 15.0, 14.0, 12.0, 4.0, 3.0, 1.0, 4.0, 3.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.91796875, -6.6854248046875, -6.452880859375, -6.2203369140625, -5.98779296875, -5.7552490234375, -5.522705078125, -5.2901611328125, -5.0576171875, -4.8250732421875, -4.592529296875, -4.3599853515625, -4.12744140625, -3.8948974609375, -3.662353515625, -3.4298095703125, -3.197265625, -2.9647216796875, -2.732177734375, -2.4996337890625, -2.26708984375, -2.0345458984375, -1.802001953125, -1.5694580078125, -1.3369140625, -1.1043701171875, -0.871826171875, -0.6392822265625, -0.40673828125, -0.1741943359375, 0.058349609375, 0.2908935546875, 0.5234375, 0.7559814453125, 0.988525390625, 1.2210693359375, 1.45361328125, 1.6861572265625, 1.918701171875, 2.1512451171875, 2.3837890625, 2.6163330078125, 2.848876953125, 3.0814208984375, 3.31396484375, 3.5465087890625, 3.779052734375, 4.0115966796875, 4.244140625, 4.4766845703125, 4.709228515625, 4.9417724609375, 5.17431640625, 5.4068603515625, 5.639404296875, 5.8719482421875, 6.1044921875, 6.3370361328125, 6.569580078125, 6.8021240234375, 7.03466796875, 7.2672119140625, 7.499755859375, 7.7322998046875, 7.96484375]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 9.0, 12.0, 5.0, 7.0, 8.0, 13.0, 15.0, 17.0, 25.0, 11.0, 27.0, 31.0, 38.0, 25.0, 33.0, 57.0, 91.0, 301.0, 1151.0, 6002.0, 100222.0, 2837205.0, 1218902.0, 25788.0, 2915.0, 740.0, 223.0, 87.0, 51.0, 33.0, 34.0, 20.0, 33.0, 16.0, 19.0, 23.0, 14.0, 21.0, 9.0, 12.0, 10.0, 6.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-25.734375, -24.899169921875, -24.06396484375, -23.228759765625, -22.3935546875, -21.558349609375, -20.72314453125, -19.887939453125, -19.052734375, -18.217529296875, -17.38232421875, -16.547119140625, -15.7119140625, -14.876708984375, -14.04150390625, -13.206298828125, -12.37109375, -11.535888671875, -10.70068359375, -9.865478515625, -9.0302734375, -8.195068359375, -7.35986328125, -6.524658203125, -5.689453125, -4.854248046875, -4.01904296875, -3.183837890625, -2.3486328125, -1.513427734375, -0.67822265625, 0.156982421875, 0.9921875, 1.827392578125, 2.66259765625, 3.497802734375, 4.3330078125, 5.168212890625, 6.00341796875, 6.838623046875, 7.673828125, 8.509033203125, 9.34423828125, 10.179443359375, 11.0146484375, 11.849853515625, 12.68505859375, 13.520263671875, 14.35546875, 15.190673828125, 16.02587890625, 16.861083984375, 17.6962890625, 18.531494140625, 19.36669921875, 20.201904296875, 21.037109375, 21.872314453125, 22.70751953125, 23.542724609375, 24.3779296875, 25.213134765625, 26.04833984375, 26.883544921875, 27.71875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 1.0, 6.0, 14.0, 11.0, 15.0, 9.0, 28.0, 34.0, 43.0, 46.0, 68.0, 94.0, 107.0, 182.0, 228.0, 336.0, 396.0, 493.0, 483.0, 384.0, 298.0, 217.0, 150.0, 105.0, 85.0, 83.0, 53.0, 38.0, 16.0, 18.0, 14.0, 5.0, 7.0, 5.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.53125, -12.026123046875, -11.52099609375, -11.015869140625, -10.5107421875, -10.005615234375, -9.50048828125, -8.995361328125, -8.490234375, -7.985107421875, -7.47998046875, -6.974853515625, -6.4697265625, -5.964599609375, -5.45947265625, -4.954345703125, -4.44921875, -3.944091796875, -3.43896484375, -2.933837890625, -2.4287109375, -1.923583984375, -1.41845703125, -0.913330078125, -0.408203125, 0.096923828125, 0.60205078125, 1.107177734375, 1.6123046875, 2.117431640625, 2.62255859375, 3.127685546875, 3.6328125, 4.137939453125, 4.64306640625, 5.148193359375, 5.6533203125, 6.158447265625, 6.66357421875, 7.168701171875, 7.673828125, 8.178955078125, 8.68408203125, 9.189208984375, 9.6943359375, 10.199462890625, 10.70458984375, 11.209716796875, 11.71484375, 12.219970703125, 12.72509765625, 13.230224609375, 13.7353515625, 14.240478515625, 14.74560546875, 15.250732421875, 15.755859375, 16.260986328125, 16.76611328125, 17.271240234375, 17.7763671875, 18.281494140625, 18.78662109375, 19.291748046875, 19.796875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 8.0, 3.0, 7.0, 7.0, 13.0, 18.0, 21.0, 31.0, 46.0, 64.0, 70.0, 105.0, 134.0, 175.0, 233.0, 334.0, 614.0, 2358.0, 482984.0, 3697316.0, 7537.0, 829.0, 377.0, 249.0, 166.0, 131.0, 89.0, 86.0, 57.0, 53.0, 37.0, 26.0, 25.0, 32.0, 9.0, 9.0, 15.0, 4.0, 8.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.875, -66.591796875, -64.30859375, -62.025390625, -59.7421875, -57.458984375, -55.17578125, -52.892578125, -50.609375, -48.326171875, -46.04296875, -43.759765625, -41.4765625, -39.193359375, -36.91015625, -34.626953125, -32.34375, -30.060546875, -27.77734375, -25.494140625, -23.2109375, -20.927734375, -18.64453125, -16.361328125, -14.078125, -11.794921875, -9.51171875, -7.228515625, -4.9453125, -2.662109375, -0.37890625, 1.904296875, 4.1875, 6.470703125, 8.75390625, 11.037109375, 13.3203125, 15.603515625, 17.88671875, 20.169921875, 22.453125, 24.736328125, 27.01953125, 29.302734375, 31.5859375, 33.869140625, 36.15234375, 38.435546875, 40.71875, 43.001953125, 45.28515625, 47.568359375, 49.8515625, 52.134765625, 54.41796875, 56.701171875, 58.984375, 61.267578125, 63.55078125, 65.833984375, 68.1171875, 70.400390625, 72.68359375, 74.966796875, 77.25]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 8.0, 10.0, 47.0, 84.0, 179.0, 228.0, 195.0, 146.0, 70.0, 24.0, 12.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.67079162597656, -94.01847076416016, -90.36614990234375, -86.71383666992188, -83.06151580810547, -79.40919494628906, -75.75687408447266, -72.10455322265625, -68.45223236083984, -64.79991149902344, -61.1475944519043, -57.49527359008789, -53.842952728271484, -50.190635681152344, -46.53831481933594, -42.88599395751953, -39.23367691040039, -35.581356048583984, -31.92903709411621, -28.276718139648438, -24.62439727783203, -20.972078323364258, -17.319759368896484, -13.667438507080078, -10.015119552612305, -6.362799644470215, -2.710480213165283, 0.9418392181396484, 4.594159126281738, 8.246479034423828, 11.898797988891602, 15.551118850708008, 19.20343780517578, 22.855756759643555, 26.50807762145996, 30.160396575927734, 33.81271743774414, 37.46503448486328, 41.11735534667969, 44.769676208496094, 48.4219970703125, 52.074317932128906, 55.72663497924805, 59.37895584106445, 63.03127670288086, 66.68359375, 70.3359146118164, 73.98823547363281, 77.64054870605469, 81.2928695678711, 84.9451904296875, 88.59750366210938, 92.24982452392578, 95.90214538574219, 99.5544662475586, 103.206787109375, 106.8591079711914, 110.51142883300781, 114.16374969482422, 117.81607055664062, 121.4683837890625, 125.1207046508789, 128.7730255126953, 132.42535400390625, 136.07766723632812]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 6.0, 5.0, 2.0, 7.0, 8.0, 6.0, 9.0, 8.0, 14.0, 14.0, 19.0, 25.0, 18.0, 22.0, 19.0, 27.0, 21.0, 30.0, 25.0, 32.0, 21.0, 41.0, 40.0, 38.0, 46.0, 34.0, 39.0, 35.0, 37.0, 30.0, 28.0, 31.0, 29.0, 25.0, 27.0, 26.0, 23.0, 16.0, 27.0, 15.0, 10.0, 11.0, 11.0, 14.0, 6.0, 5.0, 6.0, 5.0, 3.0, 4.0, 4.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-44.66520309448242, -43.26557159423828, -41.865936279296875, -40.466304779052734, -39.066673278808594, -37.66703796386719, -36.26740646362305, -34.867774963378906, -33.4681396484375, -32.06850814819336, -30.668874740600586, -29.269241333007812, -27.869609832763672, -26.4699764251709, -25.070343017578125, -23.670711517333984, -22.271080017089844, -20.87144660949707, -19.47181510925293, -18.072181701660156, -16.672550201416016, -15.272916793823242, -13.873283386230469, -12.473650932312012, -11.074018478393555, -9.674386024475098, -8.27475357055664, -6.875120162963867, -5.47548770904541, -4.075855255126953, -2.6762218475341797, -1.2765893936157227, 0.12303924560546875, 1.5226719379425049, 2.922304630279541, 4.321937561035156, 5.721570014953613, 7.12120246887207, 8.520835876464844, 9.9204683303833, 11.320100784301758, 12.719733238220215, 14.119365692138672, 15.518999099731445, 16.91863250732422, 18.31826400756836, 19.717897415161133, 21.117530822753906, 22.517162322998047, 23.91679573059082, 25.31642723083496, 26.716060638427734, 28.115692138671875, 29.51532554626465, 30.914958953857422, 32.31459045410156, 33.71422576904297, 35.11385726928711, 36.513492584228516, 37.913124084472656, 39.3127555847168, 40.71238708496094, 42.112022399902344, 43.511653900146484, 44.911285400390625]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 6.0, 6.0, 5.0, 8.0, 9.0, 11.0, 12.0, 17.0, 12.0, 13.0, 14.0, 30.0, 21.0, 34.0, 40.0, 17.0, 37.0, 39.0, 43.0, 36.0, 42.0, 37.0, 35.0, 44.0, 33.0, 31.0, 30.0, 29.0, 31.0, 37.0, 29.0, 22.0, 22.0, 26.0, 21.0, 16.0, 17.0, 19.0, 17.0, 15.0, 8.0, 8.0, 7.0, 7.0, 1.0, 4.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.73046875, -6.5057373046875, -6.281005859375, -6.0562744140625, -5.83154296875, -5.6068115234375, -5.382080078125, -5.1573486328125, -4.9326171875, -4.7078857421875, -4.483154296875, -4.2584228515625, -4.03369140625, -3.8089599609375, -3.584228515625, -3.3594970703125, -3.134765625, -2.9100341796875, -2.685302734375, -2.4605712890625, -2.23583984375, -2.0111083984375, -1.786376953125, -1.5616455078125, -1.3369140625, -1.1121826171875, -0.887451171875, -0.6627197265625, -0.43798828125, -0.2132568359375, 0.011474609375, 0.2362060546875, 0.4609375, 0.6856689453125, 0.910400390625, 1.1351318359375, 1.35986328125, 1.5845947265625, 1.809326171875, 2.0340576171875, 2.2587890625, 2.4835205078125, 2.708251953125, 2.9329833984375, 3.15771484375, 3.3824462890625, 3.607177734375, 3.8319091796875, 4.056640625, 4.2813720703125, 4.506103515625, 4.7308349609375, 4.95556640625, 5.1802978515625, 5.405029296875, 5.6297607421875, 5.8544921875, 6.0792236328125, 6.303955078125, 6.5286865234375, 6.75341796875, 6.9781494140625, 7.202880859375, 7.4276123046875, 7.65234375]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 9.0, 6.0, 13.0, 13.0, 31.0, 63.0, 80.0, 135.0, 196.0, 282.0, 530.0, 719.0, 1143.0, 1699.0, 2689.0, 3944.0, 5913.0, 8764.0, 13254.0, 20579.0, 31210.0, 47709.0, 72824.0, 111570.0, 180168.0, 194906.0, 121791.0, 78296.0, 51532.0, 33485.0, 21991.0, 14623.0, 9597.0, 6306.0, 4238.0, 2816.0, 1886.0, 1227.0, 822.0, 505.0, 352.0, 235.0, 160.0, 84.0, 56.0, 49.0, 24.0, 14.0, 12.0, 5.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0361328125, -1.0028076171875, -0.969482421875, -0.9361572265625, -0.90283203125, -0.8695068359375, -0.836181640625, -0.8028564453125, -0.76953125, -0.7362060546875, -0.702880859375, -0.6695556640625, -0.63623046875, -0.6029052734375, -0.569580078125, -0.5362548828125, -0.5029296875, -0.4696044921875, -0.436279296875, -0.4029541015625, -0.36962890625, -0.3363037109375, -0.302978515625, -0.2696533203125, -0.236328125, -0.2030029296875, -0.169677734375, -0.1363525390625, -0.10302734375, -0.0697021484375, -0.036376953125, -0.0030517578125, 0.0302734375, 0.0635986328125, 0.096923828125, 0.1302490234375, 0.16357421875, 0.1968994140625, 0.230224609375, 0.2635498046875, 0.296875, 0.3302001953125, 0.363525390625, 0.3968505859375, 0.43017578125, 0.4635009765625, 0.496826171875, 0.5301513671875, 0.5634765625, 0.5968017578125, 0.630126953125, 0.6634521484375, 0.69677734375, 0.7301025390625, 0.763427734375, 0.7967529296875, 0.830078125, 0.8634033203125, 0.896728515625, 0.9300537109375, 0.96337890625, 0.9967041015625, 1.030029296875, 1.0633544921875, 1.0966796875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 5.0, 1.0, 7.0, 9.0, 13.0, 7.0, 7.0, 15.0, 15.0, 17.0, 22.0, 23.0, 34.0, 31.0, 28.0, 31.0, 34.0, 41.0, 39.0, 40.0, 40.0, 45.0, 1068.0, 39.0, 49.0, 32.0, 42.0, 39.0, 34.0, 27.0, 33.0, 21.0, 19.0, 15.0, 18.0, 23.0, 16.0, 13.0, 11.0, 8.0, 11.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1484375, -4.98284912109375, -4.8172607421875, -4.65167236328125, -4.486083984375, -4.32049560546875, -4.1549072265625, -3.98931884765625, -3.82373046875, -3.65814208984375, -3.4925537109375, -3.32696533203125, -3.161376953125, -2.99578857421875, -2.8302001953125, -2.66461181640625, -2.4990234375, -2.33343505859375, -2.1678466796875, -2.00225830078125, -1.836669921875, -1.67108154296875, -1.5054931640625, -1.33990478515625, -1.17431640625, -1.00872802734375, -0.8431396484375, -0.67755126953125, -0.511962890625, -0.34637451171875, -0.1807861328125, -0.01519775390625, 0.150390625, 0.31597900390625, 0.4815673828125, 0.64715576171875, 0.812744140625, 0.97833251953125, 1.1439208984375, 1.30950927734375, 1.47509765625, 1.64068603515625, 1.8062744140625, 1.97186279296875, 2.137451171875, 2.30303955078125, 2.4686279296875, 2.63421630859375, 2.7998046875, 2.96539306640625, 3.1309814453125, 3.29656982421875, 3.462158203125, 3.62774658203125, 3.7933349609375, 3.95892333984375, 4.12451171875, 4.29010009765625, 4.4556884765625, 4.62127685546875, 4.786865234375, 4.95245361328125, 5.1180419921875, 5.28363037109375, 5.44921875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 11.0, 14.0, 31.0, 38.0, 58.0, 74.0, 125.0, 173.0, 250.0, 349.0, 576.0, 900.0, 1331.0, 2092.0, 3159.0, 4913.0, 7306.0, 11623.0, 17846.0, 27776.0, 44486.0, 70525.0, 111512.0, 176367.0, 1251410.0, 133307.0, 84631.0, 52667.0, 33453.0, 21090.0, 13559.0, 8772.0, 5691.0, 3759.0, 2401.0, 1646.0, 1064.0, 725.0, 463.0, 335.0, 207.0, 138.0, 94.0, 49.0, 45.0, 28.0, 26.0, 9.0, 15.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.048828125, -1.0162506103515625, -0.983673095703125, -0.9510955810546875, -0.91851806640625, -0.8859405517578125, -0.853363037109375, -0.8207855224609375, -0.7882080078125, -0.7556304931640625, -0.723052978515625, -0.6904754638671875, -0.65789794921875, -0.6253204345703125, -0.592742919921875, -0.5601654052734375, -0.527587890625, -0.4950103759765625, -0.462432861328125, -0.4298553466796875, -0.39727783203125, -0.3647003173828125, -0.332122802734375, -0.2995452880859375, -0.2669677734375, -0.2343902587890625, -0.201812744140625, -0.1692352294921875, -0.13665771484375, -0.1040802001953125, -0.071502685546875, -0.0389251708984375, -0.00634765625, 0.0262298583984375, 0.058807373046875, 0.0913848876953125, 0.12396240234375, 0.1565399169921875, 0.189117431640625, 0.2216949462890625, 0.2542724609375, 0.2868499755859375, 0.319427490234375, 0.3520050048828125, 0.38458251953125, 0.4171600341796875, 0.449737548828125, 0.4823150634765625, 0.514892578125, 0.5474700927734375, 0.580047607421875, 0.6126251220703125, 0.64520263671875, 0.6777801513671875, 0.710357666015625, 0.7429351806640625, 0.7755126953125, 0.8080902099609375, 0.840667724609375, 0.8732452392578125, 0.90582275390625, 0.9384002685546875, 0.970977783203125, 1.0035552978515625, 1.0361328125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 7.0, 2.0, 5.0, 7.0, 12.0, 12.0, 18.0, 26.0, 23.0, 25.0, 30.0, 50.0, 39.0, 41.0, 59.0, 70.0, 67.0, 80.0, 70.0, 58.0, 58.0, 46.0, 40.0, 34.0, 28.0, 12.0, 15.0, 16.0, 16.0, 13.0, 3.0, 8.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.002178192138671875, -0.0021116137504577637, -0.0020450353622436523, -0.001978456974029541, -0.0019118785858154297, -0.0018453001976013184, -0.001778721809387207, -0.0017121434211730957, -0.0016455650329589844, -0.001578986644744873, -0.0015124082565307617, -0.0014458298683166504, -0.001379251480102539, -0.0013126730918884277, -0.0012460947036743164, -0.001179516315460205, -0.0011129379272460938, -0.0010463595390319824, -0.000979781150817871, -0.0009132027626037598, -0.0008466243743896484, -0.0007800459861755371, -0.0007134675979614258, -0.0006468892097473145, -0.0005803108215332031, -0.0005137324333190918, -0.00044715404510498047, -0.00038057565689086914, -0.0003139972686767578, -0.0002474188804626465, -0.00018084049224853516, -0.00011426210403442383, -4.76837158203125e-05, 1.8894672393798828e-05, 8.547306060791016e-05, 0.00015205144882202148, 0.0002186298370361328, 0.00028520822525024414, 0.00035178661346435547, 0.0004183650016784668, 0.0004849433898925781, 0.0005515217781066895, 0.0006181001663208008, 0.0006846785545349121, 0.0007512569427490234, 0.0008178353309631348, 0.0008844137191772461, 0.0009509921073913574, 0.0010175704956054688, 0.00108414888381958, 0.0011507272720336914, 0.0012173056602478027, 0.001283884048461914, 0.0013504624366760254, 0.0014170408248901367, 0.001483619213104248, 0.0015501976013183594, 0.0016167759895324707, 0.001683354377746582, 0.0017499327659606934, 0.0018165111541748047, 0.001883089542388916, 0.0019496679306030273, 0.0020162463188171387, 0.00208282470703125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 4.0, 8.0, 10.0, 7.0, 14.0, 14.0, 12.0, 22.0, 30.0, 36.0, 45.0, 66.0, 99.0, 184.0, 419.0, 3466.0, 1039629.0, 3568.0, 390.0, 169.0, 88.0, 66.0, 43.0, 34.0, 35.0, 28.0, 17.0, 14.0, 10.0, 6.0, 4.0, 4.0, 5.0, 4.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.045257568359375, -0.043612003326416016, -0.04196643829345703, -0.04032087326049805, -0.03867530822753906, -0.03702974319458008, -0.035384178161621094, -0.03373861312866211, -0.032093048095703125, -0.03044748306274414, -0.028801918029785156, -0.027156352996826172, -0.025510787963867188, -0.023865222930908203, -0.02221965789794922, -0.020574092864990234, -0.01892852783203125, -0.017282962799072266, -0.01563739776611328, -0.013991832733154297, -0.012346267700195312, -0.010700702667236328, -0.009055137634277344, -0.007409572601318359, -0.005764007568359375, -0.004118442535400391, -0.0024728775024414062, -0.0008273124694824219, 0.0008182525634765625, 0.002463817596435547, 0.004109382629394531, 0.005754947662353516, 0.0074005126953125, 0.009046077728271484, 0.010691642761230469, 0.012337207794189453, 0.013982772827148438, 0.015628337860107422, 0.017273902893066406, 0.01891946792602539, 0.020565032958984375, 0.02221059799194336, 0.023856163024902344, 0.025501728057861328, 0.027147293090820312, 0.028792858123779297, 0.03043842315673828, 0.032083988189697266, 0.03372955322265625, 0.035375118255615234, 0.03702068328857422, 0.0386662483215332, 0.04031181335449219, 0.04195737838745117, 0.043602943420410156, 0.04524850845336914, 0.046894073486328125, 0.04853963851928711, 0.050185203552246094, 0.05183076858520508, 0.05347633361816406, 0.05512189865112305, 0.05676746368408203, 0.058413028717041016, 0.06005859375]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 14.0, 35.0, 103.0, 228.0, 309.0, 198.0, 84.0, 33.0, 7.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004105939995497465, -0.004026070237159729, -0.003946200478821993, -0.0038663307204842567, -0.0037864609621465206, -0.0037065912038087845, -0.0036267214454710484, -0.0035468516871333122, -0.003466981928795576, -0.00338711217045784, -0.003307242412120104, -0.0032273726537823677, -0.0031475028954446316, -0.0030676331371068954, -0.0029877633787691593, -0.002907893620431423, -0.0028280240949243307, -0.0027481543365865946, -0.0026682845782488585, -0.0025884148199111223, -0.002508545061573386, -0.00242867530323565, -0.002348805544897914, -0.0022689360193908215, -0.0021890662610530853, -0.002109196502715349, -0.002029326744377613, -0.001949456986039877, -0.0018695872277021408, -0.0017897174693644047, -0.0017098478274419904, -0.0016299780691042542, -0.0015501080779358745, -0.0014702383195981383, -0.0013903685612604022, -0.001310498802922666, -0.0012306291610002518, -0.0011507594026625156, -0.0010708896443247795, -0.0009910198859870434, -0.0009111501276493073, -0.0008312803693115711, -0.000751410610973835, -0.0006715409108437598, -0.0005916711525060236, -0.0005118013941682875, -0.00043193166493438184, -0.00035206193570047617, -0.00027219217736274004, -0.00019232243357691914, -0.00011245268979109824, -3.2582946005277336e-05, 4.7286797780543566e-05, 0.0001271565561182797, 0.00020702628535218537, 0.00028689601458609104, 0.00036676577292382717, 0.0004466355312615633, 0.0005265052895992994, 0.0006063749897293746, 0.0006862447480671108, 0.0007661145064048469, 0.0008459842065349221, 0.0009258539648726583, 0.0010057237232103944]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 6.0, 7.0, 4.0, 8.0, 7.0, 16.0, 9.0, 15.0, 17.0, 11.0, 25.0, 20.0, 21.0, 37.0, 32.0, 26.0, 46.0, 32.0, 33.0, 38.0, 49.0, 37.0, 31.0, 36.0, 36.0, 34.0, 35.0, 41.0, 37.0, 29.0, 31.0, 24.0, 27.0, 19.0, 20.0, 16.0, 12.0, 11.0, 12.0, 11.0, 13.0, 6.0, 9.0, 4.0, 4.0, 5.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008845329284667969, -0.0008559860289096832, -0.0008274391293525696, -0.0007988922297954559, -0.0007703453302383423, -0.0007417984306812286, -0.000713251531124115, -0.0006847046315670013, -0.0006561577320098877, -0.000627610832452774, -0.0005990639328956604, -0.0005705170333385468, -0.0005419701337814331, -0.0005134232342243195, -0.0004848763346672058, -0.00045632943511009216, -0.0004277825355529785, -0.00039923563599586487, -0.0003706887364387512, -0.0003421418368816376, -0.0003135949373245239, -0.0002850480377674103, -0.00025650113821029663, -0.00022795423865318298, -0.00019940733909606934, -0.0001708604395389557, -0.00014231353998184204, -0.0001137666404247284, -8.521974086761475e-05, -5.66728413105011e-05, -2.812594175338745e-05, 4.209578037261963e-07, 2.8967857360839844e-05, 5.751475691795349e-05, 8.606165647506714e-05, 0.00011460855603218079, 0.00014315545558929443, 0.00017170235514640808, 0.00020024925470352173, 0.00022879615426063538, 0.000257343053817749, 0.00028588995337486267, 0.0003144368529319763, 0.00034298375248908997, 0.0003715306520462036, 0.00040007755160331726, 0.0004286244511604309, 0.00045717135071754456, 0.0004857182502746582, 0.0005142651498317719, 0.0005428120493888855, 0.0005713589489459991, 0.0005999058485031128, 0.0006284527480602264, 0.0006569996476173401, 0.0006855465471744537, 0.0007140934467315674, 0.000742640346288681, 0.0007711872458457947, 0.0007997341454029083, 0.000828281044960022, 0.0008568279445171356, 0.0008853748440742493, 0.0009139217436313629, 0.0009424686431884766]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 6.0, 6.0, 5.0, 8.0, 9.0, 11.0, 12.0, 17.0, 12.0, 13.0, 14.0, 30.0, 21.0, 34.0, 40.0, 17.0, 37.0, 39.0, 43.0, 36.0, 42.0, 37.0, 35.0, 44.0, 33.0, 31.0, 30.0, 29.0, 31.0, 37.0, 29.0, 22.0, 22.0, 26.0, 21.0, 17.0, 16.0, 19.0, 17.0, 15.0, 8.0, 7.0, 8.0, 7.0, 1.0, 4.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.73046875, -6.5057373046875, -6.281005859375, -6.0562744140625, -5.83154296875, -5.6068115234375, -5.382080078125, -5.1573486328125, -4.9326171875, -4.7078857421875, -4.483154296875, -4.2584228515625, -4.03369140625, -3.8089599609375, -3.584228515625, -3.3594970703125, -3.134765625, -2.9100341796875, -2.685302734375, -2.4605712890625, -2.23583984375, -2.0111083984375, -1.786376953125, -1.5616455078125, -1.3369140625, -1.1121826171875, -0.887451171875, -0.6627197265625, -0.43798828125, -0.2132568359375, 0.011474609375, 0.2362060546875, 0.4609375, 0.6856689453125, 0.910400390625, 1.1351318359375, 1.35986328125, 1.5845947265625, 1.809326171875, 2.0340576171875, 2.2587890625, 2.4835205078125, 2.708251953125, 2.9329833984375, 3.15771484375, 3.3824462890625, 3.607177734375, 3.8319091796875, 4.056640625, 4.2813720703125, 4.506103515625, 4.7308349609375, 4.95556640625, 5.1802978515625, 5.405029296875, 5.6297607421875, 5.8544921875, 6.0792236328125, 6.303955078125, 6.5286865234375, 6.75341796875, 6.9781494140625, 7.202880859375, 7.4276123046875, 7.65234375]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 2.0, 6.0, 8.0, 16.0, 15.0, 17.0, 40.0, 45.0, 61.0, 81.0, 109.0, 135.0, 193.0, 284.0, 427.0, 632.0, 997.0, 1807.0, 3298.0, 6005.0, 12248.0, 26092.0, 61734.0, 165667.0, 399695.0, 223175.0, 80697.0, 33321.0, 14836.0, 7340.0, 3862.0, 2121.0, 1256.0, 732.0, 469.0, 347.0, 208.0, 163.0, 104.0, 80.0, 68.0, 38.0, 32.0, 24.0, 22.0, 13.0, 14.0, 12.0, 4.0, 3.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6171875, -4.45599365234375, -4.2947998046875, -4.13360595703125, -3.972412109375, -3.81121826171875, -3.6500244140625, -3.48883056640625, -3.32763671875, -3.16644287109375, -3.0052490234375, -2.84405517578125, -2.682861328125, -2.52166748046875, -2.3604736328125, -2.19927978515625, -2.0380859375, -1.87689208984375, -1.7156982421875, -1.55450439453125, -1.393310546875, -1.23211669921875, -1.0709228515625, -0.90972900390625, -0.74853515625, -0.58734130859375, -0.4261474609375, -0.26495361328125, -0.103759765625, 0.05743408203125, 0.2186279296875, 0.37982177734375, 0.541015625, 0.70220947265625, 0.8634033203125, 1.02459716796875, 1.185791015625, 1.34698486328125, 1.5081787109375, 1.66937255859375, 1.83056640625, 1.99176025390625, 2.1529541015625, 2.31414794921875, 2.475341796875, 2.63653564453125, 2.7977294921875, 2.95892333984375, 3.1201171875, 3.28131103515625, 3.4425048828125, 3.60369873046875, 3.764892578125, 3.92608642578125, 4.0872802734375, 4.24847412109375, 4.40966796875, 4.57086181640625, 4.7320556640625, 4.89324951171875, 5.054443359375, 5.21563720703125, 5.3768310546875, 5.53802490234375, 5.69921875]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 5.0, 0.0, 1.0, 2.0, 3.0, 6.0, 2.0, 6.0, 6.0, 6.0, 11.0, 9.0, 15.0, 13.0, 18.0, 16.0, 19.0, 21.0, 16.0, 25.0, 30.0, 28.0, 35.0, 37.0, 49.0, 67.0, 75.0, 242.0, 1632.0, 147.0, 70.0, 60.0, 42.0, 37.0, 38.0, 29.0, 40.0, 29.0, 30.0, 19.0, 12.0, 18.0, 23.0, 13.0, 9.0, 7.0, 9.0, 13.0, 6.0, 2.0, 2.0, 2.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-21.84375, -21.146484375, -20.44921875, -19.751953125, -19.0546875, -18.357421875, -17.66015625, -16.962890625, -16.265625, -15.568359375, -14.87109375, -14.173828125, -13.4765625, -12.779296875, -12.08203125, -11.384765625, -10.6875, -9.990234375, -9.29296875, -8.595703125, -7.8984375, -7.201171875, -6.50390625, -5.806640625, -5.109375, -4.412109375, -3.71484375, -3.017578125, -2.3203125, -1.623046875, -0.92578125, -0.228515625, 0.46875, 1.166015625, 1.86328125, 2.560546875, 3.2578125, 3.955078125, 4.65234375, 5.349609375, 6.046875, 6.744140625, 7.44140625, 8.138671875, 8.8359375, 9.533203125, 10.23046875, 10.927734375, 11.625, 12.322265625, 13.01953125, 13.716796875, 14.4140625, 15.111328125, 15.80859375, 16.505859375, 17.203125, 17.900390625, 18.59765625, 19.294921875, 19.9921875, 20.689453125, 21.38671875, 22.083984375, 22.78125]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 4.0, 1.0, 0.0, 4.0, 2.0, 2.0, 9.0, 3.0, 0.0, 10.0, 15.0, 7.0, 17.0, 30.0, 39.0, 45.0, 70.0, 70.0, 136.0, 173.0, 236.0, 366.0, 676.0, 7416.0, 3113837.0, 20469.0, 821.0, 376.0, 246.0, 164.0, 108.0, 89.0, 78.0, 48.0, 39.0, 26.0, 19.0, 16.0, 14.0, 8.0, 8.0, 8.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.875, -64.5361328125, -62.197265625, -59.8583984375, -57.51953125, -55.1806640625, -52.841796875, -50.5029296875, -48.1640625, -45.8251953125, -43.486328125, -41.1474609375, -38.80859375, -36.4697265625, -34.130859375, -31.7919921875, -29.453125, -27.1142578125, -24.775390625, -22.4365234375, -20.09765625, -17.7587890625, -15.419921875, -13.0810546875, -10.7421875, -8.4033203125, -6.064453125, -3.7255859375, -1.38671875, 0.9521484375, 3.291015625, 5.6298828125, 7.96875, 10.3076171875, 12.646484375, 14.9853515625, 17.32421875, 19.6630859375, 22.001953125, 24.3408203125, 26.6796875, 29.0185546875, 31.357421875, 33.6962890625, 36.03515625, 38.3740234375, 40.712890625, 43.0517578125, 45.390625, 47.7294921875, 50.068359375, 52.4072265625, 54.74609375, 57.0849609375, 59.423828125, 61.7626953125, 64.1015625, 66.4404296875, 68.779296875, 71.1181640625, 73.45703125, 75.7958984375, 78.134765625, 80.4736328125, 82.8125]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [2.0, 29.0, 815.0, 172.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.58217430114746, -12.40479850769043, -5.227422714233398, 1.9499530792236328, 9.127328872680664, 16.304704666137695, 23.482080459594727, 30.659456253051758, 37.836830139160156, 45.01420593261719, 52.19158172607422, 59.36895751953125, 66.54633331298828, 73.72370910644531, 80.90108489990234, 88.07846069335938, 95.2558364868164, 102.43321228027344, 109.61058807373047, 116.7879638671875, 123.96533966064453, 131.14271545410156, 138.32009887695312, 145.49746704101562, 152.6748504638672, 159.85223388671875, 167.02960205078125, 174.20697021484375, 181.3843536376953, 188.56173706054688, 195.73910522460938, 202.91647338867188, 210.09384155273438, 217.27120971679688, 224.44859313964844, 231.6259765625, 238.8033447265625, 245.980712890625, 253.15809631347656, 260.3354797363281, 267.5128479003906, 274.6902160644531, 281.86761474609375, 289.04498291015625, 296.22235107421875, 303.39971923828125, 310.57708740234375, 317.7544860839844, 324.9318542480469, 332.1092224121094, 339.28662109375, 346.4639892578125, 353.641357421875, 360.8187255859375, 367.99609375, 375.1734924316406, 382.3508605957031, 389.5282287597656, 396.70562744140625, 403.88299560546875, 411.06036376953125, 418.23773193359375, 425.41510009765625, 432.5924987792969, 439.7698669433594]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 3.0, 9.0, 7.0, 9.0, 8.0, 13.0, 13.0, 14.0, 21.0, 16.0, 25.0, 25.0, 35.0, 35.0, 43.0, 39.0, 55.0, 44.0, 42.0, 51.0, 57.0, 36.0, 47.0, 34.0, 40.0, 37.0, 34.0, 42.0, 29.0, 31.0, 17.0, 19.0, 13.0, 20.0, 10.0, 5.0, 4.0, 10.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-76.5431900024414, -74.22920989990234, -71.91523742675781, -69.60125732421875, -67.28728485107422, -64.97330474853516, -62.659332275390625, -60.34535217285156, -58.03137969970703, -55.717403411865234, -53.40342712402344, -51.08945083618164, -48.775474548339844, -46.46149826049805, -44.14752197265625, -41.83354187011719, -39.51956558227539, -37.205589294433594, -34.8916130065918, -32.57763671875, -30.263660430908203, -27.949684143066406, -25.635705947875977, -23.32172966003418, -21.007753372192383, -18.693777084350586, -16.37980079650879, -14.065823554992676, -11.751847267150879, -9.437870979309082, -7.123893737792969, -4.809917449951172, -2.495941162109375, -0.18196463584899902, 2.132011890411377, 4.445988655090332, 6.759964942932129, 9.073941230773926, 11.387918472290039, 13.701894760131836, 16.015871047973633, 18.32984733581543, 20.643823623657227, 22.957801818847656, 25.271778106689453, 27.58575439453125, 29.899730682373047, 32.213706970214844, 34.52768325805664, 36.84165954589844, 39.155635833740234, 41.46961212158203, 43.78358840942383, 46.097564697265625, 48.41154479980469, 50.72551727294922, 53.03949737548828, 55.35347366333008, 57.667449951171875, 59.98142623901367, 62.29540252685547, 64.60938262939453, 66.92335510253906, 69.23733520507812, 71.55130767822266]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 11.0, 8.0, 9.0, 11.0, 13.0, 8.0, 15.0, 16.0, 13.0, 20.0, 20.0, 37.0, 25.0, 39.0, 32.0, 29.0, 41.0, 35.0, 51.0, 29.0, 43.0, 38.0, 34.0, 35.0, 33.0, 29.0, 30.0, 26.0, 27.0, 35.0, 23.0, 23.0, 16.0, 15.0, 18.0, 21.0, 14.0, 11.0, 11.0, 16.0, 6.0, 5.0, 7.0, 5.0, 3.0, 4.0, 4.0, 1.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.92578125, -6.697021484375, -6.46826171875, -6.239501953125, -6.0107421875, -5.781982421875, -5.55322265625, -5.324462890625, -5.095703125, -4.866943359375, -4.63818359375, -4.409423828125, -4.1806640625, -3.951904296875, -3.72314453125, -3.494384765625, -3.265625, -3.036865234375, -2.80810546875, -2.579345703125, -2.3505859375, -2.121826171875, -1.89306640625, -1.664306640625, -1.435546875, -1.206787109375, -0.97802734375, -0.749267578125, -0.5205078125, -0.291748046875, -0.06298828125, 0.165771484375, 0.39453125, 0.623291015625, 0.85205078125, 1.080810546875, 1.3095703125, 1.538330078125, 1.76708984375, 1.995849609375, 2.224609375, 2.453369140625, 2.68212890625, 2.910888671875, 3.1396484375, 3.368408203125, 3.59716796875, 3.825927734375, 4.0546875, 4.283447265625, 4.51220703125, 4.740966796875, 4.9697265625, 5.198486328125, 5.42724609375, 5.656005859375, 5.884765625, 6.113525390625, 6.34228515625, 6.571044921875, 6.7998046875, 7.028564453125, 7.25732421875, 7.486083984375, 7.71484375]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 6.0, 9.0, 9.0, 16.0, 7.0, 11.0, 12.0, 17.0, 13.0, 22.0, 23.0, 32.0, 46.0, 67.0, 115.0, 186.0, 369.0, 882.0, 2690.0, 11395.0, 134189.0, 2009562.0, 1911760.0, 108268.0, 10255.0, 2486.0, 841.0, 355.0, 197.0, 115.0, 65.0, 40.0, 36.0, 31.0, 23.0, 17.0, 17.0, 10.0, 16.0, 17.0, 9.0, 9.0, 12.0, 3.0, 3.0, 4.0, 3.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-18.75, -18.12451171875, -17.4990234375, -16.87353515625, -16.248046875, -15.62255859375, -14.9970703125, -14.37158203125, -13.74609375, -13.12060546875, -12.4951171875, -11.86962890625, -11.244140625, -10.61865234375, -9.9931640625, -9.36767578125, -8.7421875, -8.11669921875, -7.4912109375, -6.86572265625, -6.240234375, -5.61474609375, -4.9892578125, -4.36376953125, -3.73828125, -3.11279296875, -2.4873046875, -1.86181640625, -1.236328125, -0.61083984375, 0.0146484375, 0.64013671875, 1.265625, 1.89111328125, 2.5166015625, 3.14208984375, 3.767578125, 4.39306640625, 5.0185546875, 5.64404296875, 6.26953125, 6.89501953125, 7.5205078125, 8.14599609375, 8.771484375, 9.39697265625, 10.0224609375, 10.64794921875, 11.2734375, 11.89892578125, 12.5244140625, 13.14990234375, 13.775390625, 14.40087890625, 15.0263671875, 15.65185546875, 16.27734375, 16.90283203125, 17.5283203125, 18.15380859375, 18.779296875, 19.40478515625, 20.0302734375, 20.65576171875, 21.28125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 4.0, 2.0, 7.0, 16.0, 5.0, 17.0, 24.0, 23.0, 35.0, 37.0, 44.0, 68.0, 80.0, 115.0, 133.0, 176.0, 215.0, 257.0, 344.0, 402.0, 358.0, 372.0, 304.0, 226.0, 187.0, 137.0, 92.0, 81.0, 62.0, 50.0, 54.0, 32.0, 28.0, 22.0, 17.0, 16.0, 8.0, 7.0, 9.0, 2.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6875, -10.2791748046875, -9.870849609375, -9.4625244140625, -9.05419921875, -8.6458740234375, -8.237548828125, -7.8292236328125, -7.4208984375, -7.0125732421875, -6.604248046875, -6.1959228515625, -5.78759765625, -5.3792724609375, -4.970947265625, -4.5626220703125, -4.154296875, -3.7459716796875, -3.337646484375, -2.9293212890625, -2.52099609375, -2.1126708984375, -1.704345703125, -1.2960205078125, -0.8876953125, -0.4793701171875, -0.071044921875, 0.3372802734375, 0.74560546875, 1.1539306640625, 1.562255859375, 1.9705810546875, 2.37890625, 2.7872314453125, 3.195556640625, 3.6038818359375, 4.01220703125, 4.4205322265625, 4.828857421875, 5.2371826171875, 5.6455078125, 6.0538330078125, 6.462158203125, 6.8704833984375, 7.27880859375, 7.6871337890625, 8.095458984375, 8.5037841796875, 8.912109375, 9.3204345703125, 9.728759765625, 10.1370849609375, 10.54541015625, 10.9537353515625, 11.362060546875, 11.7703857421875, 12.1787109375, 12.5870361328125, 12.995361328125, 13.4036865234375, 13.81201171875, 14.2203369140625, 14.628662109375, 15.0369873046875, 15.4453125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 8.0, 11.0, 10.0, 9.0, 10.0, 28.0, 27.0, 34.0, 41.0, 52.0, 70.0, 80.0, 128.0, 121.0, 190.0, 260.0, 416.0, 923.0, 46247.0, 4109348.0, 33803.0, 820.0, 475.0, 288.0, 218.0, 155.0, 115.0, 83.0, 61.0, 62.0, 50.0, 20.0, 34.0, 28.0, 9.0, 15.0, 7.0, 8.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-74.625, -72.3271484375, -70.029296875, -67.7314453125, -65.43359375, -63.1357421875, -60.837890625, -58.5400390625, -56.2421875, -53.9443359375, -51.646484375, -49.3486328125, -47.05078125, -44.7529296875, -42.455078125, -40.1572265625, -37.859375, -35.5615234375, -33.263671875, -30.9658203125, -28.66796875, -26.3701171875, -24.072265625, -21.7744140625, -19.4765625, -17.1787109375, -14.880859375, -12.5830078125, -10.28515625, -7.9873046875, -5.689453125, -3.3916015625, -1.09375, 1.2041015625, 3.501953125, 5.7998046875, 8.09765625, 10.3955078125, 12.693359375, 14.9912109375, 17.2890625, 19.5869140625, 21.884765625, 24.1826171875, 26.48046875, 28.7783203125, 31.076171875, 33.3740234375, 35.671875, 37.9697265625, 40.267578125, 42.5654296875, 44.86328125, 47.1611328125, 49.458984375, 51.7568359375, 54.0546875, 56.3525390625, 58.650390625, 60.9482421875, 63.24609375, 65.5439453125, 67.841796875, 70.1396484375, 72.4375]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 9.0, 31.0, 89.0, 213.0, 249.0, 214.0, 121.0, 64.0, 12.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.55559539794922, -95.68846893310547, -91.82134246826172, -87.95421600341797, -84.08708190917969, -80.21995544433594, -76.35282897949219, -72.48570251464844, -68.61857604980469, -64.75144958496094, -60.88432312011719, -57.01719284057617, -53.15006637573242, -49.28293991088867, -45.415809631347656, -41.548683166503906, -37.681556701660156, -33.814430236816406, -29.947301864624023, -26.08017349243164, -22.21304702758789, -18.34592056274414, -14.478792190551758, -10.611663818359375, -6.744537353515625, -2.8774099349975586, 0.9897174835205078, 4.856844902038574, 8.72397232055664, 12.59109878540039, 16.458227157592773, 20.325355529785156, 24.192489624023438, 28.059616088867188, 31.92674446105957, 35.79387283325195, 39.6609992980957, 43.52812576293945, 47.39525604248047, 51.26238250732422, 55.12950897216797, 58.99663543701172, 62.86376190185547, 66.73088836669922, 70.5980224609375, 74.46514892578125, 78.332275390625, 82.19940185546875, 86.0665283203125, 89.93365478515625, 93.80078125, 97.66790771484375, 101.5350341796875, 105.40216064453125, 109.26929473876953, 113.13642120361328, 117.00354766845703, 120.87067413330078, 124.73780059814453, 128.6049346923828, 132.47206115722656, 136.3391876220703, 140.20631408691406, 144.0734405517578, 147.94056701660156]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 3.0, 4.0, 6.0, 11.0, 11.0, 11.0, 22.0, 28.0, 20.0, 24.0, 25.0, 33.0, 42.0, 46.0, 45.0, 39.0, 49.0, 49.0, 47.0, 49.0, 46.0, 35.0, 64.0, 41.0, 45.0, 31.0, 34.0, 23.0, 20.0, 15.0, 17.0, 16.0, 13.0, 11.0, 9.0, 9.0, 5.0, 1.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-62.331787109375, -60.52672576904297, -58.7216682434082, -56.91661071777344, -55.111549377441406, -53.306488037109375, -51.50143051147461, -49.696372985839844, -47.89131164550781, -46.08625030517578, -44.281192779541016, -42.47613525390625, -40.67107391357422, -38.86601257324219, -37.06095504760742, -35.255897521972656, -33.450836181640625, -31.645776748657227, -29.840717315673828, -28.03565788269043, -26.23059844970703, -24.425539016723633, -22.620479583740234, -20.815420150756836, -19.010360717773438, -17.20530128479004, -15.40024185180664, -13.595182418823242, -11.790122985839844, -9.985063552856445, -8.180004119873047, -6.374944686889648, -4.56988525390625, -2.7648258209228516, -0.9597663879394531, 0.8452930450439453, 2.6503524780273438, 4.455411911010742, 6.260471343994141, 8.065530776977539, 9.870590209960938, 11.675649642944336, 13.480709075927734, 15.285768508911133, 17.09082794189453, 18.89588737487793, 20.700946807861328, 22.506006240844727, 24.311065673828125, 26.116125106811523, 27.921184539794922, 29.72624397277832, 31.53130340576172, 33.33636474609375, 35.141422271728516, 36.94647979736328, 38.75154113769531, 40.556602478027344, 42.36166000366211, 44.166717529296875, 45.971778869628906, 47.77684020996094, 49.5818977355957, 51.38695526123047, 53.1920166015625]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 7.0, 11.0, 9.0, 6.0, 17.0, 6.0, 13.0, 18.0, 19.0, 22.0, 19.0, 29.0, 29.0, 22.0, 37.0, 32.0, 36.0, 50.0, 37.0, 40.0, 33.0, 55.0, 32.0, 39.0, 31.0, 24.0, 38.0, 33.0, 20.0, 32.0, 19.0, 29.0, 18.0, 16.0, 19.0, 16.0, 15.0, 14.0, 6.0, 8.0, 13.0, 5.0, 6.0, 4.0, 4.0, 2.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.70703125, -6.47802734375, -6.2490234375, -6.02001953125, -5.791015625, -5.56201171875, -5.3330078125, -5.10400390625, -4.875, -4.64599609375, -4.4169921875, -4.18798828125, -3.958984375, -3.72998046875, -3.5009765625, -3.27197265625, -3.04296875, -2.81396484375, -2.5849609375, -2.35595703125, -2.126953125, -1.89794921875, -1.6689453125, -1.43994140625, -1.2109375, -0.98193359375, -0.7529296875, -0.52392578125, -0.294921875, -0.06591796875, 0.1630859375, 0.39208984375, 0.62109375, 0.85009765625, 1.0791015625, 1.30810546875, 1.537109375, 1.76611328125, 1.9951171875, 2.22412109375, 2.453125, 2.68212890625, 2.9111328125, 3.14013671875, 3.369140625, 3.59814453125, 3.8271484375, 4.05615234375, 4.28515625, 4.51416015625, 4.7431640625, 4.97216796875, 5.201171875, 5.43017578125, 5.6591796875, 5.88818359375, 6.1171875, 6.34619140625, 6.5751953125, 6.80419921875, 7.033203125, 7.26220703125, 7.4912109375, 7.72021484375, 7.94921875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 6.0, 7.0, 14.0, 9.0, 14.0, 21.0, 41.0, 68.0, 90.0, 145.0, 238.0, 353.0, 475.0, 775.0, 1168.0, 1686.0, 2556.0, 3947.0, 5795.0, 8764.0, 12952.0, 19375.0, 29528.0, 44489.0, 67979.0, 104105.0, 161181.0, 195636.0, 133743.0, 86192.0, 56937.0, 37061.0, 24332.0, 16238.0, 11006.0, 7146.0, 4808.0, 3272.0, 2169.0, 1418.0, 917.0, 665.0, 462.0, 245.0, 165.0, 123.0, 87.0, 49.0, 34.0, 29.0, 22.0, 10.0, 9.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.98486328125, -0.9523391723632812, -0.9198150634765625, -0.8872909545898438, -0.854766845703125, -0.8222427368164062, -0.7897186279296875, -0.7571945190429688, -0.72467041015625, -0.6921463012695312, -0.6596221923828125, -0.6270980834960938, -0.594573974609375, -0.5620498657226562, -0.5295257568359375, -0.49700164794921875, -0.4644775390625, -0.43195343017578125, -0.3994293212890625, -0.36690521240234375, -0.334381103515625, -0.30185699462890625, -0.2693328857421875, -0.23680877685546875, -0.20428466796875, -0.17176055908203125, -0.1392364501953125, -0.10671234130859375, -0.074188232421875, -0.04166412353515625, -0.0091400146484375, 0.02338409423828125, 0.055908203125, 0.08843231201171875, 0.1209564208984375, 0.15348052978515625, 0.186004638671875, 0.21852874755859375, 0.2510528564453125, 0.28357696533203125, 0.31610107421875, 0.34862518310546875, 0.3811492919921875, 0.41367340087890625, 0.446197509765625, 0.47872161865234375, 0.5112457275390625, 0.5437698364257812, 0.5762939453125, 0.6088180541992188, 0.6413421630859375, 0.6738662719726562, 0.706390380859375, 0.7389144897460938, 0.7714385986328125, 0.8039627075195312, 0.83648681640625, 0.8690109252929688, 0.9015350341796875, 0.9340591430664062, 0.966583251953125, 0.9991073608398438, 1.0316314697265625, 1.0641555786132812, 1.0966796875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 6.0, 5.0, 8.0, 7.0, 15.0, 3.0, 14.0, 8.0, 9.0, 11.0, 16.0, 12.0, 13.0, 27.0, 22.0, 27.0, 25.0, 30.0, 22.0, 29.0, 33.0, 43.0, 40.0, 40.0, 36.0, 1050.0, 41.0, 39.0, 43.0, 45.0, 22.0, 37.0, 30.0, 27.0, 24.0, 25.0, 20.0, 18.0, 12.0, 24.0, 10.0, 17.0, 8.0, 6.0, 9.0, 4.0, 8.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.08984375, -3.95098876953125, -3.8121337890625, -3.67327880859375, -3.534423828125, -3.39556884765625, -3.2567138671875, -3.11785888671875, -2.97900390625, -2.84014892578125, -2.7012939453125, -2.56243896484375, -2.423583984375, -2.28472900390625, -2.1458740234375, -2.00701904296875, -1.8681640625, -1.72930908203125, -1.5904541015625, -1.45159912109375, -1.312744140625, -1.17388916015625, -1.0350341796875, -0.89617919921875, -0.75732421875, -0.61846923828125, -0.4796142578125, -0.34075927734375, -0.201904296875, -0.06304931640625, 0.0758056640625, 0.21466064453125, 0.353515625, 0.49237060546875, 0.6312255859375, 0.77008056640625, 0.908935546875, 1.04779052734375, 1.1866455078125, 1.32550048828125, 1.46435546875, 1.60321044921875, 1.7420654296875, 1.88092041015625, 2.019775390625, 2.15863037109375, 2.2974853515625, 2.43634033203125, 2.5751953125, 2.71405029296875, 2.8529052734375, 2.99176025390625, 3.130615234375, 3.26947021484375, 3.4083251953125, 3.54718017578125, 3.68603515625, 3.82489013671875, 3.9637451171875, 4.10260009765625, 4.241455078125, 4.38031005859375, 4.5191650390625, 4.65802001953125, 4.796875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 10.0, 14.0, 25.0, 35.0, 52.0, 77.0, 110.0, 187.0, 281.0, 436.0, 680.0, 1050.0, 1578.0, 2398.0, 3724.0, 5751.0, 8921.0, 13597.0, 20887.0, 32869.0, 51438.0, 81986.0, 130514.0, 1245213.0, 180424.0, 115427.0, 72368.0, 45296.0, 28742.0, 18470.0, 12003.0, 7745.0, 5146.0, 3389.0, 2179.0, 1432.0, 929.0, 638.0, 387.0, 277.0, 162.0, 109.0, 63.0, 37.0, 23.0, 19.0, 17.0, 7.0, 7.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.041015625, -1.00933837890625, -0.9776611328125, -0.94598388671875, -0.914306640625, -0.88262939453125, -0.8509521484375, -0.81927490234375, -0.78759765625, -0.75592041015625, -0.7242431640625, -0.69256591796875, -0.660888671875, -0.62921142578125, -0.5975341796875, -0.56585693359375, -0.5341796875, -0.50250244140625, -0.4708251953125, -0.43914794921875, -0.407470703125, -0.37579345703125, -0.3441162109375, -0.31243896484375, -0.28076171875, -0.24908447265625, -0.2174072265625, -0.18572998046875, -0.154052734375, -0.12237548828125, -0.0906982421875, -0.05902099609375, -0.02734375, 0.00433349609375, 0.0360107421875, 0.06768798828125, 0.099365234375, 0.13104248046875, 0.1627197265625, 0.19439697265625, 0.22607421875, 0.25775146484375, 0.2894287109375, 0.32110595703125, 0.352783203125, 0.38446044921875, 0.4161376953125, 0.44781494140625, 0.4794921875, 0.51116943359375, 0.5428466796875, 0.57452392578125, 0.606201171875, 0.63787841796875, 0.6695556640625, 0.70123291015625, 0.73291015625, 0.76458740234375, 0.7962646484375, 0.82794189453125, 0.859619140625, 0.89129638671875, 0.9229736328125, 0.95465087890625, 0.986328125]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 3.0, 11.0, 2.0, 5.0, 4.0, 12.0, 8.0, 15.0, 8.0, 16.0, 21.0, 23.0, 27.0, 34.0, 42.0, 44.0, 40.0, 61.0, 43.0, 54.0, 48.0, 54.0, 43.0, 37.0, 49.0, 48.0, 36.0, 41.0, 34.0, 28.0, 25.0, 17.0, 16.0, 14.0, 7.0, 8.0, 4.0, 3.0, 5.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0017833709716796875, -0.0017272084951400757, -0.0016710460186004639, -0.001614883542060852, -0.0015587210655212402, -0.0015025585889816284, -0.0014463961124420166, -0.0013902336359024048, -0.001334071159362793, -0.0012779086828231812, -0.0012217462062835693, -0.0011655837297439575, -0.0011094212532043457, -0.0010532587766647339, -0.000997096300125122, -0.0009409338235855103, -0.0008847713470458984, -0.0008286088705062866, -0.0007724463939666748, -0.000716283917427063, -0.0006601214408874512, -0.0006039589643478394, -0.0005477964878082275, -0.0004916340112686157, -0.0004354715347290039, -0.0003793090581893921, -0.0003231465816497803, -0.00026698410511016846, -0.00021082162857055664, -0.00015465915203094482, -9.849667549133301e-05, -4.233419895172119e-05, 1.3828277587890625e-05, 6.999075412750244e-05, 0.00012615323066711426, 0.00018231570720672607, 0.0002384781837463379, 0.0002946406602859497, 0.0003508031368255615, 0.00040696561336517334, 0.00046312808990478516, 0.000519290566444397, 0.0005754530429840088, 0.0006316155195236206, 0.0006877779960632324, 0.0007439404726028442, 0.0008001029491424561, 0.0008562654256820679, 0.0009124279022216797, 0.0009685903787612915, 0.0010247528553009033, 0.0010809153318405151, 0.001137077808380127, 0.0011932402849197388, 0.0012494027614593506, 0.0013055652379989624, 0.0013617277145385742, 0.001417890191078186, 0.0014740526676177979, 0.0015302151441574097, 0.0015863776206970215, 0.0016425400972366333, 0.0016987025737762451, 0.001754865050315857, 0.0018110275268554688]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 7.0, 2.0, 5.0, 7.0, 5.0, 6.0, 12.0, 17.0, 26.0, 13.0, 27.0, 47.0, 49.0, 54.0, 64.0, 74.0, 119.0, 278.0, 696.0, 7042.0, 1034554.0, 4049.0, 626.0, 239.0, 119.0, 71.0, 72.0, 50.0, 44.0, 33.0, 17.0, 28.0, 17.0, 15.0, 18.0, 7.0, 6.0, 11.0, 6.0, 2.0, 5.0, 4.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.04229736328125, -0.040993690490722656, -0.03969001770019531, -0.03838634490966797, -0.037082672119140625, -0.03577899932861328, -0.03447532653808594, -0.033171653747558594, -0.03186798095703125, -0.030564308166503906, -0.029260635375976562, -0.02795696258544922, -0.026653289794921875, -0.02534961700439453, -0.024045944213867188, -0.022742271423339844, -0.0214385986328125, -0.020134925842285156, -0.018831253051757812, -0.01752758026123047, -0.016223907470703125, -0.014920234680175781, -0.013616561889648438, -0.012312889099121094, -0.01100921630859375, -0.009705543518066406, -0.008401870727539062, -0.007098197937011719, -0.005794525146484375, -0.004490852355957031, -0.0031871795654296875, -0.0018835067749023438, -0.000579833984375, 0.0007238388061523438, 0.0020275115966796875, 0.0033311843872070312, 0.004634857177734375, 0.005938529968261719, 0.0072422027587890625, 0.008545875549316406, 0.00984954833984375, 0.011153221130371094, 0.012456893920898438, 0.013760566711425781, 0.015064239501953125, 0.01636791229248047, 0.017671585083007812, 0.018975257873535156, 0.0202789306640625, 0.021582603454589844, 0.022886276245117188, 0.02418994903564453, 0.025493621826171875, 0.02679729461669922, 0.028100967407226562, 0.029404640197753906, 0.03070831298828125, 0.032011985778808594, 0.03331565856933594, 0.03461933135986328, 0.035923004150390625, 0.03722667694091797, 0.03853034973144531, 0.039834022521972656, 0.0411376953125]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 82.0, 609.0, 306.0, 14.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.010601067915558815, -0.010411077179014683, -0.010221085511147976, -0.010031094774603844, -0.009841103106737137, -0.009651112370193005, -0.009461120702326298, -0.009271129965782166, -0.009081138297915459, -0.008891147561371326, -0.00870115589350462, -0.008511165156960487, -0.00832117348909378, -0.008131182752549648, -0.007941191084682941, -0.007751200348138809, -0.00756120914593339, -0.00737121794372797, -0.007181226741522551, -0.006991235539317131, -0.0068012443371117115, -0.006611253134906292, -0.00642126239836216, -0.006231270730495453, -0.006041279993951321, -0.005851288791745901, -0.005661297589540482, -0.005471306387335062, -0.0052813151851296425, -0.005091323982924223, -0.004901332780718803, -0.004711342044174671, -0.004521349910646677, -0.0043313587084412575, -0.004141367506235838, -0.003951376304030418, -0.003761385101824999, -0.0035713938996195793, -0.0033814029302448034, -0.003191411728039384, -0.003001420758664608, -0.0028114295564591885, -0.002621438354253769, -0.0024314471520483494, -0.00224145594984293, -0.0020514647476375103, -0.0018614737782627344, -0.0016714825760573149, -0.0014814912574365735, -0.001291500055231154, -0.0011015089694410563, -0.0009115177672356367, -0.0007215265650302172, -0.0005315353628247976, -0.0003415442770346999, -0.00015155307482928038, 3.8438127376139164e-05, 0.00022842930047772825, 0.00041842047357931733, 0.000608411617577076, 0.0007984028197824955, 0.000988394021987915, 0.0011783851077780128, 0.0013683763099834323, 0.0015583675121888518]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 1.0, 4.0, 4.0, 9.0, 11.0, 11.0, 11.0, 15.0, 20.0, 26.0, 28.0, 21.0, 17.0, 30.0, 29.0, 41.0, 37.0, 41.0, 32.0, 43.0, 37.0, 30.0, 56.0, 39.0, 44.0, 30.0, 49.0, 41.0, 33.0, 29.0, 32.0, 26.0, 20.0, 19.0, 17.0, 16.0, 13.0, 7.0, 13.0, 9.0, 2.0, 3.0, 1.0, 4.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010439157485961914, -0.0010119974613189697, -0.000980079174041748, -0.0009481608867645264, -0.0009162425994873047, -0.000884324312210083, -0.0008524060249328613, -0.0008204877376556396, -0.000788569450378418, -0.0007566511631011963, -0.0007247328758239746, -0.0006928145885467529, -0.0006608963012695312, -0.0006289780139923096, -0.0005970597267150879, -0.0005651414394378662, -0.0005332231521606445, -0.0005013048648834229, -0.00046938657760620117, -0.0004374682903289795, -0.0004055500030517578, -0.00037363171577453613, -0.00034171342849731445, -0.0003097951412200928, -0.0002778768539428711, -0.0002459585666656494, -0.00021404027938842773, -0.00018212199211120605, -0.00015020370483398438, -0.0001182854175567627, -8.636713027954102e-05, -5.4448843002319336e-05, -2.2530555725097656e-05, 9.387731552124023e-06, 4.13060188293457e-05, 7.322430610656738e-05, 0.00010514259338378906, 0.00013706088066101074, 0.00016897916793823242, 0.0002008974552154541, 0.00023281574249267578, 0.00026473402976989746, 0.00029665231704711914, 0.0003285706043243408, 0.0003604888916015625, 0.0003924071788787842, 0.00042432546615600586, 0.00045624375343322754, 0.0004881620407104492, 0.0005200803279876709, 0.0005519986152648926, 0.0005839169025421143, 0.0006158351898193359, 0.0006477534770965576, 0.0006796717643737793, 0.000711590051651001, 0.0007435083389282227, 0.0007754266262054443, 0.000807344913482666, 0.0008392632007598877, 0.0008711814880371094, 0.0009030997753143311, 0.0009350180625915527, 0.0009669363498687744, 0.000998854637145996]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 7.0, 11.0, 9.0, 6.0, 17.0, 6.0, 13.0, 18.0, 19.0, 22.0, 19.0, 29.0, 29.0, 22.0, 37.0, 32.0, 36.0, 50.0, 37.0, 40.0, 34.0, 54.0, 32.0, 39.0, 31.0, 24.0, 38.0, 33.0, 20.0, 32.0, 19.0, 29.0, 18.0, 16.0, 19.0, 16.0, 15.0, 14.0, 6.0, 8.0, 13.0, 5.0, 6.0, 4.0, 4.0, 2.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.70703125, -6.47802734375, -6.2490234375, -6.02001953125, -5.791015625, -5.56201171875, -5.3330078125, -5.10400390625, -4.875, -4.64599609375, -4.4169921875, -4.18798828125, -3.958984375, -3.72998046875, -3.5009765625, -3.27197265625, -3.04296875, -2.81396484375, -2.5849609375, -2.35595703125, -2.126953125, -1.89794921875, -1.6689453125, -1.43994140625, -1.2109375, -0.98193359375, -0.7529296875, -0.52392578125, -0.294921875, -0.06591796875, 0.1630859375, 0.39208984375, 0.62109375, 0.85009765625, 1.0791015625, 1.30810546875, 1.537109375, 1.76611328125, 1.9951171875, 2.22412109375, 2.453125, 2.68212890625, 2.9111328125, 3.14013671875, 3.369140625, 3.59814453125, 3.8271484375, 4.05615234375, 4.28515625, 4.51416015625, 4.7431640625, 4.97216796875, 5.201171875, 5.43017578125, 5.6591796875, 5.88818359375, 6.1171875, 6.34619140625, 6.5751953125, 6.80419921875, 7.033203125, 7.26220703125, 7.4912109375, 7.72021484375, 7.94921875]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 4.0, 11.0, 10.0, 14.0, 11.0, 22.0, 15.0, 29.0, 42.0, 51.0, 71.0, 97.0, 129.0, 199.0, 352.0, 583.0, 1165.0, 2466.0, 6013.0, 16936.0, 58012.0, 246051.0, 526306.0, 136032.0, 34655.0, 11072.0, 4110.0, 1844.0, 875.0, 475.0, 280.0, 165.0, 127.0, 85.0, 62.0, 37.0, 26.0, 29.0, 20.0, 11.0, 14.0, 14.0, 6.0, 8.0, 5.0, 4.0, 2.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.51171875, -6.28948974609375, -6.0672607421875, -5.84503173828125, -5.622802734375, -5.40057373046875, -5.1783447265625, -4.95611572265625, -4.73388671875, -4.51165771484375, -4.2894287109375, -4.06719970703125, -3.844970703125, -3.62274169921875, -3.4005126953125, -3.17828369140625, -2.9560546875, -2.73382568359375, -2.5115966796875, -2.28936767578125, -2.067138671875, -1.84490966796875, -1.6226806640625, -1.40045166015625, -1.17822265625, -0.95599365234375, -0.7337646484375, -0.51153564453125, -0.289306640625, -0.06707763671875, 0.1551513671875, 0.37738037109375, 0.599609375, 0.82183837890625, 1.0440673828125, 1.26629638671875, 1.488525390625, 1.71075439453125, 1.9329833984375, 2.15521240234375, 2.37744140625, 2.59967041015625, 2.8218994140625, 3.04412841796875, 3.266357421875, 3.48858642578125, 3.7108154296875, 3.93304443359375, 4.1552734375, 4.37750244140625, 4.5997314453125, 4.82196044921875, 5.044189453125, 5.26641845703125, 5.4886474609375, 5.71087646484375, 5.93310546875, 6.15533447265625, 6.3775634765625, 6.59979248046875, 6.822021484375, 7.04425048828125, 7.2664794921875, 7.48870849609375, 7.7109375]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 9.0, 11.0, 13.0, 9.0, 10.0, 17.0, 12.0, 28.0, 21.0, 20.0, 33.0, 31.0, 39.0, 33.0, 34.0, 41.0, 45.0, 89.0, 223.0, 1712.0, 145.0, 63.0, 40.0, 48.0, 30.0, 34.0, 37.0, 28.0, 20.0, 35.0, 19.0, 21.0, 21.0, 14.0, 10.0, 10.0, 8.0, 4.0, 5.0, 6.0, 6.0, 3.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.59375, -23.78271484375, -22.9716796875, -22.16064453125, -21.349609375, -20.53857421875, -19.7275390625, -18.91650390625, -18.10546875, -17.29443359375, -16.4833984375, -15.67236328125, -14.861328125, -14.05029296875, -13.2392578125, -12.42822265625, -11.6171875, -10.80615234375, -9.9951171875, -9.18408203125, -8.373046875, -7.56201171875, -6.7509765625, -5.93994140625, -5.12890625, -4.31787109375, -3.5068359375, -2.69580078125, -1.884765625, -1.07373046875, -0.2626953125, 0.54833984375, 1.359375, 2.17041015625, 2.9814453125, 3.79248046875, 4.603515625, 5.41455078125, 6.2255859375, 7.03662109375, 7.84765625, 8.65869140625, 9.4697265625, 10.28076171875, 11.091796875, 11.90283203125, 12.7138671875, 13.52490234375, 14.3359375, 15.14697265625, 15.9580078125, 16.76904296875, 17.580078125, 18.39111328125, 19.2021484375, 20.01318359375, 20.82421875, 21.63525390625, 22.4462890625, 23.25732421875, 24.068359375, 24.87939453125, 25.6904296875, 26.50146484375, 27.3125]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 8.0, 8.0, 14.0, 21.0, 35.0, 55.0, 114.0, 217.0, 408.0, 1358.0, 3123436.0, 18615.0, 721.0, 340.0, 156.0, 87.0, 46.0, 33.0, 18.0, 9.0, 5.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-138.0, -133.37109375, -128.7421875, -124.11328125, -119.484375, -114.85546875, -110.2265625, -105.59765625, -100.96875, -96.33984375, -91.7109375, -87.08203125, -82.453125, -77.82421875, -73.1953125, -68.56640625, -63.9375, -59.30859375, -54.6796875, -50.05078125, -45.421875, -40.79296875, -36.1640625, -31.53515625, -26.90625, -22.27734375, -17.6484375, -13.01953125, -8.390625, -3.76171875, 0.8671875, 5.49609375, 10.125, 14.75390625, 19.3828125, 24.01171875, 28.640625, 33.26953125, 37.8984375, 42.52734375, 47.15625, 51.78515625, 56.4140625, 61.04296875, 65.671875, 70.30078125, 74.9296875, 79.55859375, 84.1875, 88.81640625, 93.4453125, 98.07421875, 102.703125, 107.33203125, 111.9609375, 116.58984375, 121.21875, 125.84765625, 130.4765625, 135.10546875, 139.734375, 144.36328125, 148.9921875, 153.62109375, 158.25]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 11.0, 429.0, 560.0, 16.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.37947845458984, -62.586734771728516, -57.79398727416992, -53.001243591308594, -48.20849609375, -43.41575241088867, -38.623008728027344, -33.83026123046875, -29.037517547607422, -24.24477195739746, -19.4520263671875, -14.659282684326172, -9.866537094116211, -5.07379150390625, -0.2810478210449219, 4.511699676513672, 9.304443359375, 14.097188949584961, 18.889934539794922, 23.68267822265625, 28.47542381286621, 33.26816940307617, 38.0609130859375, 42.853660583496094, 47.64640426635742, 52.43914794921875, 57.231895446777344, 62.02463912963867, 66.8173828125, 71.6101303100586, 76.40287780761719, 81.19561767578125, 85.98835754394531, 90.7811050415039, 95.57384490966797, 100.36659240722656, 105.15933990478516, 109.95208740234375, 114.74482727050781, 119.5375747680664, 124.330322265625, 129.12306213378906, 133.9158172607422, 138.70855712890625, 143.5012969970703, 148.29405212402344, 153.0867919921875, 157.87954711914062, 162.67227172851562, 167.4650115966797, 172.2577667236328, 177.05050659179688, 181.84324645996094, 186.63600158691406, 191.42874145507812, 196.22149658203125, 201.0142364501953, 205.80697631835938, 210.5997314453125, 215.39247131347656, 220.18521118164062, 224.97796630859375, 229.7707061767578, 234.56344604492188, 239.356201171875]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 6.0, 10.0, 10.0, 9.0, 15.0, 19.0, 23.0, 29.0, 23.0, 25.0, 30.0, 29.0, 41.0, 41.0, 45.0, 36.0, 47.0, 41.0, 46.0, 46.0, 54.0, 53.0, 34.0, 45.0, 30.0, 21.0, 26.0, 22.0, 22.0, 26.0, 17.0, 15.0, 15.0, 12.0, 13.0, 6.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.66453552246094, -73.23259735107422, -70.80065155029297, -68.36871337890625, -65.936767578125, -63.504825592041016, -61.07288360595703, -58.64094543457031, -56.20899963378906, -53.77705764770508, -51.345115661621094, -48.91317367553711, -46.481231689453125, -44.04928970336914, -41.617347717285156, -39.18540954589844, -36.75346755981445, -34.32152557373047, -31.889583587646484, -29.4576416015625, -27.025699615478516, -24.59375762939453, -22.16181755065918, -19.729875564575195, -17.29793357849121, -14.865991592407227, -12.434049606323242, -10.002108573913574, -7.57016658782959, -5.1382246017456055, -2.7062835693359375, -0.2743415832519531, 2.1576004028320312, 4.589542388916016, 7.021483898162842, 9.453425407409668, 11.885367393493652, 14.317309379577637, 16.749250411987305, 19.18119239807129, 21.613134384155273, 24.045076370239258, 26.477018356323242, 28.908958435058594, 31.340900421142578, 33.77284240722656, 36.20478439331055, 38.63672637939453, 41.068668365478516, 43.5006103515625, 45.932552337646484, 48.36449432373047, 50.79643630981445, 53.22837829589844, 55.660316467285156, 58.092262268066406, 60.524200439453125, 62.95614242553711, 65.3880844116211, 67.82002258300781, 70.25196838378906, 72.68390655517578, 75.11585235595703, 77.54779052734375, 79.979736328125]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 7.0, 11.0, 6.0, 11.0, 10.0, 12.0, 11.0, 14.0, 19.0, 20.0, 23.0, 24.0, 18.0, 34.0, 42.0, 35.0, 34.0, 44.0, 52.0, 29.0, 45.0, 37.0, 37.0, 36.0, 37.0, 38.0, 36.0, 23.0, 26.0, 37.0, 24.0, 16.0, 21.0, 22.0, 19.0, 11.0, 11.0, 14.0, 11.0, 11.0, 7.0, 5.0, 3.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.05859375, -6.81732177734375, -6.5760498046875, -6.33477783203125, -6.093505859375, -5.85223388671875, -5.6109619140625, -5.36968994140625, -5.12841796875, -4.88714599609375, -4.6458740234375, -4.40460205078125, -4.163330078125, -3.92205810546875, -3.6807861328125, -3.43951416015625, -3.1982421875, -2.95697021484375, -2.7156982421875, -2.47442626953125, -2.233154296875, -1.99188232421875, -1.7506103515625, -1.50933837890625, -1.26806640625, -1.02679443359375, -0.7855224609375, -0.54425048828125, -0.302978515625, -0.06170654296875, 0.1795654296875, 0.42083740234375, 0.662109375, 0.90338134765625, 1.1446533203125, 1.38592529296875, 1.627197265625, 1.86846923828125, 2.1097412109375, 2.35101318359375, 2.59228515625, 2.83355712890625, 3.0748291015625, 3.31610107421875, 3.557373046875, 3.79864501953125, 4.0399169921875, 4.28118896484375, 4.5224609375, 4.76373291015625, 5.0050048828125, 5.24627685546875, 5.487548828125, 5.72882080078125, 5.9700927734375, 6.21136474609375, 6.45263671875, 6.69390869140625, 6.9351806640625, 7.17645263671875, 7.417724609375, 7.65899658203125, 7.9002685546875, 8.14154052734375, 8.3828125]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 10.0, 5.0, 15.0, 13.0, 12.0, 10.0, 18.0, 25.0, 26.0, 28.0, 34.0, 30.0, 42.0, 54.0, 63.0, 76.0, 110.0, 127.0, 240.0, 545.0, 1398.0, 5784.0, 50551.0, 897838.0, 2761164.0, 444690.0, 25146.0, 3832.0, 1080.0, 410.0, 201.0, 162.0, 115.0, 67.0, 62.0, 41.0, 39.0, 45.0, 28.0, 35.0, 21.0, 20.0, 19.0, 15.0, 6.0, 7.0, 8.0, 4.0, 4.0, 5.0, 4.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0], "bins": [-18.0625, -17.4677734375, -16.873046875, -16.2783203125, -15.68359375, -15.0888671875, -14.494140625, -13.8994140625, -13.3046875, -12.7099609375, -12.115234375, -11.5205078125, -10.92578125, -10.3310546875, -9.736328125, -9.1416015625, -8.546875, -7.9521484375, -7.357421875, -6.7626953125, -6.16796875, -5.5732421875, -4.978515625, -4.3837890625, -3.7890625, -3.1943359375, -2.599609375, -2.0048828125, -1.41015625, -0.8154296875, -0.220703125, 0.3740234375, 0.96875, 1.5634765625, 2.158203125, 2.7529296875, 3.34765625, 3.9423828125, 4.537109375, 5.1318359375, 5.7265625, 6.3212890625, 6.916015625, 7.5107421875, 8.10546875, 8.7001953125, 9.294921875, 9.8896484375, 10.484375, 11.0791015625, 11.673828125, 12.2685546875, 12.86328125, 13.4580078125, 14.052734375, 14.6474609375, 15.2421875, 15.8369140625, 16.431640625, 17.0263671875, 17.62109375, 18.2158203125, 18.810546875, 19.4052734375, 20.0]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 2.0, 3.0, 7.0, 8.0, 14.0, 18.0, 17.0, 27.0, 34.0, 36.0, 57.0, 84.0, 75.0, 89.0, 132.0, 150.0, 195.0, 264.0, 315.0, 387.0, 425.0, 397.0, 315.0, 236.0, 156.0, 145.0, 107.0, 81.0, 76.0, 40.0, 43.0, 39.0, 17.0, 22.0, 16.0, 17.0, 9.0, 4.0, 5.0, 5.0, 2.0, 0.0, 6.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-13.375, -12.97314453125, -12.5712890625, -12.16943359375, -11.767578125, -11.36572265625, -10.9638671875, -10.56201171875, -10.16015625, -9.75830078125, -9.3564453125, -8.95458984375, -8.552734375, -8.15087890625, -7.7490234375, -7.34716796875, -6.9453125, -6.54345703125, -6.1416015625, -5.73974609375, -5.337890625, -4.93603515625, -4.5341796875, -4.13232421875, -3.73046875, -3.32861328125, -2.9267578125, -2.52490234375, -2.123046875, -1.72119140625, -1.3193359375, -0.91748046875, -0.515625, -0.11376953125, 0.2880859375, 0.68994140625, 1.091796875, 1.49365234375, 1.8955078125, 2.29736328125, 2.69921875, 3.10107421875, 3.5029296875, 3.90478515625, 4.306640625, 4.70849609375, 5.1103515625, 5.51220703125, 5.9140625, 6.31591796875, 6.7177734375, 7.11962890625, 7.521484375, 7.92333984375, 8.3251953125, 8.72705078125, 9.12890625, 9.53076171875, 9.9326171875, 10.33447265625, 10.736328125, 11.13818359375, 11.5400390625, 11.94189453125, 12.34375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 6.0, 5.0, 3.0, 7.0, 12.0, 16.0, 16.0, 10.0, 25.0, 25.0, 38.0, 38.0, 52.0, 67.0, 89.0, 119.0, 137.0, 158.0, 180.0, 227.0, 375.0, 702.0, 6966.0, 3331977.0, 847734.0, 3061.0, 581.0, 372.0, 225.0, 195.0, 160.0, 135.0, 109.0, 97.0, 75.0, 69.0, 41.0, 35.0, 37.0, 25.0, 23.0, 13.0, 10.0, 6.0, 6.0, 8.0, 7.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-64.6875, -62.6591796875, -60.630859375, -58.6025390625, -56.57421875, -54.5458984375, -52.517578125, -50.4892578125, -48.4609375, -46.4326171875, -44.404296875, -42.3759765625, -40.34765625, -38.3193359375, -36.291015625, -34.2626953125, -32.234375, -30.2060546875, -28.177734375, -26.1494140625, -24.12109375, -22.0927734375, -20.064453125, -18.0361328125, -16.0078125, -13.9794921875, -11.951171875, -9.9228515625, -7.89453125, -5.8662109375, -3.837890625, -1.8095703125, 0.21875, 2.2470703125, 4.275390625, 6.3037109375, 8.33203125, 10.3603515625, 12.388671875, 14.4169921875, 16.4453125, 18.4736328125, 20.501953125, 22.5302734375, 24.55859375, 26.5869140625, 28.615234375, 30.6435546875, 32.671875, 34.7001953125, 36.728515625, 38.7568359375, 40.78515625, 42.8134765625, 44.841796875, 46.8701171875, 48.8984375, 50.9267578125, 52.955078125, 54.9833984375, 57.01171875, 59.0400390625, 61.068359375, 63.0966796875, 65.125]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 21.0, 126.0, 411.0, 346.0, 92.0, 18.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-148.4569854736328, -141.6826171875, -134.90823364257812, -128.13385009765625, -121.35948181152344, -114.5851058959961, -107.81072998046875, -101.0363540649414, -94.26197814941406, -87.48760223388672, -80.71322631835938, -73.93885040283203, -67.16447448730469, -60.390098571777344, -53.61572265625, -46.841346740722656, -40.06697082519531, -33.29259490966797, -26.518218994140625, -19.74384307861328, -12.969467163085938, -6.195091247558594, 0.57928466796875, 7.353660583496094, 14.128036499023438, 20.90241241455078, 27.676788330078125, 34.45116424560547, 41.22554016113281, 47.999916076660156, 54.7742919921875, 61.548667907714844, 68.32302856445312, 75.09740447998047, 81.87178039550781, 88.64615631103516, 95.4205322265625, 102.19490814208984, 108.96928405761719, 115.74365997314453, 122.51803588867188, 129.29241943359375, 136.06678771972656, 142.84115600585938, 149.61553955078125, 156.38992309570312, 163.16429138183594, 169.93865966796875, 176.71304321289062, 183.4874267578125, 190.2617950439453, 197.03616333007812, 203.810546875, 210.58493041992188, 217.3592987060547, 224.1336669921875, 230.90805053710938, 237.68243408203125, 244.45680236816406, 251.23117065429688, 258.00555419921875, 264.7799377441406, 271.5543212890625, 278.32867431640625, 285.1030578613281]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 3.0, 8.0, 7.0, 9.0, 15.0, 17.0, 15.0, 22.0, 9.0, 17.0, 28.0, 26.0, 28.0, 40.0, 50.0, 40.0, 43.0, 59.0, 47.0, 33.0, 58.0, 34.0, 39.0, 53.0, 39.0, 35.0, 32.0, 35.0, 21.0, 26.0, 21.0, 27.0, 14.0, 13.0, 3.0, 11.0, 3.0, 9.0, 5.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.80086135864258, -54.11524963378906, -52.42964172363281, -50.7440299987793, -49.05842208862305, -47.37281036376953, -45.68720245361328, -44.001590728759766, -42.31597900390625, -40.630367279052734, -38.944759368896484, -37.25914764404297, -35.57353973388672, -33.8879280090332, -32.20231628417969, -30.516708374023438, -28.831100463867188, -27.145490646362305, -25.459880828857422, -23.774269104003906, -22.088661193847656, -20.40304946899414, -18.717439651489258, -17.031829833984375, -15.346220016479492, -13.66061019897461, -11.975000381469727, -10.289389610290527, -8.603779792785645, -6.918169975280762, -5.2325592041015625, -3.5469493865966797, -1.8613357543945312, -0.17572569847106934, 1.5098843574523926, 3.1954946517944336, 4.881104469299316, 6.566714286804199, 8.252325057983398, 9.937934875488281, 11.623544692993164, 13.309154510498047, 14.99476432800293, 16.680374145507812, 18.365985870361328, 20.051593780517578, 21.737205505371094, 23.422815322875977, 25.10842514038086, 26.794034957885742, 28.479644775390625, 30.16525650024414, 31.85086441040039, 33.536476135253906, 35.222084045410156, 36.90769577026367, 38.59330749511719, 40.2789192199707, 41.96452713012695, 43.65013885498047, 45.33574676513672, 47.021358489990234, 48.70697021484375, 50.392578125, 52.07818603515625]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 7.0, 4.0, 8.0, 14.0, 9.0, 8.0, 9.0, 20.0, 16.0, 14.0, 23.0, 30.0, 14.0, 23.0, 44.0, 30.0, 30.0, 43.0, 28.0, 40.0, 46.0, 48.0, 38.0, 33.0, 39.0, 31.0, 37.0, 32.0, 26.0, 26.0, 29.0, 31.0, 16.0, 17.0, 21.0, 12.0, 11.0, 21.0, 14.0, 8.0, 13.0, 16.0, 6.0, 3.0, 2.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-7.4453125, -7.21331787109375, -6.9813232421875, -6.74932861328125, -6.517333984375, -6.28533935546875, -6.0533447265625, -5.82135009765625, -5.58935546875, -5.35736083984375, -5.1253662109375, -4.89337158203125, -4.661376953125, -4.42938232421875, -4.1973876953125, -3.96539306640625, -3.7333984375, -3.50140380859375, -3.2694091796875, -3.03741455078125, -2.805419921875, -2.57342529296875, -2.3414306640625, -2.10943603515625, -1.87744140625, -1.64544677734375, -1.4134521484375, -1.18145751953125, -0.949462890625, -0.71746826171875, -0.4854736328125, -0.25347900390625, -0.021484375, 0.21051025390625, 0.4425048828125, 0.67449951171875, 0.906494140625, 1.13848876953125, 1.3704833984375, 1.60247802734375, 1.83447265625, 2.06646728515625, 2.2984619140625, 2.53045654296875, 2.762451171875, 2.99444580078125, 3.2264404296875, 3.45843505859375, 3.6904296875, 3.92242431640625, 4.1544189453125, 4.38641357421875, 4.618408203125, 4.85040283203125, 5.0823974609375, 5.31439208984375, 5.54638671875, 5.77838134765625, 6.0103759765625, 6.24237060546875, 6.474365234375, 6.70635986328125, 6.9383544921875, 7.17034912109375, 7.40234375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 4.0, 9.0, 8.0, 12.0, 19.0, 24.0, 40.0, 62.0, 86.0, 130.0, 192.0, 234.0, 381.0, 444.0, 710.0, 1041.0, 1468.0, 2302.0, 3366.0, 4906.0, 7489.0, 11277.0, 16981.0, 25510.0, 39470.0, 60386.0, 92045.0, 139230.0, 195465.0, 151911.0, 100225.0, 66293.0, 42503.0, 28327.0, 18428.0, 12328.0, 8161.0, 5554.0, 3648.0, 2480.0, 1691.0, 1111.0, 797.0, 571.0, 386.0, 262.0, 188.0, 118.0, 83.0, 63.0, 46.0, 43.0, 19.0, 18.0, 9.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.0634765625, -1.0298309326171875, -0.996185302734375, -0.9625396728515625, -0.92889404296875, -0.8952484130859375, -0.861602783203125, -0.8279571533203125, -0.7943115234375, -0.7606658935546875, -0.727020263671875, -0.6933746337890625, -0.65972900390625, -0.6260833740234375, -0.592437744140625, -0.5587921142578125, -0.525146484375, -0.4915008544921875, -0.457855224609375, -0.4242095947265625, -0.39056396484375, -0.3569183349609375, -0.323272705078125, -0.2896270751953125, -0.2559814453125, -0.2223358154296875, -0.188690185546875, -0.1550445556640625, -0.12139892578125, -0.0877532958984375, -0.054107666015625, -0.0204620361328125, 0.01318359375, 0.0468292236328125, 0.080474853515625, 0.1141204833984375, 0.14776611328125, 0.1814117431640625, 0.215057373046875, 0.2487030029296875, 0.2823486328125, 0.3159942626953125, 0.349639892578125, 0.3832855224609375, 0.41693115234375, 0.4505767822265625, 0.484222412109375, 0.5178680419921875, 0.551513671875, 0.5851593017578125, 0.618804931640625, 0.6524505615234375, 0.68609619140625, 0.7197418212890625, 0.753387451171875, 0.7870330810546875, 0.8206787109375, 0.8543243408203125, 0.887969970703125, 0.9216156005859375, 0.95526123046875, 0.9889068603515625, 1.022552490234375, 1.0561981201171875, 1.08984375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 3.0, 2.0, 4.0, 12.0, 2.0, 8.0, 11.0, 14.0, 13.0, 16.0, 20.0, 20.0, 30.0, 36.0, 33.0, 37.0, 33.0, 31.0, 33.0, 45.0, 34.0, 39.0, 1064.0, 35.0, 48.0, 37.0, 45.0, 44.0, 32.0, 35.0, 40.0, 25.0, 22.0, 25.0, 14.0, 16.0, 17.0, 15.0, 8.0, 7.0, 5.0, 8.0, 1.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-5.26171875, -5.09674072265625, -4.9317626953125, -4.76678466796875, -4.601806640625, -4.43682861328125, -4.2718505859375, -4.10687255859375, -3.94189453125, -3.77691650390625, -3.6119384765625, -3.44696044921875, -3.281982421875, -3.11700439453125, -2.9520263671875, -2.78704833984375, -2.6220703125, -2.45709228515625, -2.2921142578125, -2.12713623046875, -1.962158203125, -1.79718017578125, -1.6322021484375, -1.46722412109375, -1.30224609375, -1.13726806640625, -0.9722900390625, -0.80731201171875, -0.642333984375, -0.47735595703125, -0.3123779296875, -0.14739990234375, 0.017578125, 0.18255615234375, 0.3475341796875, 0.51251220703125, 0.677490234375, 0.84246826171875, 1.0074462890625, 1.17242431640625, 1.33740234375, 1.50238037109375, 1.6673583984375, 1.83233642578125, 1.997314453125, 2.16229248046875, 2.3272705078125, 2.49224853515625, 2.6572265625, 2.82220458984375, 2.9871826171875, 3.15216064453125, 3.317138671875, 3.48211669921875, 3.6470947265625, 3.81207275390625, 3.97705078125, 4.14202880859375, 4.3070068359375, 4.47198486328125, 4.636962890625, 4.80194091796875, 4.9669189453125, 5.13189697265625, 5.296875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 12.0, 17.0, 11.0, 25.0, 22.0, 46.0, 67.0, 96.0, 118.0, 172.0, 281.0, 386.0, 549.0, 876.0, 1228.0, 1842.0, 2721.0, 3916.0, 5924.0, 8790.0, 13717.0, 20413.0, 31658.0, 48940.0, 76555.0, 118493.0, 184608.0, 1225779.0, 123189.0, 79653.0, 50835.0, 32636.0, 21406.0, 13997.0, 9264.0, 5967.0, 4159.0, 2756.0, 1897.0, 1333.0, 830.0, 622.0, 424.0, 272.0, 211.0, 137.0, 99.0, 61.0, 48.0, 29.0, 17.0, 15.0, 10.0, 3.0, 1.0, 4.0, 1.0, 3.0, 3.0, 1.0], "bins": [-0.9521484375, -0.921478271484375, -0.89080810546875, -0.860137939453125, -0.8294677734375, -0.798797607421875, -0.76812744140625, -0.737457275390625, -0.706787109375, -0.676116943359375, -0.64544677734375, -0.614776611328125, -0.5841064453125, -0.553436279296875, -0.52276611328125, -0.492095947265625, -0.46142578125, -0.430755615234375, -0.40008544921875, -0.369415283203125, -0.3387451171875, -0.308074951171875, -0.27740478515625, -0.246734619140625, -0.216064453125, -0.185394287109375, -0.15472412109375, -0.124053955078125, -0.0933837890625, -0.062713623046875, -0.03204345703125, -0.001373291015625, 0.029296875, 0.059967041015625, 0.09063720703125, 0.121307373046875, 0.1519775390625, 0.182647705078125, 0.21331787109375, 0.243988037109375, 0.274658203125, 0.305328369140625, 0.33599853515625, 0.366668701171875, 0.3973388671875, 0.428009033203125, 0.45867919921875, 0.489349365234375, 0.52001953125, 0.550689697265625, 0.58135986328125, 0.612030029296875, 0.6427001953125, 0.673370361328125, 0.70404052734375, 0.734710693359375, 0.765380859375, 0.796051025390625, 0.82672119140625, 0.857391357421875, 0.8880615234375, 0.918731689453125, 0.94940185546875, 0.980072021484375, 1.0107421875]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 3.0, 5.0, 6.0, 7.0, 9.0, 10.0, 16.0, 25.0, 25.0, 32.0, 27.0, 49.0, 49.0, 48.0, 48.0, 49.0, 63.0, 60.0, 63.0, 40.0, 56.0, 44.0, 48.0, 27.0, 38.0, 35.0, 19.0, 26.0, 12.0, 9.0, 12.0, 9.0, 3.0, 2.0, 7.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0017633438110351562, -0.0017117857933044434, -0.0016602277755737305, -0.0016086697578430176, -0.0015571117401123047, -0.0015055537223815918, -0.001453995704650879, -0.001402437686920166, -0.0013508796691894531, -0.0012993216514587402, -0.0012477636337280273, -0.0011962056159973145, -0.0011446475982666016, -0.0010930895805358887, -0.0010415315628051758, -0.0009899735450744629, -0.00093841552734375, -0.0008868575096130371, -0.0008352994918823242, -0.0007837414741516113, -0.0007321834564208984, -0.0006806254386901855, -0.0006290674209594727, -0.0005775094032287598, -0.0005259513854980469, -0.000474393367767334, -0.0004228353500366211, -0.0003712773323059082, -0.0003197193145751953, -0.0002681612968444824, -0.00021660327911376953, -0.00016504526138305664, -0.00011348724365234375, -6.192922592163086e-05, -1.0371208190917969e-05, 4.118680953979492e-05, 9.274482727050781e-05, 0.0001443028450012207, 0.0001958608627319336, 0.0002474188804626465, 0.0002989768981933594, 0.00035053491592407227, 0.00040209293365478516, 0.00045365095138549805, 0.0005052089691162109, 0.0005567669868469238, 0.0006083250045776367, 0.0006598830223083496, 0.0007114410400390625, 0.0007629990577697754, 0.0008145570755004883, 0.0008661150932312012, 0.0009176731109619141, 0.000969231128692627, 0.0010207891464233398, 0.0010723471641540527, 0.0011239051818847656, 0.0011754631996154785, 0.0012270212173461914, 0.0012785792350769043, 0.0013301372528076172, 0.00138169527053833, 0.001433253288269043, 0.0014848113059997559, 0.0015363693237304688]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 8.0, 0.0, 6.0, 3.0, 8.0, 5.0, 7.0, 8.0, 24.0, 24.0, 21.0, 31.0, 42.0, 39.0, 73.0, 82.0, 115.0, 178.0, 455.0, 2586.0, 1013602.0, 29722.0, 714.0, 263.0, 152.0, 87.0, 65.0, 51.0, 31.0, 28.0, 21.0, 23.0, 23.0, 10.0, 10.0, 9.0, 6.0, 6.0, 6.0, 4.0, 2.0, 3.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.03759765625, -0.036411285400390625, -0.03522491455078125, -0.034038543701171875, -0.0328521728515625, -0.031665802001953125, -0.03047943115234375, -0.029293060302734375, -0.028106689453125, -0.026920318603515625, -0.02573394775390625, -0.024547576904296875, -0.0233612060546875, -0.022174835205078125, -0.02098846435546875, -0.019802093505859375, -0.01861572265625, -0.017429351806640625, -0.01624298095703125, -0.015056610107421875, -0.0138702392578125, -0.012683868408203125, -0.01149749755859375, -0.010311126708984375, -0.009124755859375, -0.007938385009765625, -0.00675201416015625, -0.005565643310546875, -0.0043792724609375, -0.003192901611328125, -0.00200653076171875, -0.000820159912109375, 0.0003662109375, 0.001552581787109375, 0.00273895263671875, 0.003925323486328125, 0.0051116943359375, 0.006298065185546875, 0.00748443603515625, 0.008670806884765625, 0.009857177734375, 0.011043548583984375, 0.01222991943359375, 0.013416290283203125, 0.0146026611328125, 0.015789031982421875, 0.01697540283203125, 0.018161773681640625, 0.01934814453125, 0.020534515380859375, 0.02172088623046875, 0.022907257080078125, 0.0240936279296875, 0.025279998779296875, 0.02646636962890625, 0.027652740478515625, 0.028839111328125, 0.030025482177734375, 0.03121185302734375, 0.032398223876953125, 0.0335845947265625, 0.034770965576171875, 0.03595733642578125, 0.037143707275390625, 0.038330078125]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 12.0, 22.0, 29.0, 52.0, 92.0, 110.0, 144.0, 153.0, 156.0, 86.0, 69.0, 37.0, 24.0, 9.0, 6.0, 1.0, 1.0, 2.0, 3.0], "bins": [-0.002105479361489415, -0.002065099310129881, -0.0020247192587703466, -0.0019843392074108124, -0.0019439592724666, -0.0019035792211070657, -0.0018631991697475314, -0.0018228191183879972, -0.0017824391834437847, -0.0017420591320842505, -0.0017016790807247162, -0.0016612991457805037, -0.0016209190944209695, -0.0015805390430614352, -0.001540158991701901, -0.0014997789403423667, -0.0014593988889828324, -0.0014190188376232982, -0.001378638786263764, -0.0013382588513195515, -0.0012978787999600172, -0.001257498748600483, -0.0012171186972409487, -0.0011767386458814144, -0.0011363585945218801, -0.0010959785431623459, -0.0010555984918028116, -0.0010152185568585992, -0.0009748385054990649, -0.0009344584541395307, -0.0008940784027799964, -0.0008536983514204621, -0.0008133184164762497, -0.0007729383651167154, -0.0007325583719648421, -0.0006921783206053078, -0.0006517983274534345, -0.0006114182760939002, -0.0005710382247343659, -0.0005306581733748317, -0.0004902781220152974, -0.0004498980997595936, -0.0004095180775038898, -0.00036913802614435554, -0.00032875800388865173, -0.0002883779816329479, -0.00024799793027341366, -0.00020761790801770985, -0.0001672379148658365, -0.0001268578926101327, -8.647785580251366e-05, -4.609782627085224e-05, -5.717796739190817e-06, 3.466222551651299e-05, 7.504226232413203e-05, 0.00011542229913175106, 0.00015580232138745487, 0.00019618234364315867, 0.0002365623804507777, 0.00027694241725839674, 0.00031732243951410055, 0.00035770246176980436, 0.00039808248402550817, 0.00043846253538504243, 0.00047884255764074624]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 3.0, 4.0, 6.0, 6.0, 4.0, 15.0, 15.0, 8.0, 14.0, 17.0, 25.0, 20.0, 30.0, 21.0, 32.0, 25.0, 32.0, 39.0, 28.0, 36.0, 43.0, 36.0, 33.0, 34.0, 42.0, 39.0, 37.0, 37.0, 38.0, 31.0, 32.0, 30.0, 26.0, 24.0, 19.0, 20.0, 14.0, 10.0, 15.0, 10.0, 13.0, 8.0, 8.0, 7.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0007726550102233887, -0.0007470259442925453, -0.000721396878361702, -0.0006957678124308586, -0.0006701387465000153, -0.0006445096805691719, -0.0006188806146383286, -0.0005932515487074852, -0.0005676224827766418, -0.0005419934168457985, -0.0005163643509149551, -0.0004907352849841118, -0.00046510621905326843, -0.0004394771531224251, -0.0004138480871915817, -0.00038821902126073837, -0.000362589955329895, -0.00033696088939905167, -0.0003113318234682083, -0.00028570275753736496, -0.0002600736916065216, -0.00023444462567567825, -0.0002088155597448349, -0.00018318649381399155, -0.0001575574278831482, -0.00013192836195230484, -0.00010629929602146149, -8.067023009061813e-05, -5.504116415977478e-05, -2.9412098228931427e-05, -3.7830322980880737e-06, 2.184603363275528e-05, 4.747509956359863e-05, 7.310416549444199e-05, 9.873323142528534e-05, 0.0001243622973561287, 0.00014999136328697205, 0.0001756204292178154, 0.00020124949514865875, 0.0002268785610795021, 0.00025250762701034546, 0.0002781366929411888, 0.00030376575887203217, 0.0003293948248028755, 0.00035502389073371887, 0.0003806529566645622, 0.0004062820225954056, 0.00043191108852624893, 0.0004575401544570923, 0.00048316922038793564, 0.000508798286318779, 0.0005344273522496223, 0.0005600564181804657, 0.000585685484111309, 0.0006113145500421524, 0.0006369436159729958, 0.0006625726819038391, 0.0006882017478346825, 0.0007138308137655258, 0.0007394598796963692, 0.0007650889456272125, 0.0007907180115580559, 0.0008163470774888992, 0.0008419761434197426, 0.0008676052093505859]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 7.0, 4.0, 8.0, 14.0, 9.0, 8.0, 9.0, 20.0, 16.0, 14.0, 23.0, 30.0, 14.0, 23.0, 44.0, 30.0, 30.0, 43.0, 28.0, 40.0, 46.0, 48.0, 38.0, 33.0, 39.0, 31.0, 37.0, 32.0, 26.0, 26.0, 29.0, 31.0, 16.0, 17.0, 21.0, 12.0, 11.0, 21.0, 14.0, 8.0, 13.0, 16.0, 6.0, 3.0, 2.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-7.4453125, -7.21331787109375, -6.9813232421875, -6.74932861328125, -6.517333984375, -6.28533935546875, -6.0533447265625, -5.82135009765625, -5.58935546875, -5.35736083984375, -5.1253662109375, -4.89337158203125, -4.661376953125, -4.42938232421875, -4.1973876953125, -3.96539306640625, -3.7333984375, -3.50140380859375, -3.2694091796875, -3.03741455078125, -2.805419921875, -2.57342529296875, -2.3414306640625, -2.10943603515625, -1.87744140625, -1.64544677734375, -1.4134521484375, -1.18145751953125, -0.949462890625, -0.71746826171875, -0.4854736328125, -0.25347900390625, -0.021484375, 0.21051025390625, 0.4425048828125, 0.67449951171875, 0.906494140625, 1.13848876953125, 1.3704833984375, 1.60247802734375, 1.83447265625, 2.06646728515625, 2.2984619140625, 2.53045654296875, 2.762451171875, 2.99444580078125, 3.2264404296875, 3.45843505859375, 3.6904296875, 3.92242431640625, 4.1544189453125, 4.38641357421875, 4.618408203125, 4.85040283203125, 5.0823974609375, 5.31439208984375, 5.54638671875, 5.77838134765625, 6.0103759765625, 6.24237060546875, 6.474365234375, 6.70635986328125, 6.9383544921875, 7.17034912109375, 7.40234375]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 4.0, 5.0, 2.0, 7.0, 11.0, 5.0, 8.0, 16.0, 24.0, 25.0, 49.0, 61.0, 107.0, 175.0, 296.0, 493.0, 905.0, 1616.0, 2939.0, 5550.0, 10590.0, 22013.0, 53815.0, 155357.0, 431130.0, 229212.0, 76272.0, 29136.0, 13569.0, 6691.0, 3751.0, 2046.0, 1085.0, 611.0, 377.0, 237.0, 128.0, 73.0, 46.0, 30.0, 23.0, 23.0, 15.0, 9.0, 9.0, 6.0, 3.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.45703125, -5.28472900390625, -5.1124267578125, -4.94012451171875, -4.767822265625, -4.59552001953125, -4.4232177734375, -4.25091552734375, -4.07861328125, -3.90631103515625, -3.7340087890625, -3.56170654296875, -3.389404296875, -3.21710205078125, -3.0447998046875, -2.87249755859375, -2.7001953125, -2.52789306640625, -2.3555908203125, -2.18328857421875, -2.010986328125, -1.83868408203125, -1.6663818359375, -1.49407958984375, -1.32177734375, -1.14947509765625, -0.9771728515625, -0.80487060546875, -0.632568359375, -0.46026611328125, -0.2879638671875, -0.11566162109375, 0.056640625, 0.22894287109375, 0.4012451171875, 0.57354736328125, 0.745849609375, 0.91815185546875, 1.0904541015625, 1.26275634765625, 1.43505859375, 1.60736083984375, 1.7796630859375, 1.95196533203125, 2.124267578125, 2.29656982421875, 2.4688720703125, 2.64117431640625, 2.8134765625, 2.98577880859375, 3.1580810546875, 3.33038330078125, 3.502685546875, 3.67498779296875, 3.8472900390625, 4.01959228515625, 4.19189453125, 4.36419677734375, 4.5364990234375, 4.70880126953125, 4.881103515625, 5.05340576171875, 5.2257080078125, 5.39801025390625, 5.5703125]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 5.0, 3.0, 5.0, 5.0, 9.0, 14.0, 11.0, 7.0, 30.0, 19.0, 24.0, 26.0, 29.0, 34.0, 42.0, 41.0, 63.0, 63.0, 89.0, 337.0, 1687.0, 102.0, 50.0, 56.0, 50.0, 30.0, 28.0, 43.0, 34.0, 29.0, 14.0, 19.0, 12.0, 11.0, 9.0, 13.0, 4.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.4375, -25.462890625, -24.48828125, -23.513671875, -22.5390625, -21.564453125, -20.58984375, -19.615234375, -18.640625, -17.666015625, -16.69140625, -15.716796875, -14.7421875, -13.767578125, -12.79296875, -11.818359375, -10.84375, -9.869140625, -8.89453125, -7.919921875, -6.9453125, -5.970703125, -4.99609375, -4.021484375, -3.046875, -2.072265625, -1.09765625, -0.123046875, 0.8515625, 1.826171875, 2.80078125, 3.775390625, 4.75, 5.724609375, 6.69921875, 7.673828125, 8.6484375, 9.623046875, 10.59765625, 11.572265625, 12.546875, 13.521484375, 14.49609375, 15.470703125, 16.4453125, 17.419921875, 18.39453125, 19.369140625, 20.34375, 21.318359375, 22.29296875, 23.267578125, 24.2421875, 25.216796875, 26.19140625, 27.166015625, 28.140625, 29.115234375, 30.08984375, 31.064453125, 32.0390625, 33.013671875, 33.98828125, 34.962890625, 35.9375]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 4.0, 3.0, 5.0, 8.0, 13.0, 14.0, 21.0, 13.0, 22.0, 30.0, 55.0, 46.0, 87.0, 110.0, 156.0, 215.0, 336.0, 724.0, 10956.0, 3119198.0, 11748.0, 698.0, 362.0, 227.0, 179.0, 114.0, 72.0, 65.0, 45.0, 42.0, 37.0, 26.0, 11.0, 22.0, 12.0, 8.0, 5.0, 7.0, 3.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-85.0625, -82.732421875, -80.40234375, -78.072265625, -75.7421875, -73.412109375, -71.08203125, -68.751953125, -66.421875, -64.091796875, -61.76171875, -59.431640625, -57.1015625, -54.771484375, -52.44140625, -50.111328125, -47.78125, -45.451171875, -43.12109375, -40.791015625, -38.4609375, -36.130859375, -33.80078125, -31.470703125, -29.140625, -26.810546875, -24.48046875, -22.150390625, -19.8203125, -17.490234375, -15.16015625, -12.830078125, -10.5, -8.169921875, -5.83984375, -3.509765625, -1.1796875, 1.150390625, 3.48046875, 5.810546875, 8.140625, 10.470703125, 12.80078125, 15.130859375, 17.4609375, 19.791015625, 22.12109375, 24.451171875, 26.78125, 29.111328125, 31.44140625, 33.771484375, 36.1015625, 38.431640625, 40.76171875, 43.091796875, 45.421875, 47.751953125, 50.08203125, 52.412109375, 54.7421875, 57.072265625, 59.40234375, 61.732421875, 64.0625]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [3.0, 80.0, 740.0, 190.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.543399810791016, -7.847620487213135, -3.151841163635254, 1.5439376831054688, 6.239717483520508, 10.935497283935547, 15.631275177001953, 20.327056884765625, 25.02283477783203, 29.71861457824707, 34.41439437866211, 39.110172271728516, 43.80595397949219, 48.501731872558594, 53.197509765625, 57.89329147338867, 62.58906936645508, 67.28485107421875, 71.98062896728516, 76.67640686035156, 81.37218475341797, 86.06796264648438, 90.76374816894531, 95.45952606201172, 100.15530395507812, 104.85108184814453, 109.54685974121094, 114.24264526367188, 118.93842315673828, 123.63420104980469, 128.32998657226562, 133.0257568359375, 137.72154235839844, 142.41732788085938, 147.11309814453125, 151.8088836669922, 156.50465393066406, 161.200439453125, 165.89620971679688, 170.5919952392578, 175.28778076171875, 179.9835662841797, 184.67933654785156, 189.3751220703125, 194.07089233398438, 198.7666778564453, 203.46246337890625, 208.15823364257812, 212.85400390625, 217.54978942871094, 222.2455596923828, 226.94134521484375, 231.63711547851562, 236.33290100097656, 241.0286865234375, 245.72445678710938, 250.4202423095703, 255.11602783203125, 259.8117980957031, 264.507568359375, 269.203369140625, 273.8991394042969, 278.59490966796875, 283.29071044921875, 287.9864807128906]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 7.0, 2.0, 4.0, 3.0, 7.0, 7.0, 6.0, 7.0, 11.0, 13.0, 14.0, 11.0, 20.0, 27.0, 22.0, 28.0, 25.0, 37.0, 21.0, 45.0, 52.0, 44.0, 40.0, 36.0, 41.0, 44.0, 42.0, 44.0, 32.0, 45.0, 38.0, 26.0, 23.0, 20.0, 26.0, 15.0, 19.0, 9.0, 17.0, 4.0, 16.0, 5.0, 14.0, 6.0, 7.0, 6.0, 6.0, 3.0, 6.0, 4.0, 0.0, 3.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.086910247802734, -57.02975082397461, -54.97259521484375, -52.915435791015625, -50.8582763671875, -48.801116943359375, -46.74395751953125, -44.68680191040039, -42.629642486572266, -40.57248306274414, -38.51532745361328, -36.458168029785156, -34.40100860595703, -32.343849182128906, -30.286691665649414, -28.229534149169922, -26.172374725341797, -24.115215301513672, -22.05805778503418, -20.000900268554688, -17.943740844726562, -15.886582374572754, -13.829423904418945, -11.772265434265137, -9.715106964111328, -7.6579484939575195, -5.600790023803711, -3.5436315536499023, -1.4864730834960938, 0.5706853866577148, 2.6278438568115234, 4.685002326965332, 6.742156982421875, 8.799315452575684, 10.856473922729492, 12.9136323928833, 14.97079086303711, 17.027950286865234, 19.085107803344727, 21.14226531982422, 23.199424743652344, 25.25658416748047, 27.31374168395996, 29.370899200439453, 31.428058624267578, 33.4852180480957, 35.54237365722656, 37.59953308105469, 39.65669250488281, 41.71385192871094, 43.77101135253906, 45.82816696166992, 47.88532638549805, 49.94248580932617, 51.99964141845703, 54.056800842285156, 56.11396026611328, 58.171119689941406, 60.22827911376953, 62.28543472290039, 64.34259033203125, 66.39974975585938, 68.4569091796875, 70.51406860351562, 72.57122802734375]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 8.0, 6.0, 6.0, 7.0, 11.0, 13.0, 11.0, 17.0, 19.0, 11.0, 17.0, 20.0, 23.0, 33.0, 33.0, 30.0, 34.0, 34.0, 36.0, 34.0, 38.0, 45.0, 35.0, 38.0, 38.0, 44.0, 37.0, 21.0, 31.0, 29.0, 26.0, 22.0, 22.0, 13.0, 25.0, 17.0, 15.0, 16.0, 17.0, 10.0, 14.0, 12.0, 4.0, 12.0, 3.0, 5.0, 1.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-7.1875, -6.9527587890625, -6.718017578125, -6.4832763671875, -6.24853515625, -6.0137939453125, -5.779052734375, -5.5443115234375, -5.3095703125, -5.0748291015625, -4.840087890625, -4.6053466796875, -4.37060546875, -4.1358642578125, -3.901123046875, -3.6663818359375, -3.431640625, -3.1968994140625, -2.962158203125, -2.7274169921875, -2.49267578125, -2.2579345703125, -2.023193359375, -1.7884521484375, -1.5537109375, -1.3189697265625, -1.084228515625, -0.8494873046875, -0.61474609375, -0.3800048828125, -0.145263671875, 0.0894775390625, 0.32421875, 0.5589599609375, 0.793701171875, 1.0284423828125, 1.26318359375, 1.4979248046875, 1.732666015625, 1.9674072265625, 2.2021484375, 2.4368896484375, 2.671630859375, 2.9063720703125, 3.14111328125, 3.3758544921875, 3.610595703125, 3.8453369140625, 4.080078125, 4.3148193359375, 4.549560546875, 4.7843017578125, 5.01904296875, 5.2537841796875, 5.488525390625, 5.7232666015625, 5.9580078125, 6.1927490234375, 6.427490234375, 6.6622314453125, 6.89697265625, 7.1317138671875, 7.366455078125, 7.6011962890625, 7.8359375]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 4.0, 3.0, 4.0, 9.0, 7.0, 4.0, 8.0, 9.0, 18.0, 11.0, 15.0, 13.0, 13.0, 22.0, 23.0, 33.0, 35.0, 49.0, 89.0, 125.0, 225.0, 493.0, 1116.0, 3793.0, 23033.0, 526528.0, 3106704.0, 503074.0, 22602.0, 3756.0, 1207.0, 507.0, 254.0, 133.0, 67.0, 59.0, 39.0, 24.0, 26.0, 21.0, 12.0, 13.0, 15.0, 15.0, 17.0, 13.0, 11.0, 11.0, 9.0, 2.0, 5.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0], "bins": [-20.328125, -19.638916015625, -18.94970703125, -18.260498046875, -17.5712890625, -16.882080078125, -16.19287109375, -15.503662109375, -14.814453125, -14.125244140625, -13.43603515625, -12.746826171875, -12.0576171875, -11.368408203125, -10.67919921875, -9.989990234375, -9.30078125, -8.611572265625, -7.92236328125, -7.233154296875, -6.5439453125, -5.854736328125, -5.16552734375, -4.476318359375, -3.787109375, -3.097900390625, -2.40869140625, -1.719482421875, -1.0302734375, -0.341064453125, 0.34814453125, 1.037353515625, 1.7265625, 2.415771484375, 3.10498046875, 3.794189453125, 4.4833984375, 5.172607421875, 5.86181640625, 6.551025390625, 7.240234375, 7.929443359375, 8.61865234375, 9.307861328125, 9.9970703125, 10.686279296875, 11.37548828125, 12.064697265625, 12.75390625, 13.443115234375, 14.13232421875, 14.821533203125, 15.5107421875, 16.199951171875, 16.88916015625, 17.578369140625, 18.267578125, 18.956787109375, 19.64599609375, 20.335205078125, 21.0244140625, 21.713623046875, 22.40283203125, 23.092041015625, 23.78125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 5.0, 4.0, 8.0, 12.0, 22.0, 17.0, 11.0, 16.0, 22.0, 27.0, 36.0, 41.0, 70.0, 75.0, 66.0, 77.0, 112.0, 136.0, 172.0, 233.0, 243.0, 313.0, 346.0, 361.0, 318.0, 256.0, 195.0, 157.0, 129.0, 120.0, 88.0, 74.0, 57.0, 49.0, 35.0, 32.0, 28.0, 18.0, 9.0, 15.0, 19.0, 7.0, 10.0, 6.0, 9.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 4.0, 4.0], "bins": [-11.515625, -11.175537109375, -10.83544921875, -10.495361328125, -10.1552734375, -9.815185546875, -9.47509765625, -9.135009765625, -8.794921875, -8.454833984375, -8.11474609375, -7.774658203125, -7.4345703125, -7.094482421875, -6.75439453125, -6.414306640625, -6.07421875, -5.734130859375, -5.39404296875, -5.053955078125, -4.7138671875, -4.373779296875, -4.03369140625, -3.693603515625, -3.353515625, -3.013427734375, -2.67333984375, -2.333251953125, -1.9931640625, -1.653076171875, -1.31298828125, -0.972900390625, -0.6328125, -0.292724609375, 0.04736328125, 0.387451171875, 0.7275390625, 1.067626953125, 1.40771484375, 1.747802734375, 2.087890625, 2.427978515625, 2.76806640625, 3.108154296875, 3.4482421875, 3.788330078125, 4.12841796875, 4.468505859375, 4.80859375, 5.148681640625, 5.48876953125, 5.828857421875, 6.1689453125, 6.509033203125, 6.84912109375, 7.189208984375, 7.529296875, 7.869384765625, 8.20947265625, 8.549560546875, 8.8896484375, 9.229736328125, 9.56982421875, 9.909912109375, 10.25]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 4.0, 5.0, 5.0, 5.0, 6.0, 6.0, 16.0, 19.0, 19.0, 24.0, 25.0, 22.0, 42.0, 51.0, 49.0, 51.0, 86.0, 98.0, 134.0, 161.0, 157.0, 217.0, 304.0, 466.0, 2008.0, 217158.0, 3949513.0, 21029.0, 800.0, 377.0, 273.0, 202.0, 142.0, 148.0, 124.0, 87.0, 79.0, 75.0, 50.0, 46.0, 43.0, 35.0, 35.0, 27.0, 22.0, 8.0, 12.0, 10.0, 4.0, 4.0, 2.0, 3.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-60.84375, -58.83544921875, -56.8271484375, -54.81884765625, -52.810546875, -50.80224609375, -48.7939453125, -46.78564453125, -44.77734375, -42.76904296875, -40.7607421875, -38.75244140625, -36.744140625, -34.73583984375, -32.7275390625, -30.71923828125, -28.7109375, -26.70263671875, -24.6943359375, -22.68603515625, -20.677734375, -18.66943359375, -16.6611328125, -14.65283203125, -12.64453125, -10.63623046875, -8.6279296875, -6.61962890625, -4.611328125, -2.60302734375, -0.5947265625, 1.41357421875, 3.421875, 5.43017578125, 7.4384765625, 9.44677734375, 11.455078125, 13.46337890625, 15.4716796875, 17.47998046875, 19.48828125, 21.49658203125, 23.5048828125, 25.51318359375, 27.521484375, 29.52978515625, 31.5380859375, 33.54638671875, 35.5546875, 37.56298828125, 39.5712890625, 41.57958984375, 43.587890625, 45.59619140625, 47.6044921875, 49.61279296875, 51.62109375, 53.62939453125, 55.6376953125, 57.64599609375, 59.654296875, 61.66259765625, 63.6708984375, 65.67919921875, 67.6875]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 7.0, 13.0, 29.0, 41.0, 64.0, 95.0, 113.0, 134.0, 123.0, 112.0, 78.0, 85.0, 51.0, 32.0, 13.0, 9.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.03321838378906, -68.19615936279297, -66.35910034179688, -64.52204132080078, -62.68497848510742, -60.84791946411133, -59.010860443115234, -57.17380142211914, -55.33673858642578, -53.49967956542969, -51.662620544433594, -49.8255615234375, -47.98849868774414, -46.15143966674805, -44.31438064575195, -42.47732162475586, -40.640262603759766, -38.80320358276367, -36.96614456176758, -35.12908172607422, -33.292022705078125, -31.45496368408203, -29.617904663085938, -27.780845642089844, -25.943784713745117, -24.106725692749023, -22.269664764404297, -20.432605743408203, -18.59554672241211, -16.758485794067383, -14.921426773071289, -13.084366798400879, -11.247306823730469, -9.410246849060059, -7.573187351226807, -5.736127853393555, -3.8990678787231445, -2.0620079040527344, -0.22494888305664062, 1.6121110916137695, 3.4491710662841797, 5.28623104095459, 7.123290538787842, 8.960350036621094, 10.797410011291504, 12.634469985961914, 14.471529006958008, 16.308589935302734, 18.145648956298828, 19.982707977294922, 21.81976890563965, 23.656827926635742, 25.49388885498047, 27.330947875976562, 29.168006896972656, 31.00506591796875, 32.842124938964844, 34.67918395996094, 36.51624298095703, 38.353302001953125, 40.190364837646484, 42.02742385864258, 43.86448287963867, 45.701541900634766, 47.538604736328125]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 7.0, 4.0, 10.0, 14.0, 3.0, 20.0, 16.0, 14.0, 21.0, 27.0, 25.0, 35.0, 37.0, 38.0, 33.0, 38.0, 46.0, 39.0, 43.0, 36.0, 49.0, 32.0, 32.0, 34.0, 38.0, 38.0, 31.0, 32.0, 26.0, 30.0, 24.0, 18.0, 22.0, 24.0, 17.0, 14.0, 7.0, 6.0, 11.0, 7.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-49.86654281616211, -48.255897521972656, -46.6452522277832, -45.03460693359375, -43.42396545410156, -41.81332015991211, -40.202674865722656, -38.5920295715332, -36.98138427734375, -35.3707389831543, -33.760093688964844, -32.149452209472656, -30.538806915283203, -28.92816162109375, -27.317516326904297, -25.706871032714844, -24.096229553222656, -22.485584259033203, -20.874940872192383, -19.26429557800293, -17.65365219116211, -16.043006896972656, -14.432361602783203, -12.821717262268066, -11.21107292175293, -9.600428581237793, -7.989783763885498, -6.379138946533203, -4.768494606018066, -3.1578502655029297, -1.5472049713134766, 0.06343936920166016, 1.6740798950195312, 3.284724473953247, 4.895369052886963, 6.506013870239258, 8.116658210754395, 9.727302551269531, 11.337947845458984, 12.948592185974121, 14.559236526489258, 16.16988182067871, 17.78052520751953, 19.391170501708984, 21.001815795898438, 22.612459182739258, 24.22310447692871, 25.83374786376953, 27.444393157958984, 29.055038452148438, 30.665681838989258, 32.276329040527344, 33.88697052001953, 35.497615814208984, 37.10826110839844, 38.71890640258789, 40.329551696777344, 41.9401969909668, 43.55084228515625, 45.16148376464844, 46.77212905883789, 48.382774353027344, 49.9934196472168, 51.60406494140625, 53.21470642089844]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 1.0, 10.0, 7.0, 11.0, 8.0, 14.0, 13.0, 16.0, 12.0, 15.0, 21.0, 20.0, 31.0, 14.0, 22.0, 25.0, 31.0, 26.0, 27.0, 49.0, 36.0, 44.0, 35.0, 34.0, 38.0, 36.0, 37.0, 53.0, 33.0, 24.0, 26.0, 22.0, 26.0, 25.0, 31.0, 16.0, 21.0, 10.0, 15.0, 16.0, 8.0, 9.0, 5.0, 7.0, 7.0, 2.0, 3.0, 2.0, 7.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-7.1328125, -6.90472412109375, -6.6766357421875, -6.44854736328125, -6.220458984375, -5.99237060546875, -5.7642822265625, -5.53619384765625, -5.30810546875, -5.08001708984375, -4.8519287109375, -4.62384033203125, -4.395751953125, -4.16766357421875, -3.9395751953125, -3.71148681640625, -3.4833984375, -3.25531005859375, -3.0272216796875, -2.79913330078125, -2.571044921875, -2.34295654296875, -2.1148681640625, -1.88677978515625, -1.65869140625, -1.43060302734375, -1.2025146484375, -0.97442626953125, -0.746337890625, -0.51824951171875, -0.2901611328125, -0.06207275390625, 0.166015625, 0.39410400390625, 0.6221923828125, 0.85028076171875, 1.078369140625, 1.30645751953125, 1.5345458984375, 1.76263427734375, 1.99072265625, 2.21881103515625, 2.4468994140625, 2.67498779296875, 2.903076171875, 3.13116455078125, 3.3592529296875, 3.58734130859375, 3.8154296875, 4.04351806640625, 4.2716064453125, 4.49969482421875, 4.727783203125, 4.95587158203125, 5.1839599609375, 5.41204833984375, 5.64013671875, 5.86822509765625, 6.0963134765625, 6.32440185546875, 6.552490234375, 6.78057861328125, 7.0086669921875, 7.23675537109375, 7.46484375]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 6.0, 13.0, 23.0, 32.0, 42.0, 86.0, 137.0, 189.0, 354.0, 583.0, 912.0, 1400.0, 2046.0, 3268.0, 4979.0, 7319.0, 11651.0, 18109.0, 28930.0, 46520.0, 76119.0, 128777.0, 216045.0, 198711.0, 116524.0, 69437.0, 42427.0, 26546.0, 16667.0, 10708.0, 7053.0, 4737.0, 2914.0, 1954.0, 1221.0, 780.0, 499.0, 291.0, 202.0, 127.0, 79.0, 52.0, 35.0, 16.0, 17.0, 7.0, 4.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.2578125, -1.2207183837890625, -1.183624267578125, -1.1465301513671875, -1.10943603515625, -1.0723419189453125, -1.035247802734375, -0.9981536865234375, -0.9610595703125, -0.9239654541015625, -0.886871337890625, -0.8497772216796875, -0.81268310546875, -0.7755889892578125, -0.738494873046875, -0.7014007568359375, -0.664306640625, -0.6272125244140625, -0.590118408203125, -0.5530242919921875, -0.51593017578125, -0.4788360595703125, -0.441741943359375, -0.4046478271484375, -0.3675537109375, -0.3304595947265625, -0.293365478515625, -0.2562713623046875, -0.21917724609375, -0.1820831298828125, -0.144989013671875, -0.1078948974609375, -0.07080078125, -0.0337066650390625, 0.003387451171875, 0.0404815673828125, 0.07757568359375, 0.1146697998046875, 0.151763916015625, 0.1888580322265625, 0.2259521484375, 0.2630462646484375, 0.300140380859375, 0.3372344970703125, 0.37432861328125, 0.4114227294921875, 0.448516845703125, 0.4856109619140625, 0.522705078125, 0.5597991943359375, 0.596893310546875, 0.6339874267578125, 0.67108154296875, 0.7081756591796875, 0.745269775390625, 0.7823638916015625, 0.8194580078125, 0.8565521240234375, 0.893646240234375, 0.9307403564453125, 0.96783447265625, 1.0049285888671875, 1.042022705078125, 1.0791168212890625, 1.1162109375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 12.0, 13.0, 17.0, 15.0, 20.0, 21.0, 23.0, 20.0, 33.0, 34.0, 38.0, 46.0, 48.0, 40.0, 42.0, 43.0, 40.0, 1066.0, 56.0, 45.0, 42.0, 34.0, 30.0, 42.0, 29.0, 32.0, 23.0, 24.0, 20.0, 10.0, 21.0, 5.0, 11.0, 6.0, 8.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.640625, -5.46484375, -5.2890625, -5.11328125, -4.9375, -4.76171875, -4.5859375, -4.41015625, -4.234375, -4.05859375, -3.8828125, -3.70703125, -3.53125, -3.35546875, -3.1796875, -3.00390625, -2.828125, -2.65234375, -2.4765625, -2.30078125, -2.125, -1.94921875, -1.7734375, -1.59765625, -1.421875, -1.24609375, -1.0703125, -0.89453125, -0.71875, -0.54296875, -0.3671875, -0.19140625, -0.015625, 0.16015625, 0.3359375, 0.51171875, 0.6875, 0.86328125, 1.0390625, 1.21484375, 1.390625, 1.56640625, 1.7421875, 1.91796875, 2.09375, 2.26953125, 2.4453125, 2.62109375, 2.796875, 2.97265625, 3.1484375, 3.32421875, 3.5, 3.67578125, 3.8515625, 4.02734375, 4.203125, 4.37890625, 4.5546875, 4.73046875, 4.90625, 5.08203125, 5.2578125, 5.43359375, 5.609375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 10.0, 12.0, 8.0, 20.0, 39.0, 39.0, 76.0, 111.0, 153.0, 216.0, 326.0, 516.0, 819.0, 1269.0, 2003.0, 3180.0, 4893.0, 7964.0, 12811.0, 20387.0, 32579.0, 53967.0, 89005.0, 146293.0, 1264745.0, 176899.0, 107427.0, 65455.0, 39849.0, 24527.0, 15296.0, 9637.0, 6050.0, 3790.0, 2446.0, 1513.0, 963.0, 616.0, 450.0, 271.0, 171.0, 129.0, 71.0, 50.0, 28.0, 23.0, 15.0, 7.0, 7.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1279296875, -1.09234619140625, -1.0567626953125, -1.02117919921875, -0.985595703125, -0.95001220703125, -0.9144287109375, -0.87884521484375, -0.84326171875, -0.80767822265625, -0.7720947265625, -0.73651123046875, -0.700927734375, -0.66534423828125, -0.6297607421875, -0.59417724609375, -0.55859375, -0.52301025390625, -0.4874267578125, -0.45184326171875, -0.416259765625, -0.38067626953125, -0.3450927734375, -0.30950927734375, -0.27392578125, -0.23834228515625, -0.2027587890625, -0.16717529296875, -0.131591796875, -0.09600830078125, -0.0604248046875, -0.02484130859375, 0.0107421875, 0.04632568359375, 0.0819091796875, 0.11749267578125, 0.153076171875, 0.18865966796875, 0.2242431640625, 0.25982666015625, 0.29541015625, 0.33099365234375, 0.3665771484375, 0.40216064453125, 0.437744140625, 0.47332763671875, 0.5089111328125, 0.54449462890625, 0.580078125, 0.61566162109375, 0.6512451171875, 0.68682861328125, 0.722412109375, 0.75799560546875, 0.7935791015625, 0.82916259765625, 0.86474609375, 0.90032958984375, 0.9359130859375, 0.97149658203125, 1.007080078125, 1.04266357421875, 1.0782470703125, 1.11383056640625, 1.1494140625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 7.0, 4.0, 5.0, 11.0, 9.0, 15.0, 15.0, 14.0, 30.0, 30.0, 33.0, 52.0, 43.0, 37.0, 50.0, 49.0, 63.0, 51.0, 52.0, 56.0, 44.0, 52.0, 31.0, 41.0, 31.0, 21.0, 26.0, 20.0, 29.0, 15.0, 14.0, 7.0, 12.0, 8.0, 2.0, 4.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0], "bins": [-0.001979827880859375, -0.0019268542528152466, -0.0018738806247711182, -0.0018209069967269897, -0.0017679333686828613, -0.001714959740638733, -0.0016619861125946045, -0.001609012484550476, -0.0015560388565063477, -0.0015030652284622192, -0.0014500916004180908, -0.0013971179723739624, -0.001344144344329834, -0.0012911707162857056, -0.0012381970882415771, -0.0011852234601974487, -0.0011322498321533203, -0.001079276204109192, -0.0010263025760650635, -0.0009733289480209351, -0.0009203553199768066, -0.0008673816919326782, -0.0008144080638885498, -0.0007614344358444214, -0.000708460807800293, -0.0006554871797561646, -0.0006025135517120361, -0.0005495399236679077, -0.0004965662956237793, -0.0004435926675796509, -0.00039061903953552246, -0.00033764541149139404, -0.0002846717834472656, -0.0002316981554031372, -0.0001787245273590088, -0.00012575089931488037, -7.277727127075195e-05, -1.9803643226623535e-05, 3.316998481750488e-05, 8.61436128616333e-05, 0.00013911724090576172, 0.00019209086894989014, 0.00024506449699401855, 0.00029803812503814697, 0.0003510117530822754, 0.0004039853811264038, 0.0004569590091705322, 0.0005099326372146606, 0.0005629062652587891, 0.0006158798933029175, 0.0006688535213470459, 0.0007218271493911743, 0.0007748007774353027, 0.0008277744054794312, 0.0008807480335235596, 0.000933721661567688, 0.0009866952896118164, 0.0010396689176559448, 0.0010926425457000732, 0.0011456161737442017, 0.00119858980178833, 0.0012515634298324585, 0.001304537057876587, 0.0013575106859207153, 0.0014104843139648438]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 5.0, 2.0, 6.0, 8.0, 8.0, 12.0, 10.0, 14.0, 23.0, 27.0, 25.0, 32.0, 39.0, 49.0, 82.0, 113.0, 153.0, 411.0, 1812.0, 1029906.0, 14499.0, 617.0, 211.0, 126.0, 90.0, 61.0, 47.0, 29.0, 34.0, 19.0, 18.0, 15.0, 8.0, 8.0, 9.0, 5.0, 1.0, 6.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.03765869140625, -0.03629875183105469, -0.034938812255859375, -0.03357887268066406, -0.03221893310546875, -0.030858993530273438, -0.029499053955078125, -0.028139114379882812, -0.0267791748046875, -0.025419235229492188, -0.024059295654296875, -0.022699356079101562, -0.02133941650390625, -0.019979476928710938, -0.018619537353515625, -0.017259597778320312, -0.015899658203125, -0.014539718627929688, -0.013179779052734375, -0.011819839477539062, -0.01045989990234375, -0.009099960327148438, -0.007740020751953125, -0.0063800811767578125, -0.0050201416015625, -0.0036602020263671875, -0.002300262451171875, -0.0009403228759765625, 0.00041961669921875, 0.0017795562744140625, 0.003139495849609375, 0.0044994354248046875, 0.005859375, 0.0072193145751953125, 0.008579254150390625, 0.009939193725585938, 0.01129913330078125, 0.012659072875976562, 0.014019012451171875, 0.015378952026367188, 0.0167388916015625, 0.018098831176757812, 0.019458770751953125, 0.020818710327148438, 0.02217864990234375, 0.023538589477539062, 0.024898529052734375, 0.026258468627929688, 0.027618408203125, 0.028978347778320312, 0.030338287353515625, 0.03169822692871094, 0.03305816650390625, 0.03441810607910156, 0.035778045654296875, 0.03713798522949219, 0.0384979248046875, 0.03985786437988281, 0.041217803955078125, 0.04257774353027344, 0.04393768310546875, 0.04529762268066406, 0.046657562255859375, 0.04801750183105469, 0.04937744140625]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 5.0, 62.0, 463.0, 423.0, 62.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006158868200145662, -0.00046125007793307304, -0.00030661336495541036, -0.00015197665197774768, 2.6600901037454605e-06, 0.0001572968321852386, 0.0003119335160590708, 0.0004665703163482249, 0.0006212070002220571, 0.0007758437423035502, 0.0009304804261773825, 0.0010851172264665365, 0.0012397539103403687, 0.001394390594214201, 0.001549027394503355, 0.001703664194792509, 0.0018583007622510195, 0.0020129375625401735, 0.002167574129998684, 0.002322210930287838, 0.002476847730576992, 0.002631484530866146, 0.0027861210983246565, 0.0029407578986138105, 0.0030953946989029646, 0.0032500314991921186, 0.003404668066650629, 0.003559304866939783, 0.003713941667228937, 0.003868578467518091, 0.004023214802145958, 0.004177851602435112, 0.004332488868385553, 0.004487125668674707, 0.0046417624689638615, 0.004796398803591728, 0.004951035603880882, 0.005105672404170036, 0.00526030920445919, 0.005414946004748344, 0.0055695828050374985, 0.0057242196053266525, 0.005878856405615807, 0.006033493205904961, 0.006188129540532827, 0.006342766340821981, 0.0064974031411111355, 0.0066520399414002895, 0.006806676276028156, 0.00696131307631731, 0.007115949876606464, 0.0072705866768956184, 0.007425223011523485, 0.007579859811812639, 0.007734496612101793, 0.00788913294672966, 0.008043770678341389, 0.008198407478630543, 0.008353044278919697, 0.00850768107920885, 0.008662317879498005, 0.008816954679787159, 0.008971590548753738, 0.009126227349042892, 0.009280864149332047]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 11.0, 10.0, 8.0, 8.0, 13.0, 13.0, 12.0, 21.0, 19.0, 25.0, 23.0, 34.0, 27.0, 35.0, 37.0, 39.0, 45.0, 44.0, 50.0, 41.0, 38.0, 32.0, 39.0, 32.0, 32.0, 36.0, 27.0, 32.0, 33.0, 36.0, 21.0, 31.0, 17.0, 16.0, 12.0, 14.0, 12.0, 9.0, 5.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00106126070022583, -0.0010304655879735947, -0.0009996704757213593, -0.0009688753634691238, -0.0009380802512168884, -0.000907285138964653, -0.0008764900267124176, -0.0008456949144601822, -0.0008148998022079468, -0.0007841046899557114, -0.000753309577703476, -0.0007225144654512405, -0.0006917193531990051, -0.0006609242409467697, -0.0006301291286945343, -0.0005993340164422989, -0.0005685389041900635, -0.0005377437919378281, -0.0005069486796855927, -0.00047615356743335724, -0.0004453584551811218, -0.0004145633429288864, -0.000383768230676651, -0.0003529731184244156, -0.0003221780061721802, -0.00029138289391994476, -0.00026058778166770935, -0.00022979266941547394, -0.00019899755716323853, -0.0001682024449110031, -0.0001374073326587677, -0.00010661222040653229, -7.581710815429688e-05, -4.502199590206146e-05, -1.422688364982605e-05, 1.6568228602409363e-05, 4.7363340854644775e-05, 7.815845310688019e-05, 0.0001089535653591156, 0.000139748677611351, 0.00017054378986358643, 0.00020133890211582184, 0.00023213401436805725, 0.00026292912662029266, 0.0002937242388725281, 0.0003245193511247635, 0.0003553144633769989, 0.0003861095756292343, 0.0004169046878814697, 0.00044769980013370514, 0.00047849491238594055, 0.000509290024638176, 0.0005400851368904114, 0.0005708802491426468, 0.0006016753613948822, 0.0006324704736471176, 0.000663265585899353, 0.0006940606981515884, 0.0007248558104038239, 0.0007556509226560593, 0.0007864460349082947, 0.0008172411471605301, 0.0008480362594127655, 0.0008788313716650009, 0.0009096264839172363]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 1.0, 10.0, 7.0, 11.0, 8.0, 14.0, 13.0, 16.0, 12.0, 15.0, 21.0, 20.0, 31.0, 14.0, 23.0, 24.0, 31.0, 26.0, 27.0, 49.0, 36.0, 44.0, 35.0, 34.0, 38.0, 36.0, 37.0, 53.0, 33.0, 24.0, 26.0, 22.0, 26.0, 25.0, 31.0, 16.0, 21.0, 10.0, 15.0, 16.0, 8.0, 9.0, 5.0, 7.0, 7.0, 2.0, 3.0, 2.0, 7.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-7.1328125, -6.90472412109375, -6.6766357421875, -6.44854736328125, -6.220458984375, -5.99237060546875, -5.7642822265625, -5.53619384765625, -5.30810546875, -5.08001708984375, -4.8519287109375, -4.62384033203125, -4.395751953125, -4.16766357421875, -3.9395751953125, -3.71148681640625, -3.4833984375, -3.25531005859375, -3.0272216796875, -2.79913330078125, -2.571044921875, -2.34295654296875, -2.1148681640625, -1.88677978515625, -1.65869140625, -1.43060302734375, -1.2025146484375, -0.97442626953125, -0.746337890625, -0.51824951171875, -0.2901611328125, -0.06207275390625, 0.166015625, 0.39410400390625, 0.6221923828125, 0.85028076171875, 1.078369140625, 1.30645751953125, 1.5345458984375, 1.76263427734375, 1.99072265625, 2.21881103515625, 2.4468994140625, 2.67498779296875, 2.903076171875, 3.13116455078125, 3.3592529296875, 3.58734130859375, 3.8154296875, 4.04351806640625, 4.2716064453125, 4.49969482421875, 4.727783203125, 4.95587158203125, 5.1839599609375, 5.41204833984375, 5.64013671875, 5.86822509765625, 6.0963134765625, 6.32440185546875, 6.552490234375, 6.78057861328125, 7.0086669921875, 7.23675537109375, 7.46484375]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 3.0, 6.0, 4.0, 8.0, 9.0, 11.0, 9.0, 22.0, 25.0, 39.0, 46.0, 69.0, 74.0, 91.0, 109.0, 172.0, 248.0, 421.0, 791.0, 1592.0, 3644.0, 8697.0, 23064.0, 61624.0, 180445.0, 477799.0, 186153.0, 63537.0, 23431.0, 8879.0, 3679.0, 1649.0, 831.0, 435.0, 290.0, 151.0, 133.0, 90.0, 50.0, 53.0, 35.0, 28.0, 19.0, 22.0, 17.0, 12.0, 16.0, 10.0, 8.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.953125, -6.717529296875, -6.48193359375, -6.246337890625, -6.0107421875, -5.775146484375, -5.53955078125, -5.303955078125, -5.068359375, -4.832763671875, -4.59716796875, -4.361572265625, -4.1259765625, -3.890380859375, -3.65478515625, -3.419189453125, -3.18359375, -2.947998046875, -2.71240234375, -2.476806640625, -2.2412109375, -2.005615234375, -1.77001953125, -1.534423828125, -1.298828125, -1.063232421875, -0.82763671875, -0.592041015625, -0.3564453125, -0.120849609375, 0.11474609375, 0.350341796875, 0.5859375, 0.821533203125, 1.05712890625, 1.292724609375, 1.5283203125, 1.763916015625, 1.99951171875, 2.235107421875, 2.470703125, 2.706298828125, 2.94189453125, 3.177490234375, 3.4130859375, 3.648681640625, 3.88427734375, 4.119873046875, 4.35546875, 4.591064453125, 4.82666015625, 5.062255859375, 5.2978515625, 5.533447265625, 5.76904296875, 6.004638671875, 6.240234375, 6.475830078125, 6.71142578125, 6.947021484375, 7.1826171875, 7.418212890625, 7.65380859375, 7.889404296875, 8.125]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 5.0, 6.0, 2.0, 7.0, 9.0, 13.0, 9.0, 11.0, 20.0, 18.0, 23.0, 23.0, 36.0, 27.0, 30.0, 42.0, 52.0, 53.0, 54.0, 136.0, 1710.0, 260.0, 79.0, 61.0, 50.0, 33.0, 44.0, 38.0, 26.0, 27.0, 22.0, 19.0, 17.0, 16.0, 12.0, 15.0, 10.0, 12.0, 6.0, 8.0, 5.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-27.390625, -26.57861328125, -25.7666015625, -24.95458984375, -24.142578125, -23.33056640625, -22.5185546875, -21.70654296875, -20.89453125, -20.08251953125, -19.2705078125, -18.45849609375, -17.646484375, -16.83447265625, -16.0224609375, -15.21044921875, -14.3984375, -13.58642578125, -12.7744140625, -11.96240234375, -11.150390625, -10.33837890625, -9.5263671875, -8.71435546875, -7.90234375, -7.09033203125, -6.2783203125, -5.46630859375, -4.654296875, -3.84228515625, -3.0302734375, -2.21826171875, -1.40625, -0.59423828125, 0.2177734375, 1.02978515625, 1.841796875, 2.65380859375, 3.4658203125, 4.27783203125, 5.08984375, 5.90185546875, 6.7138671875, 7.52587890625, 8.337890625, 9.14990234375, 9.9619140625, 10.77392578125, 11.5859375, 12.39794921875, 13.2099609375, 14.02197265625, 14.833984375, 15.64599609375, 16.4580078125, 17.27001953125, 18.08203125, 18.89404296875, 19.7060546875, 20.51806640625, 21.330078125, 22.14208984375, 22.9541015625, 23.76611328125, 24.578125]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 3.0, 5.0, 3.0, 6.0, 11.0, 8.0, 12.0, 12.0, 25.0, 25.0, 35.0, 37.0, 31.0, 46.0, 57.0, 107.0, 94.0, 183.0, 251.0, 472.0, 801.0, 2646.0, 459542.0, 2674891.0, 3939.0, 1030.0, 488.0, 254.0, 167.0, 108.0, 89.0, 58.0, 57.0, 42.0, 38.0, 19.0, 33.0, 13.0, 11.0, 10.0, 11.0, 8.0, 9.0, 8.0, 4.0, 1.0, 2.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-61.40625, -59.5498046875, -57.693359375, -55.8369140625, -53.98046875, -52.1240234375, -50.267578125, -48.4111328125, -46.5546875, -44.6982421875, -42.841796875, -40.9853515625, -39.12890625, -37.2724609375, -35.416015625, -33.5595703125, -31.703125, -29.8466796875, -27.990234375, -26.1337890625, -24.27734375, -22.4208984375, -20.564453125, -18.7080078125, -16.8515625, -14.9951171875, -13.138671875, -11.2822265625, -9.42578125, -7.5693359375, -5.712890625, -3.8564453125, -2.0, -0.1435546875, 1.712890625, 3.5693359375, 5.42578125, 7.2822265625, 9.138671875, 10.9951171875, 12.8515625, 14.7080078125, 16.564453125, 18.4208984375, 20.27734375, 22.1337890625, 23.990234375, 25.8466796875, 27.703125, 29.5595703125, 31.416015625, 33.2724609375, 35.12890625, 36.9853515625, 38.841796875, 40.6982421875, 42.5546875, 44.4111328125, 46.267578125, 48.1240234375, 49.98046875, 51.8369140625, 53.693359375, 55.5498046875, 57.40625]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 68.0, 672.0, 260.0, 13.0, 1.0, 2.0], "bins": [-266.497802734375, -262.031005859375, -257.5642395019531, -253.09744262695312, -248.6306610107422, -244.16387939453125, -239.69708251953125, -235.2303009033203, -230.76351928710938, -226.29673767089844, -221.8299560546875, -217.3631591796875, -212.89637756347656, -208.42959594726562, -203.96279907226562, -199.4960174560547, -195.02923583984375, -190.5624542236328, -186.09567260742188, -181.62887573242188, -177.16209411621094, -172.6953125, -168.228515625, -163.76173400878906, -159.29495239257812, -154.8281707763672, -150.36138916015625, -145.89459228515625, -141.4278106689453, -136.96102905273438, -132.49423217773438, -128.02745056152344, -123.56065368652344, -119.0938720703125, -114.62708282470703, -110.16029357910156, -105.69351196289062, -101.22673034667969, -96.75994110107422, -92.29315185546875, -87.82637023925781, -83.35958862304688, -78.8927993774414, -74.42601013183594, -69.959228515625, -65.49244689941406, -61.025657653808594, -56.55887222290039, -52.09208679199219, -47.625301361083984, -43.15851593017578, -38.69173049926758, -34.224945068359375, -29.758159637451172, -25.29137420654297, -20.824588775634766, -16.357803344726562, -11.89101791381836, -7.424232482910156, -2.957447052001953, 1.50933837890625, 5.976123809814453, 10.442909240722656, 14.90969467163086, 19.376480102539062]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 3.0, 4.0, 5.0, 4.0, 7.0, 8.0, 12.0, 8.0, 13.0, 16.0, 17.0, 12.0, 13.0, 22.0, 23.0, 34.0, 32.0, 34.0, 42.0, 28.0, 44.0, 39.0, 35.0, 38.0, 27.0, 41.0, 36.0, 40.0, 38.0, 36.0, 32.0, 37.0, 28.0, 29.0, 23.0, 16.0, 15.0, 22.0, 16.0, 14.0, 15.0, 13.0, 7.0, 10.0, 8.0, 8.0, 0.0, 1.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0], "bins": [-67.62173461914062, -65.60232543945312, -63.582908630371094, -61.56349563598633, -59.54408264160156, -57.5246696472168, -55.50525665283203, -53.485843658447266, -51.4664306640625, -49.447017669677734, -47.42760467529297, -45.4081916809082, -43.38877868652344, -41.36936569213867, -39.349952697753906, -37.33053970336914, -35.311126708984375, -33.29171371459961, -31.272300720214844, -29.252887725830078, -27.233474731445312, -25.214061737060547, -23.19464874267578, -21.175235748291016, -19.15582275390625, -17.136409759521484, -15.116996765136719, -13.097583770751953, -11.078170776367188, -9.058757781982422, -7.039344787597656, -5.019931793212891, -3.0005264282226562, -0.9811134338378906, 1.038299560546875, 3.0577125549316406, 5.077125549316406, 7.096538543701172, 9.115951538085938, 11.135364532470703, 13.154777526855469, 15.174190521240234, 17.193603515625, 19.213016510009766, 21.23242950439453, 23.251842498779297, 25.271255493164062, 27.290668487548828, 29.310081481933594, 31.32949447631836, 33.348907470703125, 35.36832046508789, 37.387733459472656, 39.40714645385742, 41.42655944824219, 43.44597244262695, 45.46538543701172, 47.484798431396484, 49.50421142578125, 51.523624420166016, 53.54303741455078, 55.56245040893555, 57.58186340332031, 59.60127639770508, 61.620689392089844]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 7.0, 7.0, 8.0, 11.0, 7.0, 10.0, 16.0, 15.0, 15.0, 20.0, 26.0, 20.0, 28.0, 19.0, 30.0, 28.0, 31.0, 32.0, 38.0, 57.0, 49.0, 40.0, 37.0, 36.0, 37.0, 27.0, 41.0, 38.0, 29.0, 23.0, 28.0, 25.0, 29.0, 17.0, 18.0, 18.0, 14.0, 12.0, 9.0, 12.0, 9.0, 6.0, 4.0, 5.0, 3.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-8.015625, -7.764892578125, -7.51416015625, -7.263427734375, -7.0126953125, -6.761962890625, -6.51123046875, -6.260498046875, -6.009765625, -5.759033203125, -5.50830078125, -5.257568359375, -5.0068359375, -4.756103515625, -4.50537109375, -4.254638671875, -4.00390625, -3.753173828125, -3.50244140625, -3.251708984375, -3.0009765625, -2.750244140625, -2.49951171875, -2.248779296875, -1.998046875, -1.747314453125, -1.49658203125, -1.245849609375, -0.9951171875, -0.744384765625, -0.49365234375, -0.242919921875, 0.0078125, 0.258544921875, 0.50927734375, 0.760009765625, 1.0107421875, 1.261474609375, 1.51220703125, 1.762939453125, 2.013671875, 2.264404296875, 2.51513671875, 2.765869140625, 3.0166015625, 3.267333984375, 3.51806640625, 3.768798828125, 4.01953125, 4.270263671875, 4.52099609375, 4.771728515625, 5.0224609375, 5.273193359375, 5.52392578125, 5.774658203125, 6.025390625, 6.276123046875, 6.52685546875, 6.777587890625, 7.0283203125, 7.279052734375, 7.52978515625, 7.780517578125, 8.03125]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 8.0, 3.0, 2.0, 7.0, 4.0, 10.0, 9.0, 12.0, 10.0, 21.0, 18.0, 31.0, 24.0, 44.0, 49.0, 68.0, 58.0, 120.0, 180.0, 311.0, 768.0, 2952.0, 25932.0, 1128912.0, 2921941.0, 103854.0, 6368.0, 1316.0, 465.0, 227.0, 136.0, 92.0, 59.0, 57.0, 38.0, 32.0, 33.0, 20.0, 21.0, 13.0, 14.0, 9.0, 7.0, 10.0, 6.0, 5.0, 2.0, 3.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-26.0, -25.166748046875, -24.33349609375, -23.500244140625, -22.6669921875, -21.833740234375, -21.00048828125, -20.167236328125, -19.333984375, -18.500732421875, -17.66748046875, -16.834228515625, -16.0009765625, -15.167724609375, -14.33447265625, -13.501220703125, -12.66796875, -11.834716796875, -11.00146484375, -10.168212890625, -9.3349609375, -8.501708984375, -7.66845703125, -6.835205078125, -6.001953125, -5.168701171875, -4.33544921875, -3.502197265625, -2.6689453125, -1.835693359375, -1.00244140625, -0.169189453125, 0.6640625, 1.497314453125, 2.33056640625, 3.163818359375, 3.9970703125, 4.830322265625, 5.66357421875, 6.496826171875, 7.330078125, 8.163330078125, 8.99658203125, 9.829833984375, 10.6630859375, 11.496337890625, 12.32958984375, 13.162841796875, 13.99609375, 14.829345703125, 15.66259765625, 16.495849609375, 17.3291015625, 18.162353515625, 18.99560546875, 19.828857421875, 20.662109375, 21.495361328125, 22.32861328125, 23.161865234375, 23.9951171875, 24.828369140625, 25.66162109375, 26.494873046875, 27.328125]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 5.0, 10.0, 9.0, 5.0, 15.0, 23.0, 26.0, 45.0, 62.0, 98.0, 146.0, 172.0, 280.0, 433.0, 586.0, 653.0, 511.0, 344.0, 230.0, 137.0, 95.0, 58.0, 48.0, 34.0, 19.0, 12.0, 6.0, 6.0, 4.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.34375, -18.72314453125, -18.1025390625, -17.48193359375, -16.861328125, -16.24072265625, -15.6201171875, -14.99951171875, -14.37890625, -13.75830078125, -13.1376953125, -12.51708984375, -11.896484375, -11.27587890625, -10.6552734375, -10.03466796875, -9.4140625, -8.79345703125, -8.1728515625, -7.55224609375, -6.931640625, -6.31103515625, -5.6904296875, -5.06982421875, -4.44921875, -3.82861328125, -3.2080078125, -2.58740234375, -1.966796875, -1.34619140625, -0.7255859375, -0.10498046875, 0.515625, 1.13623046875, 1.7568359375, 2.37744140625, 2.998046875, 3.61865234375, 4.2392578125, 4.85986328125, 5.48046875, 6.10107421875, 6.7216796875, 7.34228515625, 7.962890625, 8.58349609375, 9.2041015625, 9.82470703125, 10.4453125, 11.06591796875, 11.6865234375, 12.30712890625, 12.927734375, 13.54833984375, 14.1689453125, 14.78955078125, 15.41015625, 16.03076171875, 16.6513671875, 17.27197265625, 17.892578125, 18.51318359375, 19.1337890625, 19.75439453125, 20.375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 7.0, 6.0, 14.0, 4.0, 19.0, 40.0, 43.0, 68.0, 91.0, 125.0, 201.0, 224.0, 370.0, 638.0, 5900.0, 4141783.0, 42478.0, 881.0, 359.0, 241.0, 190.0, 140.0, 122.0, 114.0, 64.0, 50.0, 42.0, 22.0, 8.0, 9.0, 17.0, 5.0, 6.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-111.6875, -108.2666015625, -104.845703125, -101.4248046875, -98.00390625, -94.5830078125, -91.162109375, -87.7412109375, -84.3203125, -80.8994140625, -77.478515625, -74.0576171875, -70.63671875, -67.2158203125, -63.794921875, -60.3740234375, -56.953125, -53.5322265625, -50.111328125, -46.6904296875, -43.26953125, -39.8486328125, -36.427734375, -33.0068359375, -29.5859375, -26.1650390625, -22.744140625, -19.3232421875, -15.90234375, -12.4814453125, -9.060546875, -5.6396484375, -2.21875, 1.2021484375, 4.623046875, 8.0439453125, 11.46484375, 14.8857421875, 18.306640625, 21.7275390625, 25.1484375, 28.5693359375, 31.990234375, 35.4111328125, 38.83203125, 42.2529296875, 45.673828125, 49.0947265625, 52.515625, 55.9365234375, 59.357421875, 62.7783203125, 66.19921875, 69.6201171875, 73.041015625, 76.4619140625, 79.8828125, 83.3037109375, 86.724609375, 90.1455078125, 93.56640625, 96.9873046875, 100.408203125, 103.8291015625, 107.25]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 27.0, 186.0, 464.0, 275.0, 48.0, 11.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-360.4863586425781, -353.8907470703125, -347.2951354980469, -340.69952392578125, -334.1039123535156, -327.50830078125, -320.9126892089844, -314.31707763671875, -307.72149658203125, -301.1258850097656, -294.5302734375, -287.9346618652344, -281.33905029296875, -274.7434387207031, -268.1478271484375, -261.55224609375, -254.95660400390625, -248.36099243164062, -241.765380859375, -235.16976928710938, -228.57415771484375, -221.97854614257812, -215.38294982910156, -208.78733825683594, -202.1917266845703, -195.5961151123047, -189.00050354003906, -182.40489196777344, -175.80929565429688, -169.21368408203125, -162.61807250976562, -156.0224609375, -149.42684936523438, -142.83123779296875, -136.23562622070312, -129.6400146484375, -123.0444107055664, -116.44879913330078, -109.85319519042969, -103.25758361816406, -96.66197204589844, -90.06636047363281, -83.47074890136719, -76.8751449584961, -70.27953338623047, -63.683921813964844, -57.088314056396484, -50.492706298828125, -43.897090911865234, -37.301483154296875, -30.70587158203125, -24.110261917114258, -17.514652252197266, -10.91904067993164, -4.323432922363281, 2.272174835205078, 8.867786407470703, 15.463396072387695, 22.059005737304688, 28.65461540222168, 35.25022506713867, 41.8458366394043, 48.441444396972656, 55.037052154541016, 61.63266372680664]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 1.0, 5.0, 6.0, 8.0, 11.0, 8.0, 10.0, 12.0, 13.0, 16.0, 26.0, 25.0, 33.0, 28.0, 28.0, 32.0, 37.0, 50.0, 35.0, 39.0, 36.0, 40.0, 53.0, 36.0, 54.0, 36.0, 30.0, 33.0, 34.0, 26.0, 34.0, 25.0, 16.0, 18.0, 16.0, 21.0, 12.0, 15.0, 5.0, 15.0, 7.0, 5.0, 7.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-49.81153106689453, -48.25680923461914, -46.70208740234375, -45.147361755371094, -43.5926399230957, -42.03791809082031, -40.48319625854492, -38.92847442626953, -37.37375259399414, -35.81903076171875, -34.26430892944336, -32.70958709716797, -31.154863357543945, -29.600139617919922, -28.04541778564453, -26.49069595336914, -24.935972213745117, -23.381250381469727, -21.826526641845703, -20.271804809570312, -18.717082977294922, -17.16236114501953, -15.607637405395508, -14.052915573120117, -12.49819278717041, -10.943470001220703, -9.388748168945312, -7.8340253829956055, -6.279303073883057, -4.724580764770508, -3.169857978820801, -1.6151361465454102, -0.060413360595703125, 1.4943090677261353, 3.0490314960479736, 4.603754043579102, 6.15847635269165, 7.713198661804199, 9.267921447753906, 10.822643280029297, 12.377366065979004, 13.932088851928711, 15.486810684204102, 17.041534423828125, 18.596256256103516, 20.150978088378906, 21.705699920654297, 23.260421752929688, 24.81514549255371, 26.3698673248291, 27.924591064453125, 29.479312896728516, 31.034034729003906, 32.5887565612793, 34.14347839355469, 35.698204040527344, 37.252925872802734, 38.807647705078125, 40.362369537353516, 41.917091369628906, 43.47181701660156, 45.02653884887695, 46.581260681152344, 48.135982513427734, 49.690704345703125]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 5.0, 3.0, 1.0, 5.0, 8.0, 17.0, 5.0, 11.0, 11.0, 14.0, 19.0, 22.0, 22.0, 23.0, 20.0, 16.0, 28.0, 27.0, 44.0, 30.0, 51.0, 40.0, 39.0, 49.0, 38.0, 37.0, 51.0, 41.0, 23.0, 33.0, 37.0, 28.0, 27.0, 22.0, 19.0, 25.0, 15.0, 20.0, 15.0, 14.0, 13.0, 5.0, 3.0, 6.0, 5.0, 5.0, 3.0, 6.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.55859375, -7.30609130859375, -7.0535888671875, -6.80108642578125, -6.548583984375, -6.29608154296875, -6.0435791015625, -5.79107666015625, -5.53857421875, -5.28607177734375, -5.0335693359375, -4.78106689453125, -4.528564453125, -4.27606201171875, -4.0235595703125, -3.77105712890625, -3.5185546875, -3.26605224609375, -3.0135498046875, -2.76104736328125, -2.508544921875, -2.25604248046875, -2.0035400390625, -1.75103759765625, -1.49853515625, -1.24603271484375, -0.9935302734375, -0.74102783203125, -0.488525390625, -0.23602294921875, 0.0164794921875, 0.26898193359375, 0.521484375, 0.77398681640625, 1.0264892578125, 1.27899169921875, 1.531494140625, 1.78399658203125, 2.0364990234375, 2.28900146484375, 2.54150390625, 2.79400634765625, 3.0465087890625, 3.29901123046875, 3.551513671875, 3.80401611328125, 4.0565185546875, 4.30902099609375, 4.5615234375, 4.81402587890625, 5.0665283203125, 5.31903076171875, 5.571533203125, 5.82403564453125, 6.0765380859375, 6.32904052734375, 6.58154296875, 6.83404541015625, 7.0865478515625, 7.33905029296875, 7.591552734375, 7.84405517578125, 8.0965576171875, 8.34906005859375, 8.6015625]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 1.0, 3.0, 8.0, 6.0, 10.0, 16.0, 39.0, 49.0, 71.0, 126.0, 187.0, 268.0, 437.0, 655.0, 1101.0, 1552.0, 2450.0, 3772.0, 5810.0, 9110.0, 14171.0, 22815.0, 35903.0, 59225.0, 97962.0, 166807.0, 228347.0, 156867.0, 91926.0, 55897.0, 33845.0, 21248.0, 13515.0, 8735.0, 5437.0, 3464.0, 2368.0, 1555.0, 1053.0, 609.0, 400.0, 281.0, 140.0, 115.0, 76.0, 51.0, 26.0, 23.0, 13.0, 11.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1806640625, -1.141876220703125, -1.10308837890625, -1.064300537109375, -1.0255126953125, -0.986724853515625, -0.94793701171875, -0.909149169921875, -0.870361328125, -0.831573486328125, -0.79278564453125, -0.753997802734375, -0.7152099609375, -0.676422119140625, -0.63763427734375, -0.598846435546875, -0.56005859375, -0.521270751953125, -0.48248291015625, -0.443695068359375, -0.4049072265625, -0.366119384765625, -0.32733154296875, -0.288543701171875, -0.249755859375, -0.210968017578125, -0.17218017578125, -0.133392333984375, -0.0946044921875, -0.055816650390625, -0.01702880859375, 0.021759033203125, 0.060546875, 0.099334716796875, 0.13812255859375, 0.176910400390625, 0.2156982421875, 0.254486083984375, 0.29327392578125, 0.332061767578125, 0.370849609375, 0.409637451171875, 0.44842529296875, 0.487213134765625, 0.5260009765625, 0.564788818359375, 0.60357666015625, 0.642364501953125, 0.68115234375, 0.719940185546875, 0.75872802734375, 0.797515869140625, 0.8363037109375, 0.875091552734375, 0.91387939453125, 0.952667236328125, 0.991455078125, 1.030242919921875, 1.06903076171875, 1.107818603515625, 1.1466064453125, 1.185394287109375, 1.22418212890625, 1.262969970703125, 1.3017578125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 5.0, 7.0, 2.0, 6.0, 5.0, 5.0, 15.0, 12.0, 11.0, 19.0, 25.0, 19.0, 30.0, 33.0, 31.0, 40.0, 34.0, 42.0, 49.0, 39.0, 34.0, 1058.0, 38.0, 51.0, 36.0, 39.0, 35.0, 41.0, 28.0, 34.0, 35.0, 28.0, 27.0, 13.0, 14.0, 19.0, 15.0, 11.0, 12.0, 7.0, 5.0, 6.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 3.0], "bins": [-5.69921875, -5.528564453125, -5.35791015625, -5.187255859375, -5.0166015625, -4.845947265625, -4.67529296875, -4.504638671875, -4.333984375, -4.163330078125, -3.99267578125, -3.822021484375, -3.6513671875, -3.480712890625, -3.31005859375, -3.139404296875, -2.96875, -2.798095703125, -2.62744140625, -2.456787109375, -2.2861328125, -2.115478515625, -1.94482421875, -1.774169921875, -1.603515625, -1.432861328125, -1.26220703125, -1.091552734375, -0.9208984375, -0.750244140625, -0.57958984375, -0.408935546875, -0.23828125, -0.067626953125, 0.10302734375, 0.273681640625, 0.4443359375, 0.614990234375, 0.78564453125, 0.956298828125, 1.126953125, 1.297607421875, 1.46826171875, 1.638916015625, 1.8095703125, 1.980224609375, 2.15087890625, 2.321533203125, 2.4921875, 2.662841796875, 2.83349609375, 3.004150390625, 3.1748046875, 3.345458984375, 3.51611328125, 3.686767578125, 3.857421875, 4.028076171875, 4.19873046875, 4.369384765625, 4.5400390625, 4.710693359375, 4.88134765625, 5.052001953125, 5.22265625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 8.0, 6.0, 4.0, 14.0, 22.0, 39.0, 58.0, 84.0, 130.0, 221.0, 334.0, 547.0, 824.0, 1359.0, 2305.0, 3755.0, 6182.0, 10427.0, 17941.0, 30189.0, 52425.0, 90520.0, 160765.0, 1297047.0, 179307.0, 101854.0, 58141.0, 33698.0, 19725.0, 11744.0, 6865.0, 4118.0, 2455.0, 1469.0, 933.0, 608.0, 348.0, 234.0, 162.0, 88.0, 65.0, 42.0, 26.0, 19.0, 14.0, 6.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.267578125, -1.2261505126953125, -1.184722900390625, -1.1432952880859375, -1.10186767578125, -1.0604400634765625, -1.019012451171875, -0.9775848388671875, -0.9361572265625, -0.8947296142578125, -0.853302001953125, -0.8118743896484375, -0.77044677734375, -0.7290191650390625, -0.687591552734375, -0.6461639404296875, -0.604736328125, -0.5633087158203125, -0.521881103515625, -0.4804534912109375, -0.43902587890625, -0.3975982666015625, -0.356170654296875, -0.3147430419921875, -0.2733154296875, -0.2318878173828125, -0.190460205078125, -0.1490325927734375, -0.10760498046875, -0.0661773681640625, -0.024749755859375, 0.0166778564453125, 0.05810546875, 0.0995330810546875, 0.140960693359375, 0.1823883056640625, 0.22381591796875, 0.2652435302734375, 0.306671142578125, 0.3480987548828125, 0.3895263671875, 0.4309539794921875, 0.472381591796875, 0.5138092041015625, 0.55523681640625, 0.5966644287109375, 0.638092041015625, 0.6795196533203125, 0.720947265625, 0.7623748779296875, 0.803802490234375, 0.8452301025390625, 0.88665771484375, 0.9280853271484375, 0.969512939453125, 1.0109405517578125, 1.0523681640625, 1.0937957763671875, 1.135223388671875, 1.1766510009765625, 1.21807861328125, 1.2595062255859375, 1.300933837890625, 1.3423614501953125, 1.3837890625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 6.0, 9.0, 5.0, 8.0, 15.0, 17.0, 17.0, 20.0, 25.0, 40.0, 35.0, 34.0, 43.0, 52.0, 50.0, 62.0, 51.0, 62.0, 54.0, 63.0, 41.0, 42.0, 36.0, 35.0, 19.0, 28.0, 17.0, 17.0, 12.0, 11.0, 21.0, 11.0, 9.0, 5.0, 6.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0016422271728515625, -0.0015890896320343018, -0.001535952091217041, -0.0014828145503997803, -0.0014296770095825195, -0.0013765394687652588, -0.001323401927947998, -0.0012702643871307373, -0.0012171268463134766, -0.0011639893054962158, -0.001110851764678955, -0.0010577142238616943, -0.0010045766830444336, -0.0009514391422271729, -0.0008983016014099121, -0.0008451640605926514, -0.0007920265197753906, -0.0007388889789581299, -0.0006857514381408691, -0.0006326138973236084, -0.0005794763565063477, -0.0005263388156890869, -0.00047320127487182617, -0.00042006373405456543, -0.0003669261932373047, -0.00031378865242004395, -0.0002606511116027832, -0.00020751357078552246, -0.00015437602996826172, -0.00010123848915100098, -4.8100948333740234e-05, 5.036592483520508e-06, 5.817413330078125e-05, 0.00011131167411804199, 0.00016444921493530273, 0.00021758675575256348, 0.0002707242965698242, 0.00032386183738708496, 0.0003769993782043457, 0.00043013691902160645, 0.0004832744598388672, 0.0005364120006561279, 0.0005895495414733887, 0.0006426870822906494, 0.0006958246231079102, 0.0007489621639251709, 0.0008020997047424316, 0.0008552372455596924, 0.0009083747863769531, 0.0009615123271942139, 0.0010146498680114746, 0.0010677874088287354, 0.001120924949645996, 0.0011740624904632568, 0.0012272000312805176, 0.0012803375720977783, 0.001333475112915039, 0.0013866126537322998, 0.0014397501945495605, 0.0014928877353668213, 0.001546025276184082, 0.0015991628170013428, 0.0016523003578186035, 0.0017054378986358643, 0.001758575439453125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 4.0, 1.0, 4.0, 6.0, 9.0, 9.0, 18.0, 17.0, 17.0, 15.0, 31.0, 44.0, 44.0, 50.0, 77.0, 115.0, 177.0, 452.0, 2042.0, 1024301.0, 19655.0, 685.0, 263.0, 136.0, 81.0, 55.0, 55.0, 32.0, 33.0, 30.0, 13.0, 19.0, 13.0, 10.0, 14.0, 3.0, 8.0, 3.0, 3.0, 0.0, 6.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.045623779296875, -0.04427003860473633, -0.042916297912597656, -0.041562557220458984, -0.04020881652832031, -0.03885507583618164, -0.03750133514404297, -0.0361475944519043, -0.034793853759765625, -0.03344011306762695, -0.03208637237548828, -0.03073263168334961, -0.029378890991210938, -0.028025150299072266, -0.026671409606933594, -0.025317668914794922, -0.02396392822265625, -0.022610187530517578, -0.021256446838378906, -0.019902706146240234, -0.018548965454101562, -0.01719522476196289, -0.01584148406982422, -0.014487743377685547, -0.013134002685546875, -0.011780261993408203, -0.010426521301269531, -0.00907278060913086, -0.0077190399169921875, -0.006365299224853516, -0.005011558532714844, -0.003657817840576172, -0.0023040771484375, -0.0009503364562988281, 0.00040340423583984375, 0.0017571449279785156, 0.0031108856201171875, 0.004464626312255859, 0.005818367004394531, 0.007172107696533203, 0.008525848388671875, 0.009879589080810547, 0.011233329772949219, 0.01258707046508789, 0.013940811157226562, 0.015294551849365234, 0.016648292541503906, 0.018002033233642578, 0.01935577392578125, 0.020709514617919922, 0.022063255310058594, 0.023416996002197266, 0.024770736694335938, 0.02612447738647461, 0.02747821807861328, 0.028831958770751953, 0.030185699462890625, 0.0315394401550293, 0.03289318084716797, 0.03424692153930664, 0.03560066223144531, 0.036954402923583984, 0.038308143615722656, 0.03966188430786133, 0.041015625]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 8.0, 17.0, 32.0, 69.0, 126.0, 188.0, 196.0, 173.0, 98.0, 54.0, 34.0, 8.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0022862080950289965, -0.002235752996057272, -0.0021852978970855474, -0.002134842798113823, -0.0020843876991420984, -0.002033932600170374, -0.0019834775011986494, -0.001933022285811603, -0.0018825671868398786, -0.001832112087868154, -0.0017816569888964295, -0.001731201889924705, -0.0016807467909529805, -0.0016302915755659342, -0.0015798364765942097, -0.0015293813776224852, -0.0014789262786507607, -0.0014284711796790361, -0.0013780160807073116, -0.0013275609817355871, -0.0012771058827638626, -0.001226650783792138, -0.0011761956848204136, -0.0011257404694333673, -0.0010752854868769646, -0.00102483038790524, -0.0009743752889335155, -0.000923920189961791, -0.0008734650327824056, -0.0008230099338106811, -0.0007725548348389566, -0.0007220996776595712, -0.0006716445786878467, -0.0006211894797161222, -0.0005707343807443976, -0.0005202792817726731, -0.0004698241245932877, -0.0004193690256215632, -0.0003689139266498387, -0.0003184587985742837, -0.0002680036996025592, -0.00021754858607891947, -0.00016709347255527973, -0.00011663837358355522, -6.618326005991548e-05, -1.5728146536275744e-05, 3.4726952435448766e-05, 8.518208051100373e-05, 0.00013563717948272824, 0.00018609229300636798, 0.00023654740653000772, 0.00028700250550173223, 0.0003374576335772872, 0.0003879127325490117, 0.0004383678315207362, 0.0004888229304924607, 0.0005392780294641852, 0.0005897331284359097, 0.0006401882274076343, 0.0006906433263793588, 0.0007410984835587442, 0.0007915535825304687, 0.0008420086815021932, 0.0008924638386815786, 0.0009429189376533031]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 2.0, 6.0, 13.0, 7.0, 6.0, 10.0, 17.0, 5.0, 19.0, 21.0, 22.0, 28.0, 25.0, 28.0, 40.0, 29.0, 34.0, 30.0, 26.0, 45.0, 36.0, 40.0, 40.0, 42.0, 39.0, 35.0, 35.0, 36.0, 35.0, 26.0, 31.0, 23.0, 26.0, 22.0, 22.0, 23.0, 15.0, 11.0, 11.0, 7.0, 6.0, 10.0, 7.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0009571313858032227, -0.0009287148714065552, -0.0009002983570098877, -0.0008718818426132202, -0.0008434653282165527, -0.0008150488138198853, -0.0007866322994232178, -0.0007582157850265503, -0.0007297992706298828, -0.0007013827562332153, -0.0006729662418365479, -0.0006445497274398804, -0.0006161332130432129, -0.0005877166986465454, -0.0005593001842498779, -0.0005308836698532104, -0.000502467155456543, -0.0004740506410598755, -0.000445634126663208, -0.00041721761226654053, -0.00038880109786987305, -0.00036038458347320557, -0.0003319680690765381, -0.0003035515546798706, -0.0002751350402832031, -0.00024671852588653564, -0.00021830201148986816, -0.00018988549709320068, -0.0001614689826965332, -0.00013305246829986572, -0.00010463595390319824, -7.621943950653076e-05, -4.780292510986328e-05, -1.93864107131958e-05, 9.03010368347168e-06, 3.744661808013916e-05, 6.586313247680664e-05, 9.427964687347412e-05, 0.0001226961612701416, 0.00015111267566680908, 0.00017952919006347656, 0.00020794570446014404, 0.00023636221885681152, 0.000264778733253479, 0.0002931952476501465, 0.00032161176204681396, 0.00035002827644348145, 0.0003784447908401489, 0.0004068613052368164, 0.0004352778196334839, 0.00046369433403015137, 0.0004921108484268188, 0.0005205273628234863, 0.0005489438772201538, 0.0005773603916168213, 0.0006057769060134888, 0.0006341934204101562, 0.0006626099348068237, 0.0006910264492034912, 0.0007194429636001587, 0.0007478594779968262, 0.0007762759923934937, 0.0008046925067901611, 0.0008331090211868286, 0.0008615255355834961]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 5.0, 3.0, 1.0, 5.0, 7.0, 18.0, 5.0, 11.0, 11.0, 14.0, 19.0, 22.0, 21.0, 24.0, 20.0, 16.0, 27.0, 28.0, 44.0, 30.0, 51.0, 40.0, 38.0, 50.0, 38.0, 37.0, 51.0, 40.0, 24.0, 33.0, 35.0, 29.0, 28.0, 22.0, 19.0, 25.0, 15.0, 20.0, 15.0, 14.0, 13.0, 5.0, 3.0, 6.0, 5.0, 5.0, 3.0, 6.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.5625, -7.3099365234375, -7.057373046875, -6.8048095703125, -6.55224609375, -6.2996826171875, -6.047119140625, -5.7945556640625, -5.5419921875, -5.2894287109375, -5.036865234375, -4.7843017578125, -4.53173828125, -4.2791748046875, -4.026611328125, -3.7740478515625, -3.521484375, -3.2689208984375, -3.016357421875, -2.7637939453125, -2.51123046875, -2.2586669921875, -2.006103515625, -1.7535400390625, -1.5009765625, -1.2484130859375, -0.995849609375, -0.7432861328125, -0.49072265625, -0.2381591796875, 0.014404296875, 0.2669677734375, 0.51953125, 0.7720947265625, 1.024658203125, 1.2772216796875, 1.52978515625, 1.7823486328125, 2.034912109375, 2.2874755859375, 2.5400390625, 2.7926025390625, 3.045166015625, 3.2977294921875, 3.55029296875, 3.8028564453125, 4.055419921875, 4.3079833984375, 4.560546875, 4.8131103515625, 5.065673828125, 5.3182373046875, 5.57080078125, 5.8233642578125, 6.075927734375, 6.3284912109375, 6.5810546875, 6.8336181640625, 7.086181640625, 7.3387451171875, 7.59130859375, 7.8438720703125, 8.096435546875, 8.3489990234375, 8.6015625]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 4.0, 0.0, 6.0, 2.0, 6.0, 3.0, 6.0, 25.0, 12.0, 17.0, 22.0, 23.0, 35.0, 59.0, 45.0, 69.0, 92.0, 148.0, 172.0, 287.0, 453.0, 918.0, 2205.0, 7583.0, 40485.0, 569883.0, 382884.0, 32543.0, 6457.0, 1848.0, 827.0, 413.0, 283.0, 214.0, 121.0, 92.0, 75.0, 56.0, 37.0, 25.0, 29.0, 27.0, 21.0, 10.0, 5.0, 6.0, 8.0, 5.0, 4.0, 7.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.921875, -13.4569091796875, -12.991943359375, -12.5269775390625, -12.06201171875, -11.5970458984375, -11.132080078125, -10.6671142578125, -10.2021484375, -9.7371826171875, -9.272216796875, -8.8072509765625, -8.34228515625, -7.8773193359375, -7.412353515625, -6.9473876953125, -6.482421875, -6.0174560546875, -5.552490234375, -5.0875244140625, -4.62255859375, -4.1575927734375, -3.692626953125, -3.2276611328125, -2.7626953125, -2.2977294921875, -1.832763671875, -1.3677978515625, -0.90283203125, -0.4378662109375, 0.027099609375, 0.4920654296875, 0.95703125, 1.4219970703125, 1.886962890625, 2.3519287109375, 2.81689453125, 3.2818603515625, 3.746826171875, 4.2117919921875, 4.6767578125, 5.1417236328125, 5.606689453125, 6.0716552734375, 6.53662109375, 7.0015869140625, 7.466552734375, 7.9315185546875, 8.396484375, 8.8614501953125, 9.326416015625, 9.7913818359375, 10.25634765625, 10.7213134765625, 11.186279296875, 11.6512451171875, 12.1162109375, 12.5811767578125, 13.046142578125, 13.5111083984375, 13.97607421875, 14.4410400390625, 14.906005859375, 15.3709716796875, 15.8359375]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 2.0, 4.0, 3.0, 5.0, 11.0, 9.0, 7.0, 11.0, 9.0, 14.0, 14.0, 11.0, 15.0, 20.0, 15.0, 24.0, 25.0, 26.0, 26.0, 44.0, 32.0, 36.0, 56.0, 83.0, 406.0, 1564.0, 87.0, 73.0, 46.0, 43.0, 44.0, 34.0, 34.0, 29.0, 32.0, 25.0, 26.0, 14.0, 12.0, 15.0, 12.0, 10.0, 3.0, 6.0, 7.0, 9.0, 7.0, 7.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-22.953125, -22.21337890625, -21.4736328125, -20.73388671875, -19.994140625, -19.25439453125, -18.5146484375, -17.77490234375, -17.03515625, -16.29541015625, -15.5556640625, -14.81591796875, -14.076171875, -13.33642578125, -12.5966796875, -11.85693359375, -11.1171875, -10.37744140625, -9.6376953125, -8.89794921875, -8.158203125, -7.41845703125, -6.6787109375, -5.93896484375, -5.19921875, -4.45947265625, -3.7197265625, -2.97998046875, -2.240234375, -1.50048828125, -0.7607421875, -0.02099609375, 0.71875, 1.45849609375, 2.1982421875, 2.93798828125, 3.677734375, 4.41748046875, 5.1572265625, 5.89697265625, 6.63671875, 7.37646484375, 8.1162109375, 8.85595703125, 9.595703125, 10.33544921875, 11.0751953125, 11.81494140625, 12.5546875, 13.29443359375, 14.0341796875, 14.77392578125, 15.513671875, 16.25341796875, 16.9931640625, 17.73291015625, 18.47265625, 19.21240234375, 19.9521484375, 20.69189453125, 21.431640625, 22.17138671875, 22.9111328125, 23.65087890625, 24.390625]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 7.0, 6.0, 7.0, 5.0, 9.0, 7.0, 7.0, 9.0, 20.0, 15.0, 20.0, 21.0, 24.0, 24.0, 46.0, 48.0, 60.0, 73.0, 101.0, 176.0, 251.0, 557.0, 2233.0, 2909123.0, 230236.0, 1357.0, 424.0, 242.0, 151.0, 100.0, 71.0, 50.0, 29.0, 30.0, 14.0, 23.0, 18.0, 15.0, 15.0, 12.0, 19.0, 6.0, 9.0, 7.0, 15.0, 7.0, 3.0, 5.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-72.9375, -70.720703125, -68.50390625, -66.287109375, -64.0703125, -61.853515625, -59.63671875, -57.419921875, -55.203125, -52.986328125, -50.76953125, -48.552734375, -46.3359375, -44.119140625, -41.90234375, -39.685546875, -37.46875, -35.251953125, -33.03515625, -30.818359375, -28.6015625, -26.384765625, -24.16796875, -21.951171875, -19.734375, -17.517578125, -15.30078125, -13.083984375, -10.8671875, -8.650390625, -6.43359375, -4.216796875, -2.0, 0.216796875, 2.43359375, 4.650390625, 6.8671875, 9.083984375, 11.30078125, 13.517578125, 15.734375, 17.951171875, 20.16796875, 22.384765625, 24.6015625, 26.818359375, 29.03515625, 31.251953125, 33.46875, 35.685546875, 37.90234375, 40.119140625, 42.3359375, 44.552734375, 46.76953125, 48.986328125, 51.203125, 53.419921875, 55.63671875, 57.853515625, 60.0703125, 62.287109375, 64.50390625, 66.720703125, 68.9375]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 238.0, 708.0, 70.0], "bins": [-266.7608947753906, -262.4787902832031, -258.19671630859375, -253.91461181640625, -249.63250732421875, -245.35040283203125, -241.0683135986328, -236.78622436523438, -232.50411987304688, -228.22201538085938, -223.93992614746094, -219.6578369140625, -215.375732421875, -211.0936279296875, -206.81153869628906, -202.52944946289062, -198.24734497070312, -193.96524047851562, -189.6831512451172, -185.40106201171875, -181.11895751953125, -176.83685302734375, -172.5547637939453, -168.27267456054688, -163.99057006835938, -159.70846557617188, -155.42637634277344, -151.144287109375, -146.8621826171875, -142.580078125, -138.29798889160156, -134.01589965820312, -129.73377990722656, -125.4516830444336, -121.16958618164062, -116.88748931884766, -112.60539245605469, -108.32329559326172, -104.04119873046875, -99.75910186767578, -95.47700500488281, -91.19490814208984, -86.91281127929688, -82.6307144165039, -78.34861755371094, -74.06652069091797, -69.784423828125, -65.50232696533203, -61.22023391723633, -56.93813705444336, -52.65604019165039, -48.37394332885742, -44.09184646606445, -39.809749603271484, -35.527652740478516, -31.245555877685547, -26.963457107543945, -22.681360244750977, -18.399263381958008, -14.117166519165039, -9.83506965637207, -5.552972793579102, -1.2708759307861328, 3.011220932006836, 7.2933173179626465]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 4.0, 6.0, 4.0, 7.0, 4.0, 10.0, 18.0, 10.0, 15.0, 11.0, 23.0, 22.0, 20.0, 20.0, 32.0, 28.0, 45.0, 28.0, 50.0, 47.0, 49.0, 29.0, 40.0, 34.0, 37.0, 46.0, 39.0, 36.0, 31.0, 37.0, 33.0, 24.0, 19.0, 21.0, 20.0, 23.0, 8.0, 16.0, 11.0, 11.0, 7.0, 6.0, 10.0, 2.0, 6.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-80.03221130371094, -77.61380767822266, -75.19539642333984, -72.77699279785156, -70.35858154296875, -67.94017791748047, -65.52176666259766, -63.103363037109375, -60.68495559692383, -58.26654815673828, -55.848140716552734, -53.42973327636719, -51.011329650878906, -48.592918395996094, -46.17451477050781, -43.756107330322266, -41.33769989013672, -38.91929244995117, -36.500885009765625, -34.08247756958008, -31.664072036743164, -29.245664596557617, -26.827259063720703, -24.408851623535156, -21.99044418334961, -19.572036743164062, -17.153629302978516, -14.735223770141602, -12.316816329956055, -9.898408889770508, -7.480002403259277, -5.061595916748047, -2.6431808471679688, -0.22477388381958008, 2.1936330795288086, 4.612040042877197, 7.030447006225586, 9.448854446411133, 11.867260932922363, 14.285667419433594, 16.70407485961914, 19.122482299804688, 21.540889739990234, 23.95929527282715, 26.377702713012695, 28.796110153198242, 31.214515686035156, 33.6329231262207, 36.05133056640625, 38.4697380065918, 40.888145446777344, 43.30655288696289, 45.72496032714844, 48.14336395263672, 50.561771392822266, 52.98017883300781, 55.39858627319336, 57.816993713378906, 60.23540115356445, 62.65380859375, 65.07221221923828, 67.4906234741211, 69.90902709960938, 72.32743835449219, 74.74584197998047]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 9.0, 4.0, 7.0, 10.0, 11.0, 13.0, 16.0, 18.0, 18.0, 16.0, 17.0, 23.0, 28.0, 30.0, 28.0, 36.0, 38.0, 38.0, 41.0, 49.0, 44.0, 52.0, 53.0, 39.0, 35.0, 40.0, 38.0, 21.0, 36.0, 19.0, 32.0, 23.0, 17.0, 16.0, 15.0, 14.0, 16.0, 7.0, 4.0, 10.0, 4.0, 3.0, 4.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0625, -7.7835693359375, -7.504638671875, -7.2257080078125, -6.94677734375, -6.6678466796875, -6.388916015625, -6.1099853515625, -5.8310546875, -5.5521240234375, -5.273193359375, -4.9942626953125, -4.71533203125, -4.4364013671875, -4.157470703125, -3.8785400390625, -3.599609375, -3.3206787109375, -3.041748046875, -2.7628173828125, -2.48388671875, -2.2049560546875, -1.926025390625, -1.6470947265625, -1.3681640625, -1.0892333984375, -0.810302734375, -0.5313720703125, -0.25244140625, 0.0264892578125, 0.305419921875, 0.5843505859375, 0.86328125, 1.1422119140625, 1.421142578125, 1.7000732421875, 1.97900390625, 2.2579345703125, 2.536865234375, 2.8157958984375, 3.0947265625, 3.3736572265625, 3.652587890625, 3.9315185546875, 4.21044921875, 4.4893798828125, 4.768310546875, 5.0472412109375, 5.326171875, 5.6051025390625, 5.884033203125, 6.1629638671875, 6.44189453125, 6.7208251953125, 6.999755859375, 7.2786865234375, 7.5576171875, 7.8365478515625, 8.115478515625, 8.3944091796875, 8.67333984375, 8.9522705078125, 9.231201171875, 9.5101318359375, 9.7890625]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 3.0, 1.0, 8.0, 9.0, 5.0, 9.0, 6.0, 16.0, 20.0, 17.0, 24.0, 33.0, 39.0, 62.0, 90.0, 89.0, 194.0, 263.0, 440.0, 747.0, 1409.0, 2518.0, 5546.0, 13621.0, 41992.0, 168976.0, 641277.0, 1450368.0, 1243760.0, 455921.0, 115826.0, 30216.0, 10752.0, 4595.0, 2291.0, 1189.0, 699.0, 408.0, 248.0, 159.0, 113.0, 91.0, 60.0, 42.0, 34.0, 24.0, 19.0, 15.0, 11.0, 10.0, 3.0, 6.0, 8.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.96875, -9.6558837890625, -9.343017578125, -9.0301513671875, -8.71728515625, -8.4044189453125, -8.091552734375, -7.7786865234375, -7.4658203125, -7.1529541015625, -6.840087890625, -6.5272216796875, -6.21435546875, -5.9014892578125, -5.588623046875, -5.2757568359375, -4.962890625, -4.6500244140625, -4.337158203125, -4.0242919921875, -3.71142578125, -3.3985595703125, -3.085693359375, -2.7728271484375, -2.4599609375, -2.1470947265625, -1.834228515625, -1.5213623046875, -1.20849609375, -0.8956298828125, -0.582763671875, -0.2698974609375, 0.04296875, 0.3558349609375, 0.668701171875, 0.9815673828125, 1.29443359375, 1.6072998046875, 1.920166015625, 2.2330322265625, 2.5458984375, 2.8587646484375, 3.171630859375, 3.4844970703125, 3.79736328125, 4.1102294921875, 4.423095703125, 4.7359619140625, 5.048828125, 5.3616943359375, 5.674560546875, 5.9874267578125, 6.30029296875, 6.6131591796875, 6.926025390625, 7.2388916015625, 7.5517578125, 7.8646240234375, 8.177490234375, 8.4903564453125, 8.80322265625, 9.1160888671875, 9.428955078125, 9.7418212890625, 10.0546875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 4.0, 3.0, 10.0, 9.0, 17.0, 23.0, 32.0, 61.0, 89.0, 128.0, 177.0, 263.0, 391.0, 543.0, 653.0, 524.0, 396.0, 269.0, 153.0, 119.0, 79.0, 58.0, 33.0, 18.0, 12.0, 9.0, 8.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-33.25, -32.519287109375, -31.78857421875, -31.057861328125, -30.3271484375, -29.596435546875, -28.86572265625, -28.135009765625, -27.404296875, -26.673583984375, -25.94287109375, -25.212158203125, -24.4814453125, -23.750732421875, -23.02001953125, -22.289306640625, -21.55859375, -20.827880859375, -20.09716796875, -19.366455078125, -18.6357421875, -17.905029296875, -17.17431640625, -16.443603515625, -15.712890625, -14.982177734375, -14.25146484375, -13.520751953125, -12.7900390625, -12.059326171875, -11.32861328125, -10.597900390625, -9.8671875, -9.136474609375, -8.40576171875, -7.675048828125, -6.9443359375, -6.213623046875, -5.48291015625, -4.752197265625, -4.021484375, -3.290771484375, -2.56005859375, -1.829345703125, -1.0986328125, -0.367919921875, 0.36279296875, 1.093505859375, 1.82421875, 2.554931640625, 3.28564453125, 4.016357421875, 4.7470703125, 5.477783203125, 6.20849609375, 6.939208984375, 7.669921875, 8.400634765625, 9.13134765625, 9.862060546875, 10.5927734375, 11.323486328125, 12.05419921875, 12.784912109375, 13.515625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 11.0, 16.0, 23.0, 46.0, 66.0, 101.0, 157.0, 223.0, 335.0, 570.0, 1504.0, 111574.0, 4073539.0, 4061.0, 773.0, 443.0, 276.0, 192.0, 148.0, 73.0, 62.0, 39.0, 25.0, 11.0, 10.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-107.6875, -104.1259765625, -100.564453125, -97.0029296875, -93.44140625, -89.8798828125, -86.318359375, -82.7568359375, -79.1953125, -75.6337890625, -72.072265625, -68.5107421875, -64.94921875, -61.3876953125, -57.826171875, -54.2646484375, -50.703125, -47.1416015625, -43.580078125, -40.0185546875, -36.45703125, -32.8955078125, -29.333984375, -25.7724609375, -22.2109375, -18.6494140625, -15.087890625, -11.5263671875, -7.96484375, -4.4033203125, -0.841796875, 2.7197265625, 6.28125, 9.8427734375, 13.404296875, 16.9658203125, 20.52734375, 24.0888671875, 27.650390625, 31.2119140625, 34.7734375, 38.3349609375, 41.896484375, 45.4580078125, 49.01953125, 52.5810546875, 56.142578125, 59.7041015625, 63.265625, 66.8271484375, 70.388671875, 73.9501953125, 77.51171875, 81.0732421875, 84.634765625, 88.1962890625, 91.7578125, 95.3193359375, 98.880859375, 102.4423828125, 106.00390625, 109.5654296875, 113.126953125, 116.6884765625, 120.25]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 582.0, 435.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1828.9698486328125, -1795.708251953125, -1762.4466552734375, -1729.1851806640625, -1695.923583984375, -1662.6619873046875, -1629.400390625, -1596.138916015625, -1562.8773193359375, -1529.61572265625, -1496.3541259765625, -1463.0926513671875, -1429.8310546875, -1396.5694580078125, -1363.307861328125, -1330.04638671875, -1296.78466796875, -1263.5230712890625, -1230.261474609375, -1197.0, -1163.7384033203125, -1130.476806640625, -1097.2152099609375, -1063.95361328125, -1030.692138671875, -997.4305419921875, -964.1690063476562, -930.9074096679688, -897.6458740234375, -864.38427734375, -831.1226806640625, -797.8611450195312, -764.599609375, -731.3380126953125, -698.0764770507812, -664.8148803710938, -631.5533447265625, -598.291748046875, -565.0301513671875, -531.7686157226562, -498.507080078125, -465.2455139160156, -431.98394775390625, -398.72235107421875, -365.4608154296875, -332.19921875, -298.9376525878906, -265.67608642578125, -232.41452026367188, -199.1529541015625, -165.89138793945312, -132.6298065185547, -99.36824035644531, -66.10667419433594, -32.8450927734375, 0.416473388671875, 33.67803955078125, 66.93960571289062, 100.20117950439453, 133.46275329589844, 166.7243194580078, 199.9858856201172, 233.24746704101562, 266.509033203125, 299.7705993652344]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 10.0, 8.0, 12.0, 17.0, 26.0, 33.0, 39.0, 33.0, 37.0, 45.0, 43.0, 52.0, 65.0, 52.0, 60.0, 68.0, 67.0, 52.0, 48.0, 50.0, 36.0, 42.0, 31.0, 17.0, 12.0, 10.0, 14.0, 11.0, 11.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.33647155761719, -55.7484130859375, -53.16035079956055, -50.57229232788086, -47.984230041503906, -45.39617156982422, -42.80811309814453, -40.22005081176758, -37.631988525390625, -35.04393005371094, -32.455867767333984, -29.867809295654297, -27.279747009277344, -24.691688537597656, -22.103628158569336, -19.515567779541016, -16.927509307861328, -14.339448928833008, -11.751388549804688, -9.163329124450684, -6.575268745422363, -3.987208366394043, -1.399148941040039, 1.1889114379882812, 3.7769718170166016, 6.365032196044922, 8.953092575073242, 11.541152000427246, 14.129212379455566, 16.717273712158203, 19.30533218383789, 21.89339256286621, 24.48145294189453, 27.06951332092285, 29.657573699951172, 32.24563217163086, 34.83369445800781, 37.4217529296875, 40.00981140136719, 42.59787368774414, 45.185935974121094, 47.77399444580078, 50.362056732177734, 52.95011520385742, 55.538177490234375, 58.12623596191406, 60.71429443359375, 63.3023567199707, 65.89041137695312, 68.47846984863281, 71.0665283203125, 73.65459442138672, 76.2426528930664, 78.8307113647461, 81.41876983642578, 84.0068359375, 86.59489440917969, 89.18295288085938, 91.77101135253906, 94.35907745361328, 96.94713592529297, 99.53519439697266, 102.12325286865234, 104.71131896972656, 107.29937744140625]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 1.0, 5.0, 3.0, 4.0, 5.0, 6.0, 5.0, 11.0, 12.0, 15.0, 18.0, 21.0, 22.0, 17.0, 27.0, 32.0, 28.0, 44.0, 44.0, 36.0, 50.0, 43.0, 50.0, 45.0, 50.0, 46.0, 45.0, 40.0, 48.0, 34.0, 26.0, 20.0, 24.0, 18.0, 20.0, 20.0, 14.0, 14.0, 11.0, 4.0, 7.0, 3.0, 6.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8359375, -8.55126953125, -8.2666015625, -7.98193359375, -7.697265625, -7.41259765625, -7.1279296875, -6.84326171875, -6.55859375, -6.27392578125, -5.9892578125, -5.70458984375, -5.419921875, -5.13525390625, -4.8505859375, -4.56591796875, -4.28125, -3.99658203125, -3.7119140625, -3.42724609375, -3.142578125, -2.85791015625, -2.5732421875, -2.28857421875, -2.00390625, -1.71923828125, -1.4345703125, -1.14990234375, -0.865234375, -0.58056640625, -0.2958984375, -0.01123046875, 0.2734375, 0.55810546875, 0.8427734375, 1.12744140625, 1.412109375, 1.69677734375, 1.9814453125, 2.26611328125, 2.55078125, 2.83544921875, 3.1201171875, 3.40478515625, 3.689453125, 3.97412109375, 4.2587890625, 4.54345703125, 4.828125, 5.11279296875, 5.3974609375, 5.68212890625, 5.966796875, 6.25146484375, 6.5361328125, 6.82080078125, 7.10546875, 7.39013671875, 7.6748046875, 7.95947265625, 8.244140625, 8.52880859375, 8.8134765625, 9.09814453125, 9.3828125]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 7.0, 2.0, 14.0, 24.0, 21.0, 36.0, 49.0, 80.0, 109.0, 163.0, 199.0, 354.0, 477.0, 679.0, 938.0, 1443.0, 2059.0, 3033.0, 4424.0, 6366.0, 9271.0, 13525.0, 19563.0, 28001.0, 41595.0, 62630.0, 99367.0, 160021.0, 202115.0, 136025.0, 84958.0, 54647.0, 36148.0, 24741.0, 17215.0, 11899.0, 8301.0, 5606.0, 3869.0, 2712.0, 1882.0, 1213.0, 864.0, 590.0, 420.0, 278.0, 199.0, 140.0, 79.0, 63.0, 57.0, 31.0, 22.0, 12.0, 12.0, 8.0, 5.0, 2.0, 1.0, 2.0], "bins": [-1.0927734375, -1.0589752197265625, -1.025177001953125, -0.9913787841796875, -0.95758056640625, -0.9237823486328125, -0.889984130859375, -0.8561859130859375, -0.8223876953125, -0.7885894775390625, -0.754791259765625, -0.7209930419921875, -0.68719482421875, -0.6533966064453125, -0.619598388671875, -0.5858001708984375, -0.552001953125, -0.5182037353515625, -0.484405517578125, -0.4506072998046875, -0.41680908203125, -0.3830108642578125, -0.349212646484375, -0.3154144287109375, -0.2816162109375, -0.2478179931640625, -0.214019775390625, -0.1802215576171875, -0.14642333984375, -0.1126251220703125, -0.078826904296875, -0.0450286865234375, -0.01123046875, 0.0225677490234375, 0.056365966796875, 0.0901641845703125, 0.12396240234375, 0.1577606201171875, 0.191558837890625, 0.2253570556640625, 0.2591552734375, 0.2929534912109375, 0.326751708984375, 0.3605499267578125, 0.39434814453125, 0.4281463623046875, 0.461944580078125, 0.4957427978515625, 0.529541015625, 0.5633392333984375, 0.597137451171875, 0.6309356689453125, 0.66473388671875, 0.6985321044921875, 0.732330322265625, 0.7661285400390625, 0.7999267578125, 0.8337249755859375, 0.867523193359375, 0.9013214111328125, 0.93511962890625, 0.9689178466796875, 1.002716064453125, 1.0365142822265625, 1.0703125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 8.0, 5.0, 5.0, 6.0, 8.0, 6.0, 20.0, 10.0, 15.0, 14.0, 18.0, 14.0, 23.0, 18.0, 28.0, 28.0, 26.0, 33.0, 24.0, 26.0, 30.0, 43.0, 44.0, 36.0, 1060.0, 43.0, 35.0, 33.0, 30.0, 32.0, 20.0, 27.0, 29.0, 32.0, 23.0, 29.0, 21.0, 18.0, 14.0, 16.0, 11.0, 11.0, 12.0, 9.0, 4.0, 7.0, 5.0, 6.0, 4.0, 2.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-4.578125, -4.4312744140625, -4.284423828125, -4.1375732421875, -3.99072265625, -3.8438720703125, -3.697021484375, -3.5501708984375, -3.4033203125, -3.2564697265625, -3.109619140625, -2.9627685546875, -2.81591796875, -2.6690673828125, -2.522216796875, -2.3753662109375, -2.228515625, -2.0816650390625, -1.934814453125, -1.7879638671875, -1.64111328125, -1.4942626953125, -1.347412109375, -1.2005615234375, -1.0537109375, -0.9068603515625, -0.760009765625, -0.6131591796875, -0.46630859375, -0.3194580078125, -0.172607421875, -0.0257568359375, 0.12109375, 0.2679443359375, 0.414794921875, 0.5616455078125, 0.70849609375, 0.8553466796875, 1.002197265625, 1.1490478515625, 1.2958984375, 1.4427490234375, 1.589599609375, 1.7364501953125, 1.88330078125, 2.0301513671875, 2.177001953125, 2.3238525390625, 2.470703125, 2.6175537109375, 2.764404296875, 2.9112548828125, 3.05810546875, 3.2049560546875, 3.351806640625, 3.4986572265625, 3.6455078125, 3.7923583984375, 3.939208984375, 4.0860595703125, 4.23291015625, 4.3797607421875, 4.526611328125, 4.6734619140625, 4.8203125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 10.0, 10.0, 10.0, 25.0, 50.0, 57.0, 66.0, 120.0, 197.0, 291.0, 432.0, 701.0, 1091.0, 1595.0, 2353.0, 3533.0, 5483.0, 8487.0, 12847.0, 20010.0, 31411.0, 48849.0, 77319.0, 120659.0, 486522.0, 937513.0, 121485.0, 77358.0, 49474.0, 31526.0, 20028.0, 12889.0, 8466.0, 5580.0, 3707.0, 2379.0, 1619.0, 973.0, 686.0, 455.0, 309.0, 204.0, 133.0, 84.0, 42.0, 41.0, 16.0, 8.0, 9.0, 15.0, 6.0, 0.0, 3.0, 1.0, 1.0, 2.0], "bins": [-1.138671875, -1.1041717529296875, -1.069671630859375, -1.0351715087890625, -1.00067138671875, -0.9661712646484375, -0.931671142578125, -0.8971710205078125, -0.8626708984375, -0.8281707763671875, -0.793670654296875, -0.7591705322265625, -0.72467041015625, -0.6901702880859375, -0.655670166015625, -0.6211700439453125, -0.586669921875, -0.5521697998046875, -0.517669677734375, -0.4831695556640625, -0.44866943359375, -0.4141693115234375, -0.379669189453125, -0.3451690673828125, -0.3106689453125, -0.2761688232421875, -0.241668701171875, -0.2071685791015625, -0.17266845703125, -0.1381683349609375, -0.103668212890625, -0.0691680908203125, -0.03466796875, -0.0001678466796875, 0.034332275390625, 0.0688323974609375, 0.10333251953125, 0.1378326416015625, 0.172332763671875, 0.2068328857421875, 0.2413330078125, 0.2758331298828125, 0.310333251953125, 0.3448333740234375, 0.37933349609375, 0.4138336181640625, 0.448333740234375, 0.4828338623046875, 0.517333984375, 0.5518341064453125, 0.586334228515625, 0.6208343505859375, 0.65533447265625, 0.6898345947265625, 0.724334716796875, 0.7588348388671875, 0.7933349609375, 0.8278350830078125, 0.862335205078125, 0.8968353271484375, 0.93133544921875, 0.9658355712890625, 1.000335693359375, 1.0348358154296875, 1.0693359375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 8.0, 6.0, 10.0, 11.0, 13.0, 17.0, 17.0, 26.0, 32.0, 35.0, 30.0, 42.0, 40.0, 50.0, 52.0, 54.0, 52.0, 58.0, 58.0, 53.0, 56.0, 50.0, 41.0, 37.0, 32.0, 16.0, 25.0, 19.0, 14.0, 11.0, 7.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0018224716186523438, -0.0017687678337097168, -0.0017150640487670898, -0.0016613602638244629, -0.001607656478881836, -0.001553952693939209, -0.001500248908996582, -0.001446545124053955, -0.0013928413391113281, -0.0013391375541687012, -0.0012854337692260742, -0.0012317299842834473, -0.0011780261993408203, -0.0011243224143981934, -0.0010706186294555664, -0.0010169148445129395, -0.0009632110595703125, -0.0009095072746276855, -0.0008558034896850586, -0.0008020997047424316, -0.0007483959197998047, -0.0006946921348571777, -0.0006409883499145508, -0.0005872845649719238, -0.0005335807800292969, -0.0004798769950866699, -0.00042617321014404297, -0.000372469425201416, -0.00031876564025878906, -0.0002650618553161621, -0.00021135807037353516, -0.0001576542854309082, -0.00010395050048828125, -5.02467155456543e-05, 3.4570693969726562e-06, 5.716085433959961e-05, 0.00011086463928222656, 0.00016456842422485352, 0.00021827220916748047, 0.0002719759941101074, 0.0003256797790527344, 0.00037938356399536133, 0.0004330873489379883, 0.00048679113388061523, 0.0005404949188232422, 0.0005941987037658691, 0.0006479024887084961, 0.000701606273651123, 0.00075531005859375, 0.000809013843536377, 0.0008627176284790039, 0.0009164214134216309, 0.0009701251983642578, 0.0010238289833068848, 0.0010775327682495117, 0.0011312365531921387, 0.0011849403381347656, 0.0012386441230773926, 0.0012923479080200195, 0.0013460516929626465, 0.0013997554779052734, 0.0014534592628479004, 0.0015071630477905273, 0.0015608668327331543, 0.0016145706176757812]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 5.0, 8.0, 10.0, 20.0, 25.0, 22.0, 27.0, 36.0, 67.0, 69.0, 96.0, 142.0, 224.0, 524.0, 2062.0, 1000731.0, 42458.0, 976.0, 369.0, 181.0, 102.0, 80.0, 80.0, 57.0, 45.0, 28.0, 27.0, 15.0, 9.0, 14.0, 9.0, 12.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.040313720703125, -0.03900289535522461, -0.03769207000732422, -0.03638124465942383, -0.03507041931152344, -0.03375959396362305, -0.032448768615722656, -0.031137943267822266, -0.029827117919921875, -0.028516292572021484, -0.027205467224121094, -0.025894641876220703, -0.024583816528320312, -0.023272991180419922, -0.02196216583251953, -0.02065134048461914, -0.01934051513671875, -0.01802968978881836, -0.01671886444091797, -0.015408039093017578, -0.014097213745117188, -0.012786388397216797, -0.011475563049316406, -0.010164737701416016, -0.008853912353515625, -0.007543087005615234, -0.006232261657714844, -0.004921436309814453, -0.0036106109619140625, -0.002299785614013672, -0.0009889602661132812, 0.0003218650817871094, 0.0016326904296875, 0.0029435157775878906, 0.004254341125488281, 0.005565166473388672, 0.0068759918212890625, 0.008186817169189453, 0.009497642517089844, 0.010808467864990234, 0.012119293212890625, 0.013430118560791016, 0.014740943908691406, 0.016051769256591797, 0.017362594604492188, 0.018673419952392578, 0.01998424530029297, 0.02129507064819336, 0.02260589599609375, 0.02391672134399414, 0.02522754669189453, 0.026538372039794922, 0.027849197387695312, 0.029160022735595703, 0.030470848083496094, 0.031781673431396484, 0.033092498779296875, 0.034403324127197266, 0.035714149475097656, 0.03702497482299805, 0.03833580017089844, 0.03964662551879883, 0.04095745086669922, 0.04226827621459961, 0.0435791015625]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 19.0, 61.0, 151.0, 269.0, 270.0, 159.0, 59.0, 17.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0031445971690118313, -0.0030660019256174564, -0.0029874066822230816, -0.002908811205998063, -0.0028302159626036882, -0.0027516207192093134, -0.0026730254758149385, -0.00259442999958992, -0.002515834756195545, -0.0024372395128011703, -0.0023586442694067955, -0.002280048793181777, -0.002201453549787402, -0.0021228583063930273, -0.0020442630629986525, -0.001965667586773634, -0.001887072459794581, -0.001808477216400206, -0.0017298818565905094, -0.0016512866131961346, -0.001572691253386438, -0.001494096009992063, -0.0014155006501823664, -0.0013369054067879915, -0.0012583101633936167, -0.0011797149199992418, -0.0011011195601895452, -0.0010225243167951703, -0.0009439289569854736, -0.0008653337135910988, -0.000786738411989063, -0.0007081431103870273, -0.0006295477505773306, -0.0005509524489752948, -0.00047235714737325907, -0.00039376187487505376, -0.000315166573273018, -0.00023657127167098224, -0.00015797599917277694, -7.938069757074118e-05, -7.853959687054157e-07, 7.780989835737273e-05, 0.00015640519268345088, 0.0002350004797335714, 0.00031359578133560717, 0.00039219108293764293, 0.00047078635543584824, 0.000549381657037884, 0.0006279769586399198, 0.0007065722602419555, 0.0007851675618439913, 0.0008637628052383661, 0.0009423581650480628, 0.0010209534084424376, 0.0010995487682521343, 0.0011781440116465092, 0.001256739255040884, 0.0013353344984352589, 0.0014139298582449555, 0.0014925251016393304, 0.001571120461449027, 0.001649715704843402, 0.0017283109482377768, 0.0018069063080474734, 0.00188550166785717]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 2.0, 10.0, 13.0, 14.0, 14.0, 15.0, 16.0, 30.0, 27.0, 24.0, 30.0, 36.0, 27.0, 24.0, 51.0, 49.0, 52.0, 52.0, 51.0, 37.0, 38.0, 44.0, 48.0, 34.0, 35.0, 34.0, 28.0, 26.0, 20.0, 14.0, 22.0, 16.0, 14.0, 6.0, 8.0, 6.0, 9.0, 5.0, 5.0, 6.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009677410125732422, -0.000937717966735363, -0.0009076949208974838, -0.0008776718750596046, -0.0008476488292217255, -0.0008176257833838463, -0.0007876027375459671, -0.0007575796917080879, -0.0007275566458702087, -0.0006975336000323296, -0.0006675105541944504, -0.0006374875083565712, -0.000607464462518692, -0.0005774414166808128, -0.0005474183708429337, -0.0005173953250050545, -0.0004873722791671753, -0.0004573492333292961, -0.00042732618749141693, -0.00039730314165353775, -0.00036728009581565857, -0.0003372570499777794, -0.0003072340041399002, -0.000277210958302021, -0.00024718791246414185, -0.00021716486662626266, -0.00018714182078838348, -0.0001571187749505043, -0.00012709572911262512, -9.707268327474594e-05, -6.704963743686676e-05, -3.702659159898758e-05, -7.0035457611083984e-06, 2.3019500076770782e-05, 5.304254591464996e-05, 8.306559175252914e-05, 0.00011308863759040833, 0.0001431116834282875, 0.0001731347292661667, 0.00020315777510404587, 0.00023318082094192505, 0.00026320386677980423, 0.0002932269126176834, 0.0003232499584555626, 0.00035327300429344177, 0.00038329605013132095, 0.00041331909596920013, 0.0004433421418070793, 0.0004733651876449585, 0.0005033882334828377, 0.0005334112793207169, 0.000563434325158596, 0.0005934573709964752, 0.0006234804168343544, 0.0006535034626722336, 0.0006835265085101128, 0.0007135495543479919, 0.0007435726001858711, 0.0007735956460237503, 0.0008036186918616295, 0.0008336417376995087, 0.0008636647835373878, 0.000893687829375267, 0.0009237108752131462, 0.0009537339210510254]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 1.0, 5.0, 3.0, 4.0, 5.0, 6.0, 5.0, 11.0, 12.0, 15.0, 18.0, 21.0, 22.0, 17.0, 27.0, 32.0, 28.0, 44.0, 44.0, 36.0, 50.0, 43.0, 50.0, 45.0, 50.0, 46.0, 45.0, 40.0, 48.0, 34.0, 26.0, 20.0, 24.0, 18.0, 20.0, 20.0, 14.0, 14.0, 11.0, 4.0, 7.0, 3.0, 6.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8359375, -8.55126953125, -8.2666015625, -7.98193359375, -7.697265625, -7.41259765625, -7.1279296875, -6.84326171875, -6.55859375, -6.27392578125, -5.9892578125, -5.70458984375, -5.419921875, -5.13525390625, -4.8505859375, -4.56591796875, -4.28125, -3.99658203125, -3.7119140625, -3.42724609375, -3.142578125, -2.85791015625, -2.5732421875, -2.28857421875, -2.00390625, -1.71923828125, -1.4345703125, -1.14990234375, -0.865234375, -0.58056640625, -0.2958984375, -0.01123046875, 0.2734375, 0.55810546875, 0.8427734375, 1.12744140625, 1.412109375, 1.69677734375, 1.9814453125, 2.26611328125, 2.55078125, 2.83544921875, 3.1201171875, 3.40478515625, 3.689453125, 3.97412109375, 4.2587890625, 4.54345703125, 4.828125, 5.11279296875, 5.3974609375, 5.68212890625, 5.966796875, 6.25146484375, 6.5361328125, 6.82080078125, 7.10546875, 7.39013671875, 7.6748046875, 7.95947265625, 8.244140625, 8.52880859375, 8.8134765625, 9.09814453125, 9.3828125]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 3.0, 4.0, 4.0, 6.0, 10.0, 11.0, 23.0, 17.0, 32.0, 36.0, 48.0, 84.0, 108.0, 170.0, 395.0, 743.0, 1650.0, 3526.0, 8626.0, 21335.0, 54551.0, 156613.0, 439405.0, 234982.0, 76305.0, 29234.0, 11636.0, 4835.0, 2097.0, 940.0, 434.0, 246.0, 138.0, 90.0, 61.0, 41.0, 30.0, 23.0, 15.0, 11.0, 11.0, 5.0, 6.0, 7.0, 5.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8359375, -7.5885009765625, -7.341064453125, -7.0936279296875, -6.84619140625, -6.5987548828125, -6.351318359375, -6.1038818359375, -5.8564453125, -5.6090087890625, -5.361572265625, -5.1141357421875, -4.86669921875, -4.6192626953125, -4.371826171875, -4.1243896484375, -3.876953125, -3.6295166015625, -3.382080078125, -3.1346435546875, -2.88720703125, -2.6397705078125, -2.392333984375, -2.1448974609375, -1.8974609375, -1.6500244140625, -1.402587890625, -1.1551513671875, -0.90771484375, -0.6602783203125, -0.412841796875, -0.1654052734375, 0.08203125, 0.3294677734375, 0.576904296875, 0.8243408203125, 1.07177734375, 1.3192138671875, 1.566650390625, 1.8140869140625, 2.0615234375, 2.3089599609375, 2.556396484375, 2.8038330078125, 3.05126953125, 3.2987060546875, 3.546142578125, 3.7935791015625, 4.041015625, 4.2884521484375, 4.535888671875, 4.7833251953125, 5.03076171875, 5.2781982421875, 5.525634765625, 5.7730712890625, 6.0205078125, 6.2679443359375, 6.515380859375, 6.7628173828125, 7.01025390625, 7.2576904296875, 7.505126953125, 7.7525634765625, 8.0]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 2.0, 5.0, 4.0, 5.0, 9.0, 12.0, 14.0, 12.0, 14.0, 18.0, 18.0, 26.0, 25.0, 25.0, 41.0, 39.0, 36.0, 55.0, 48.0, 76.0, 199.0, 1563.0, 279.0, 77.0, 55.0, 40.0, 46.0, 42.0, 40.0, 32.0, 28.0, 31.0, 19.0, 23.0, 16.0, 14.0, 17.0, 9.0, 4.0, 8.0, 8.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-26.421875, -25.5859375, -24.75, -23.9140625, -23.078125, -22.2421875, -21.40625, -20.5703125, -19.734375, -18.8984375, -18.0625, -17.2265625, -16.390625, -15.5546875, -14.71875, -13.8828125, -13.046875, -12.2109375, -11.375, -10.5390625, -9.703125, -8.8671875, -8.03125, -7.1953125, -6.359375, -5.5234375, -4.6875, -3.8515625, -3.015625, -2.1796875, -1.34375, -0.5078125, 0.328125, 1.1640625, 2.0, 2.8359375, 3.671875, 4.5078125, 5.34375, 6.1796875, 7.015625, 7.8515625, 8.6875, 9.5234375, 10.359375, 11.1953125, 12.03125, 12.8671875, 13.703125, 14.5390625, 15.375, 16.2109375, 17.046875, 17.8828125, 18.71875, 19.5546875, 20.390625, 21.2265625, 22.0625, 22.8984375, 23.734375, 24.5703125, 25.40625, 26.2421875, 27.078125]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 5.0, 1.0, 4.0, 3.0, 8.0, 7.0, 13.0, 13.0, 16.0, 32.0, 28.0, 28.0, 45.0, 62.0, 95.0, 115.0, 161.0, 187.0, 337.0, 609.0, 2074.0, 98432.0, 3023566.0, 17195.0, 1212.0, 479.0, 284.0, 213.0, 120.0, 77.0, 71.0, 36.0, 47.0, 33.0, 31.0, 18.0, 20.0, 7.0, 3.0, 3.0, 8.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-54.4375, -52.8515625, -51.265625, -49.6796875, -48.09375, -46.5078125, -44.921875, -43.3359375, -41.75, -40.1640625, -38.578125, -36.9921875, -35.40625, -33.8203125, -32.234375, -30.6484375, -29.0625, -27.4765625, -25.890625, -24.3046875, -22.71875, -21.1328125, -19.546875, -17.9609375, -16.375, -14.7890625, -13.203125, -11.6171875, -10.03125, -8.4453125, -6.859375, -5.2734375, -3.6875, -2.1015625, -0.515625, 1.0703125, 2.65625, 4.2421875, 5.828125, 7.4140625, 9.0, 10.5859375, 12.171875, 13.7578125, 15.34375, 16.9296875, 18.515625, 20.1015625, 21.6875, 23.2734375, 24.859375, 26.4453125, 28.03125, 29.6171875, 31.203125, 32.7890625, 34.375, 35.9609375, 37.546875, 39.1328125, 40.71875, 42.3046875, 43.890625, 45.4765625, 47.0625]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 141.0, 845.0, 28.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-445.35626220703125, -437.0059814453125, -428.6556701660156, -420.3053894042969, -411.9551086425781, -403.60479736328125, -395.2545166015625, -386.90423583984375, -378.5539245605469, -370.2036437988281, -361.85333251953125, -353.5030517578125, -345.15277099609375, -336.8024597167969, -328.4521789550781, -320.1018981933594, -311.7515869140625, -303.40130615234375, -295.0509948730469, -286.7007141113281, -278.3504333496094, -270.0001220703125, -261.64984130859375, -253.29954528808594, -244.94927978515625, -236.59898376464844, -228.2487030029297, -219.89840698242188, -211.54811096191406, -203.19781494140625, -194.8475341796875, -186.4972381591797, -178.14697265625, -169.7966766357422, -161.44639587402344, -153.09609985351562, -144.7458038330078, -136.3955078125, -128.04522705078125, -119.69493103027344, -111.34463500976562, -102.99434661865234, -94.64405059814453, -86.29376220703125, -77.94346618652344, -69.59317779541016, -61.242889404296875, -52.89259719848633, -44.54230499267578, -36.192012786865234, -27.84172248840332, -19.491432189941406, -11.14113998413086, -2.7908477783203125, 5.559440612792969, 13.909732818603516, 22.260025024414062, 30.61031723022461, 38.960609436035156, 47.31089782714844, 55.661190032958984, 64.01148223876953, 72.36177062988281, 80.71206665039062, 89.0623550415039]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 6.0, 3.0, 6.0, 9.0, 8.0, 14.0, 4.0, 16.0, 10.0, 26.0, 22.0, 27.0, 24.0, 23.0, 25.0, 38.0, 41.0, 31.0, 33.0, 38.0, 49.0, 43.0, 41.0, 45.0, 34.0, 34.0, 33.0, 34.0, 38.0, 26.0, 18.0, 33.0, 20.0, 25.0, 21.0, 14.0, 17.0, 9.0, 16.0, 11.0, 9.0, 9.0, 8.0, 4.0, 2.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-63.102821350097656, -61.157371520996094, -59.211917877197266, -57.2664680480957, -55.321014404296875, -53.37556457519531, -51.430110931396484, -49.48466110229492, -47.539207458496094, -45.59375762939453, -43.6483039855957, -41.70285415649414, -39.75740051269531, -37.81195068359375, -35.86649703979492, -33.92104721069336, -31.975595474243164, -30.03014373779297, -28.084692001342773, -26.139240264892578, -24.193788528442383, -22.248336791992188, -20.302886962890625, -18.357433319091797, -16.411983489990234, -14.466531753540039, -12.521080017089844, -10.575628280639648, -8.630176544189453, -6.684725761413574, -4.739274024963379, -2.7938222885131836, -0.8483695983886719, 1.0970820188522339, 3.0425336360931396, 4.987985134124756, 6.933436870574951, 8.878888130187988, 10.824339866638184, 12.769791603088379, 14.715243339538574, 16.660694122314453, 18.60614585876465, 20.551597595214844, 22.49704933166504, 24.442501068115234, 26.38795280456543, 28.333404541015625, 30.27885627746582, 32.224308013916016, 34.16975784301758, 36.115211486816406, 38.06066131591797, 40.0061149597168, 41.95156478881836, 43.89701843261719, 45.84246826171875, 47.78791809082031, 49.73337173461914, 51.6788215637207, 53.62427520751953, 55.569725036621094, 57.51517868041992, 59.460628509521484, 61.40608215332031]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 2.0, 2.0, 4.0, 6.0, 5.0, 7.0, 15.0, 18.0, 15.0, 19.0, 21.0, 31.0, 36.0, 34.0, 30.0, 36.0, 50.0, 51.0, 43.0, 64.0, 37.0, 52.0, 66.0, 41.0, 44.0, 46.0, 28.0, 33.0, 22.0, 22.0, 19.0, 25.0, 19.0, 13.0, 11.0, 4.0, 9.0, 5.0, 2.0, 7.0, 3.0, 6.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8984375, -9.5826416015625, -9.266845703125, -8.9510498046875, -8.63525390625, -8.3194580078125, -8.003662109375, -7.6878662109375, -7.3720703125, -7.0562744140625, -6.740478515625, -6.4246826171875, -6.10888671875, -5.7930908203125, -5.477294921875, -5.1614990234375, -4.845703125, -4.5299072265625, -4.214111328125, -3.8983154296875, -3.58251953125, -3.2667236328125, -2.950927734375, -2.6351318359375, -2.3193359375, -2.0035400390625, -1.687744140625, -1.3719482421875, -1.05615234375, -0.7403564453125, -0.424560546875, -0.1087646484375, 0.20703125, 0.5228271484375, 0.838623046875, 1.1544189453125, 1.47021484375, 1.7860107421875, 2.101806640625, 2.4176025390625, 2.7333984375, 3.0491943359375, 3.364990234375, 3.6807861328125, 3.99658203125, 4.3123779296875, 4.628173828125, 4.9439697265625, 5.259765625, 5.5755615234375, 5.891357421875, 6.2071533203125, 6.52294921875, 6.8387451171875, 7.154541015625, 7.4703369140625, 7.7861328125, 8.1019287109375, 8.417724609375, 8.7335205078125, 9.04931640625, 9.3651123046875, 9.680908203125, 9.9967041015625, 10.3125]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 6.0, 3.0, 12.0, 4.0, 13.0, 13.0, 16.0, 21.0, 27.0, 22.0, 32.0, 44.0, 56.0, 79.0, 105.0, 201.0, 515.0, 1993.0, 14759.0, 415658.0, 3486065.0, 260233.0, 11623.0, 1709.0, 476.0, 171.0, 89.0, 70.0, 47.0, 43.0, 39.0, 32.0, 22.0, 16.0, 15.0, 13.0, 11.0, 8.0, 5.0, 5.0, 5.0, 4.0, 3.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.203125, -28.2744140625, -27.345703125, -26.4169921875, -25.48828125, -24.5595703125, -23.630859375, -22.7021484375, -21.7734375, -20.8447265625, -19.916015625, -18.9873046875, -18.05859375, -17.1298828125, -16.201171875, -15.2724609375, -14.34375, -13.4150390625, -12.486328125, -11.5576171875, -10.62890625, -9.7001953125, -8.771484375, -7.8427734375, -6.9140625, -5.9853515625, -5.056640625, -4.1279296875, -3.19921875, -2.2705078125, -1.341796875, -0.4130859375, 0.515625, 1.4443359375, 2.373046875, 3.3017578125, 4.23046875, 5.1591796875, 6.087890625, 7.0166015625, 7.9453125, 8.8740234375, 9.802734375, 10.7314453125, 11.66015625, 12.5888671875, 13.517578125, 14.4462890625, 15.375, 16.3037109375, 17.232421875, 18.1611328125, 19.08984375, 20.0185546875, 20.947265625, 21.8759765625, 22.8046875, 23.7333984375, 24.662109375, 25.5908203125, 26.51953125, 27.4482421875, 28.376953125, 29.3056640625, 30.234375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 7.0, 3.0, 4.0, 4.0, 8.0, 13.0, 8.0, 16.0, 21.0, 22.0, 30.0, 33.0, 39.0, 72.0, 80.0, 101.0, 131.0, 145.0, 210.0, 290.0, 323.0, 365.0, 402.0, 394.0, 299.0, 236.0, 169.0, 156.0, 97.0, 86.0, 60.0, 53.0, 44.0, 40.0, 24.0, 22.0, 23.0, 4.0, 15.0, 13.0, 4.0, 7.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.015625, -12.613037109375, -12.21044921875, -11.807861328125, -11.4052734375, -11.002685546875, -10.60009765625, -10.197509765625, -9.794921875, -9.392333984375, -8.98974609375, -8.587158203125, -8.1845703125, -7.781982421875, -7.37939453125, -6.976806640625, -6.57421875, -6.171630859375, -5.76904296875, -5.366455078125, -4.9638671875, -4.561279296875, -4.15869140625, -3.756103515625, -3.353515625, -2.950927734375, -2.54833984375, -2.145751953125, -1.7431640625, -1.340576171875, -0.93798828125, -0.535400390625, -0.1328125, 0.269775390625, 0.67236328125, 1.074951171875, 1.4775390625, 1.880126953125, 2.28271484375, 2.685302734375, 3.087890625, 3.490478515625, 3.89306640625, 4.295654296875, 4.6982421875, 5.100830078125, 5.50341796875, 5.906005859375, 6.30859375, 6.711181640625, 7.11376953125, 7.516357421875, 7.9189453125, 8.321533203125, 8.72412109375, 9.126708984375, 9.529296875, 9.931884765625, 10.33447265625, 10.737060546875, 11.1396484375, 11.542236328125, 11.94482421875, 12.347412109375, 12.75]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 4.0, 7.0, 11.0, 13.0, 18.0, 30.0, 28.0, 62.0, 82.0, 110.0, 122.0, 209.0, 308.0, 498.0, 1761.0, 679453.0, 3506693.0, 3191.0, 585.0, 330.0, 212.0, 149.0, 129.0, 73.0, 59.0, 54.0, 32.0, 16.0, 14.0, 13.0, 6.0, 8.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-114.4375, -111.2666015625, -108.095703125, -104.9248046875, -101.75390625, -98.5830078125, -95.412109375, -92.2412109375, -89.0703125, -85.8994140625, -82.728515625, -79.5576171875, -76.38671875, -73.2158203125, -70.044921875, -66.8740234375, -63.703125, -60.5322265625, -57.361328125, -54.1904296875, -51.01953125, -47.8486328125, -44.677734375, -41.5068359375, -38.3359375, -35.1650390625, -31.994140625, -28.8232421875, -25.65234375, -22.4814453125, -19.310546875, -16.1396484375, -12.96875, -9.7978515625, -6.626953125, -3.4560546875, -0.28515625, 2.8857421875, 6.056640625, 9.2275390625, 12.3984375, 15.5693359375, 18.740234375, 21.9111328125, 25.08203125, 28.2529296875, 31.423828125, 34.5947265625, 37.765625, 40.9365234375, 44.107421875, 47.2783203125, 50.44921875, 53.6201171875, 56.791015625, 59.9619140625, 63.1328125, 66.3037109375, 69.474609375, 72.6455078125, 75.81640625, 78.9873046875, 82.158203125, 85.3291015625, 88.5]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 59.0, 459.0, 438.0, 55.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-451.9886169433594, -442.93896484375, -433.8892822265625, -424.8396301269531, -415.78997802734375, -406.74029541015625, -397.6906433105469, -388.6409912109375, -379.59130859375, -370.5416564941406, -361.4919738769531, -352.44232177734375, -343.3926696777344, -334.343017578125, -325.2933349609375, -316.2436828613281, -307.19403076171875, -298.1443786621094, -289.0946960449219, -280.0450439453125, -270.9953918457031, -261.94573974609375, -252.89605712890625, -243.84640502929688, -234.79673767089844, -225.7470703125, -216.69741821289062, -207.6477508544922, -198.59808349609375, -189.54843139648438, -180.49876403808594, -171.4490966796875, -162.39944458007812, -153.3497772216797, -144.3001251220703, -135.25045776367188, -126.20079803466797, -117.15113830566406, -108.10147094726562, -99.05181121826172, -90.00215148925781, -80.9524917602539, -71.90283203125, -62.85316467285156, -53.803504943847656, -44.75384521484375, -35.70418167114258, -26.654518127441406, -17.6048583984375, -8.555196762084961, 0.4944648742675781, 9.544126510620117, 18.593788146972656, 27.643447875976562, 36.693111419677734, 45.742774963378906, 54.79243469238281, 63.84209442138672, 72.89175415039062, 81.94142150878906, 90.99108123779297, 100.04074096679688, 109.09040832519531, 118.14006805419922, 127.18972778320312]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 6.0, 3.0, 4.0, 10.0, 9.0, 12.0, 12.0, 12.0, 14.0, 10.0, 23.0, 20.0, 31.0, 38.0, 33.0, 32.0, 35.0, 28.0, 40.0, 34.0, 35.0, 44.0, 32.0, 36.0, 50.0, 38.0, 31.0, 40.0, 45.0, 30.0, 33.0, 22.0, 28.0, 27.0, 20.0, 13.0, 19.0, 15.0, 12.0, 6.0, 3.0, 3.0, 4.0, 5.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.2247314453125, -50.460514068603516, -48.69629669189453, -46.93207931518555, -45.16786193847656, -43.40364456176758, -41.639427185058594, -39.87520980834961, -38.110992431640625, -36.34677505493164, -34.582557678222656, -32.81834030151367, -31.054122924804688, -29.289905548095703, -27.52568817138672, -25.761470794677734, -23.99725341796875, -22.233036041259766, -20.46881866455078, -18.704601287841797, -16.940383911132812, -15.176166534423828, -13.411949157714844, -11.64773178100586, -9.883514404296875, -8.11929702758789, -6.355079650878906, -4.590862274169922, -2.8266448974609375, -1.0624275207519531, 0.7017898559570312, 2.4660072326660156, 4.230224609375, 5.994441986083984, 7.758659362792969, 9.522876739501953, 11.287094116210938, 13.051311492919922, 14.815528869628906, 16.57974624633789, 18.343963623046875, 20.10818099975586, 21.872398376464844, 23.636615753173828, 25.400833129882812, 27.165050506591797, 28.92926788330078, 30.693485260009766, 32.45770263671875, 34.221920013427734, 35.98613739013672, 37.7503547668457, 39.51457214355469, 41.27878952026367, 43.043006896972656, 44.80722427368164, 46.571441650390625, 48.33565902709961, 50.099876403808594, 51.86409378051758, 53.62831115722656, 55.39252853393555, 57.15674591064453, 58.920963287353516, 60.6851806640625]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 10.0, 11.0, 8.0, 10.0, 11.0, 11.0, 15.0, 13.0, 27.0, 17.0, 25.0, 24.0, 34.0, 28.0, 34.0, 38.0, 38.0, 52.0, 44.0, 48.0, 51.0, 35.0, 35.0, 43.0, 32.0, 39.0, 41.0, 28.0, 34.0, 24.0, 24.0, 22.0, 13.0, 15.0, 18.0, 10.0, 5.0, 7.0, 4.0, 6.0, 8.0, 2.0, 3.0, 0.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.96875, -8.680419921875, -8.39208984375, -8.103759765625, -7.8154296875, -7.527099609375, -7.23876953125, -6.950439453125, -6.662109375, -6.373779296875, -6.08544921875, -5.797119140625, -5.5087890625, -5.220458984375, -4.93212890625, -4.643798828125, -4.35546875, -4.067138671875, -3.77880859375, -3.490478515625, -3.2021484375, -2.913818359375, -2.62548828125, -2.337158203125, -2.048828125, -1.760498046875, -1.47216796875, -1.183837890625, -0.8955078125, -0.607177734375, -0.31884765625, -0.030517578125, 0.2578125, 0.546142578125, 0.83447265625, 1.122802734375, 1.4111328125, 1.699462890625, 1.98779296875, 2.276123046875, 2.564453125, 2.852783203125, 3.14111328125, 3.429443359375, 3.7177734375, 4.006103515625, 4.29443359375, 4.582763671875, 4.87109375, 5.159423828125, 5.44775390625, 5.736083984375, 6.0244140625, 6.312744140625, 6.60107421875, 6.889404296875, 7.177734375, 7.466064453125, 7.75439453125, 8.042724609375, 8.3310546875, 8.619384765625, 8.90771484375, 9.196044921875, 9.484375]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 5.0, 4.0, 10.0, 7.0, 12.0, 28.0, 51.0, 70.0, 95.0, 128.0, 176.0, 270.0, 406.0, 580.0, 811.0, 1172.0, 1700.0, 2486.0, 3588.0, 5080.0, 7388.0, 10870.0, 15664.0, 22916.0, 33509.0, 50646.0, 77827.0, 122904.0, 185820.0, 173623.0, 112405.0, 71793.0, 46814.0, 31608.0, 21249.0, 14335.0, 10050.0, 6839.0, 4801.0, 3344.0, 2232.0, 1660.0, 1135.0, 775.0, 534.0, 350.0, 249.0, 178.0, 110.0, 86.0, 64.0, 35.0, 32.0, 21.0, 9.0, 8.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.1494140625, -1.1133880615234375, -1.077362060546875, -1.0413360595703125, -1.00531005859375, -0.9692840576171875, -0.933258056640625, -0.8972320556640625, -0.8612060546875, -0.8251800537109375, -0.789154052734375, -0.7531280517578125, -0.71710205078125, -0.6810760498046875, -0.645050048828125, -0.6090240478515625, -0.572998046875, -0.5369720458984375, -0.500946044921875, -0.4649200439453125, -0.42889404296875, -0.3928680419921875, -0.356842041015625, -0.3208160400390625, -0.2847900390625, -0.2487640380859375, -0.212738037109375, -0.1767120361328125, -0.14068603515625, -0.1046600341796875, -0.068634033203125, -0.0326080322265625, 0.00341796875, 0.0394439697265625, 0.075469970703125, 0.1114959716796875, 0.14752197265625, 0.1835479736328125, 0.219573974609375, 0.2555999755859375, 0.2916259765625, 0.3276519775390625, 0.363677978515625, 0.3997039794921875, 0.43572998046875, 0.4717559814453125, 0.507781982421875, 0.5438079833984375, 0.579833984375, 0.6158599853515625, 0.651885986328125, 0.6879119873046875, 0.72393798828125, 0.7599639892578125, 0.795989990234375, 0.8320159912109375, 0.8680419921875, 0.9040679931640625, 0.940093994140625, 0.9761199951171875, 1.01214599609375, 1.0481719970703125, 1.084197998046875, 1.1202239990234375, 1.15625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 6.0, 3.0, 6.0, 5.0, 10.0, 13.0, 10.0, 8.0, 17.0, 28.0, 24.0, 25.0, 15.0, 26.0, 42.0, 48.0, 36.0, 24.0, 39.0, 43.0, 1072.0, 47.0, 45.0, 44.0, 45.0, 47.0, 42.0, 36.0, 36.0, 26.0, 26.0, 19.0, 25.0, 16.0, 16.0, 20.0, 13.0, 8.0, 9.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.2421875, -6.040771484375, -5.83935546875, -5.637939453125, -5.4365234375, -5.235107421875, -5.03369140625, -4.832275390625, -4.630859375, -4.429443359375, -4.22802734375, -4.026611328125, -3.8251953125, -3.623779296875, -3.42236328125, -3.220947265625, -3.01953125, -2.818115234375, -2.61669921875, -2.415283203125, -2.2138671875, -2.012451171875, -1.81103515625, -1.609619140625, -1.408203125, -1.206787109375, -1.00537109375, -0.803955078125, -0.6025390625, -0.401123046875, -0.19970703125, 0.001708984375, 0.203125, 0.404541015625, 0.60595703125, 0.807373046875, 1.0087890625, 1.210205078125, 1.41162109375, 1.613037109375, 1.814453125, 2.015869140625, 2.21728515625, 2.418701171875, 2.6201171875, 2.821533203125, 3.02294921875, 3.224365234375, 3.42578125, 3.627197265625, 3.82861328125, 4.030029296875, 4.2314453125, 4.432861328125, 4.63427734375, 4.835693359375, 5.037109375, 5.238525390625, 5.43994140625, 5.641357421875, 5.8427734375, 6.044189453125, 6.24560546875, 6.447021484375, 6.6484375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 12.0, 6.0, 20.0, 16.0, 29.0, 36.0, 73.0, 126.0, 182.0, 288.0, 468.0, 734.0, 1217.0, 2053.0, 3413.0, 5709.0, 9746.0, 15985.0, 27145.0, 47282.0, 83181.0, 146196.0, 1293279.0, 196277.0, 111710.0, 63051.0, 36132.0, 21382.0, 12450.0, 7497.0, 4601.0, 2617.0, 1635.0, 967.0, 612.0, 396.0, 212.0, 152.0, 74.0, 63.0, 47.0, 23.0, 17.0, 14.0, 3.0, 5.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.533203125, -1.4864044189453125, -1.439605712890625, -1.3928070068359375, -1.34600830078125, -1.2992095947265625, -1.252410888671875, -1.2056121826171875, -1.1588134765625, -1.1120147705078125, -1.065216064453125, -1.0184173583984375, -0.97161865234375, -0.9248199462890625, -0.878021240234375, -0.8312225341796875, -0.784423828125, -0.7376251220703125, -0.690826416015625, -0.6440277099609375, -0.59722900390625, -0.5504302978515625, -0.503631591796875, -0.4568328857421875, -0.4100341796875, -0.3632354736328125, -0.316436767578125, -0.2696380615234375, -0.22283935546875, -0.1760406494140625, -0.129241943359375, -0.0824432373046875, -0.03564453125, 0.0111541748046875, 0.057952880859375, 0.1047515869140625, 0.15155029296875, 0.1983489990234375, 0.245147705078125, 0.2919464111328125, 0.3387451171875, 0.3855438232421875, 0.432342529296875, 0.4791412353515625, 0.52593994140625, 0.5727386474609375, 0.619537353515625, 0.6663360595703125, 0.713134765625, 0.7599334716796875, 0.806732177734375, 0.8535308837890625, 0.90032958984375, 0.9471282958984375, 0.993927001953125, 1.0407257080078125, 1.0875244140625, 1.1343231201171875, 1.181121826171875, 1.2279205322265625, 1.27471923828125, 1.3215179443359375, 1.368316650390625, 1.4151153564453125, 1.4619140625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 5.0, 8.0, 8.0, 6.0, 10.0, 11.0, 22.0, 19.0, 21.0, 34.0, 47.0, 58.0, 57.0, 72.0, 69.0, 96.0, 77.0, 59.0, 69.0, 51.0, 44.0, 37.0, 25.0, 21.0, 16.0, 9.0, 13.0, 4.0, 4.0, 7.0, 7.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.002986907958984375, -0.002899855375289917, -0.002812802791595459, -0.002725750207901001, -0.002638697624206543, -0.002551645040512085, -0.002464592456817627, -0.002377539873123169, -0.002290487289428711, -0.002203434705734253, -0.002116382122039795, -0.002029329538345337, -0.001942276954650879, -0.001855224370956421, -0.0017681717872619629, -0.0016811192035675049, -0.0015940666198730469, -0.0015070140361785889, -0.0014199614524841309, -0.0013329088687896729, -0.0012458562850952148, -0.0011588037014007568, -0.0010717511177062988, -0.0009846985340118408, -0.0008976459503173828, -0.0008105933666229248, -0.0007235407829284668, -0.0006364881992340088, -0.0005494356155395508, -0.0004623830318450928, -0.00037533044815063477, -0.00028827786445617676, -0.00020122528076171875, -0.00011417269706726074, -2.7120113372802734e-05, 5.9932470321655273e-05, 0.00014698505401611328, 0.0002340376377105713, 0.0003210902214050293, 0.0004081428050994873, 0.0004951953887939453, 0.0005822479724884033, 0.0006693005561828613, 0.0007563531398773193, 0.0008434057235717773, 0.0009304583072662354, 0.0010175108909606934, 0.0011045634746551514, 0.0011916160583496094, 0.0012786686420440674, 0.0013657212257385254, 0.0014527738094329834, 0.0015398263931274414, 0.0016268789768218994, 0.0017139315605163574, 0.0018009841442108154, 0.0018880367279052734, 0.0019750893115997314, 0.0020621418952941895, 0.0021491944789886475, 0.0022362470626831055, 0.0023232996463775635, 0.0024103522300720215, 0.0024974048137664795, 0.0025844573974609375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 1.0, 5.0, 6.0, 12.0, 8.0, 11.0, 7.0, 20.0, 40.0, 21.0, 60.0, 92.0, 127.0, 158.0, 346.0, 911.0, 299970.0, 744794.0, 1038.0, 339.0, 176.0, 115.0, 76.0, 55.0, 35.0, 27.0, 22.0, 19.0, 8.0, 12.0, 5.0, 10.0, 6.0, 1.0, 4.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.056793212890625, -0.054837703704833984, -0.05288219451904297, -0.05092668533325195, -0.04897117614746094, -0.04701566696166992, -0.045060157775878906, -0.04310464859008789, -0.041149139404296875, -0.03919363021850586, -0.037238121032714844, -0.03528261184692383, -0.03332710266113281, -0.0313715934753418, -0.02941608428955078, -0.027460575103759766, -0.02550506591796875, -0.023549556732177734, -0.02159404754638672, -0.019638538360595703, -0.017683029174804688, -0.015727519989013672, -0.013772010803222656, -0.01181650161743164, -0.009860992431640625, -0.00790548324584961, -0.005949974060058594, -0.003994464874267578, -0.0020389556884765625, -8.344650268554688e-05, 0.0018720626831054688, 0.0038275718688964844, 0.0057830810546875, 0.007738590240478516, 0.009694099426269531, 0.011649608612060547, 0.013605117797851562, 0.015560626983642578, 0.017516136169433594, 0.01947164535522461, 0.021427154541015625, 0.02338266372680664, 0.025338172912597656, 0.027293682098388672, 0.029249191284179688, 0.031204700469970703, 0.03316020965576172, 0.035115718841552734, 0.03707122802734375, 0.039026737213134766, 0.04098224639892578, 0.0429377555847168, 0.04489326477050781, 0.04684877395629883, 0.048804283142089844, 0.05075979232788086, 0.052715301513671875, 0.05467081069946289, 0.056626319885253906, 0.05858182907104492, 0.06053733825683594, 0.06249284744262695, 0.06444835662841797, 0.06640386581420898, 0.068359375]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 7.0, 7.0, 23.0, 79.0, 169.0, 276.0, 230.0, 142.0, 59.0, 20.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006881483714096248, -0.0006108620436862111, -0.0005335757159627974, -0.0004562893882393837, -0.00037900306051597, -0.0003017167327925563, -0.00022443040506914258, -0.00014714407734572887, -6.985774962231517e-05, 7.4285781010985374e-06, 8.471490582451224e-05, 0.00016200123354792595, 0.00023928756127133965, 0.00031657388899475336, 0.00039386021671816707, 0.00047114654444158077, 0.0005484328721649945, 0.0006257191998884082, 0.0007030055276118219, 0.0007802918553352356, 0.0008575781830586493, 0.000934864510782063, 0.0010121508967131376, 0.0010894371662288904, 0.0011667234357446432, 0.001244009705260396, 0.0013212960911914706, 0.0013985824771225452, 0.001475868746638298, 0.0015531550161540508, 0.0016304414020851254, 0.0017077277880162, 0.0017850142903625965, 0.0018623005598783493, 0.001939586945809424, 0.0020168733317404985, 0.0020941596012562513, 0.002171445870772004, 0.0022487323731184006, 0.0023260186426341534, 0.002403304912149906, 0.002480591181665659, 0.0025578774511814117, 0.002635163953527808, 0.002712450223043561, 0.0027897364925593138, 0.0028670229949057102, 0.002944309264421463, 0.003021595533937216, 0.0030988818034529686, 0.0031761680729687214, 0.003253454575315118, 0.0033307408448308706, 0.0034080271143466234, 0.00348531361669302, 0.0035625998862087727, 0.0036398861557245255, 0.0037171724252402782, 0.003794458694756031, 0.0038717451971024275, 0.003949031233787537, 0.004026317968964577, 0.0041036042384803295, 0.004180890507996082, 0.004258176777511835]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 4.0, 6.0, 11.0, 8.0, 11.0, 10.0, 15.0, 9.0, 18.0, 21.0, 27.0, 27.0, 36.0, 39.0, 40.0, 37.0, 40.0, 46.0, 36.0, 44.0, 32.0, 42.0, 56.0, 29.0, 46.0, 36.0, 37.0, 28.0, 29.0, 36.0, 29.0, 28.0, 14.0, 14.0, 11.0, 14.0, 11.0, 7.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.001127481460571289, -0.0010868236422538757, -0.0010461658239364624, -0.001005508005619049, -0.0009648501873016357, -0.0009241923689842224, -0.0008835345506668091, -0.0008428767323493958, -0.0008022189140319824, -0.0007615610957145691, -0.0007209032773971558, -0.0006802454590797424, -0.0006395876407623291, -0.0005989298224449158, -0.0005582720041275024, -0.0005176141858100891, -0.0004769563674926758, -0.00043629854917526245, -0.0003956407308578491, -0.0003549829125404358, -0.00031432509422302246, -0.00027366727590560913, -0.0002330094575881958, -0.00019235163927078247, -0.00015169382095336914, -0.00011103600263595581, -7.037818431854248e-05, -2.972036600112915e-05, 1.093745231628418e-05, 5.159527063369751e-05, 9.225308895111084e-05, 0.00013291090726852417, 0.0001735687255859375, 0.00021422654390335083, 0.00025488436222076416, 0.0002955421805381775, 0.0003361999988555908, 0.00037685781717300415, 0.0004175156354904175, 0.0004581734538078308, 0.0004988312721252441, 0.0005394890904426575, 0.0005801469087600708, 0.0006208047270774841, 0.0006614625453948975, 0.0007021203637123108, 0.0007427781820297241, 0.0007834360003471375, 0.0008240938186645508, 0.0008647516369819641, 0.0009054094552993774, 0.0009460672736167908, 0.000986725091934204, 0.0010273829102516174, 0.0010680407285690308, 0.001108698546886444, 0.0011493563652038574, 0.0011900141835212708, 0.001230672001838684, 0.0012713298201560974, 0.0013119876384735107, 0.001352645456790924, 0.0013933032751083374, 0.0014339610934257507, 0.001474618911743164]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 10.0, 11.0, 8.0, 10.0, 11.0, 11.0, 15.0, 13.0, 27.0, 17.0, 25.0, 24.0, 34.0, 28.0, 34.0, 38.0, 38.0, 52.0, 44.0, 48.0, 51.0, 35.0, 35.0, 43.0, 32.0, 39.0, 41.0, 28.0, 34.0, 24.0, 24.0, 22.0, 13.0, 15.0, 18.0, 10.0, 5.0, 7.0, 4.0, 6.0, 8.0, 3.0, 2.0, 0.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.96875, -8.680419921875, -8.39208984375, -8.103759765625, -7.8154296875, -7.527099609375, -7.23876953125, -6.950439453125, -6.662109375, -6.373779296875, -6.08544921875, -5.797119140625, -5.5087890625, -5.220458984375, -4.93212890625, -4.643798828125, -4.35546875, -4.067138671875, -3.77880859375, -3.490478515625, -3.2021484375, -2.913818359375, -2.62548828125, -2.337158203125, -2.048828125, -1.760498046875, -1.47216796875, -1.183837890625, -0.8955078125, -0.607177734375, -0.31884765625, -0.030517578125, 0.2578125, 0.546142578125, 0.83447265625, 1.122802734375, 1.4111328125, 1.699462890625, 1.98779296875, 2.276123046875, 2.564453125, 2.852783203125, 3.14111328125, 3.429443359375, 3.7177734375, 4.006103515625, 4.29443359375, 4.582763671875, 4.87109375, 5.159423828125, 5.44775390625, 5.736083984375, 6.0244140625, 6.312744140625, 6.60107421875, 6.889404296875, 7.177734375, 7.466064453125, 7.75439453125, 8.042724609375, 8.3310546875, 8.619384765625, 8.90771484375, 9.196044921875, 9.484375]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 10.0, 15.0, 11.0, 16.0, 10.0, 18.0, 22.0, 30.0, 31.0, 55.0, 62.0, 101.0, 138.0, 166.0, 314.0, 585.0, 1560.0, 5686.0, 31413.0, 314460.0, 630879.0, 50619.0, 8535.0, 1991.0, 704.0, 327.0, 228.0, 160.0, 98.0, 74.0, 52.0, 51.0, 29.0, 29.0, 19.0, 7.0, 13.0, 7.0, 7.0, 4.0, 9.0, 4.0, 1.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.75, -17.1796875, -16.609375, -16.0390625, -15.46875, -14.8984375, -14.328125, -13.7578125, -13.1875, -12.6171875, -12.046875, -11.4765625, -10.90625, -10.3359375, -9.765625, -9.1953125, -8.625, -8.0546875, -7.484375, -6.9140625, -6.34375, -5.7734375, -5.203125, -4.6328125, -4.0625, -3.4921875, -2.921875, -2.3515625, -1.78125, -1.2109375, -0.640625, -0.0703125, 0.5, 1.0703125, 1.640625, 2.2109375, 2.78125, 3.3515625, 3.921875, 4.4921875, 5.0625, 5.6328125, 6.203125, 6.7734375, 7.34375, 7.9140625, 8.484375, 9.0546875, 9.625, 10.1953125, 10.765625, 11.3359375, 11.90625, 12.4765625, 13.046875, 13.6171875, 14.1875, 14.7578125, 15.328125, 15.8984375, 16.46875, 17.0390625, 17.609375, 18.1796875, 18.75]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 0.0, 2.0, 6.0, 5.0, 6.0, 10.0, 6.0, 10.0, 13.0, 17.0, 21.0, 21.0, 27.0, 18.0, 38.0, 25.0, 33.0, 35.0, 54.0, 51.0, 82.0, 145.0, 1569.0, 334.0, 89.0, 65.0, 37.0, 48.0, 44.0, 33.0, 28.0, 25.0, 19.0, 22.0, 25.0, 15.0, 16.0, 13.0, 10.0, 4.0, 6.0, 4.0, 3.0, 3.0, 5.0, 5.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-27.6875, -26.819580078125, -25.95166015625, -25.083740234375, -24.2158203125, -23.347900390625, -22.47998046875, -21.612060546875, -20.744140625, -19.876220703125, -19.00830078125, -18.140380859375, -17.2724609375, -16.404541015625, -15.53662109375, -14.668701171875, -13.80078125, -12.932861328125, -12.06494140625, -11.197021484375, -10.3291015625, -9.461181640625, -8.59326171875, -7.725341796875, -6.857421875, -5.989501953125, -5.12158203125, -4.253662109375, -3.3857421875, -2.517822265625, -1.64990234375, -0.781982421875, 0.0859375, 0.953857421875, 1.82177734375, 2.689697265625, 3.5576171875, 4.425537109375, 5.29345703125, 6.161376953125, 7.029296875, 7.897216796875, 8.76513671875, 9.633056640625, 10.5009765625, 11.368896484375, 12.23681640625, 13.104736328125, 13.97265625, 14.840576171875, 15.70849609375, 16.576416015625, 17.4443359375, 18.312255859375, 19.18017578125, 20.048095703125, 20.916015625, 21.783935546875, 22.65185546875, 23.519775390625, 24.3876953125, 25.255615234375, 26.12353515625, 26.991455078125, 27.859375]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 6.0, 4.0, 5.0, 3.0, 4.0, 9.0, 8.0, 8.0, 13.0, 18.0, 30.0, 32.0, 29.0, 41.0, 43.0, 48.0, 92.0, 108.0, 160.0, 329.0, 759.0, 5474.0, 2742113.0, 391317.0, 3439.0, 640.0, 316.0, 189.0, 97.0, 67.0, 64.0, 47.0, 29.0, 38.0, 28.0, 28.0, 15.0, 13.0, 11.0, 9.0, 5.0, 7.0, 7.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-64.5625, -62.5390625, -60.515625, -58.4921875, -56.46875, -54.4453125, -52.421875, -50.3984375, -48.375, -46.3515625, -44.328125, -42.3046875, -40.28125, -38.2578125, -36.234375, -34.2109375, -32.1875, -30.1640625, -28.140625, -26.1171875, -24.09375, -22.0703125, -20.046875, -18.0234375, -16.0, -13.9765625, -11.953125, -9.9296875, -7.90625, -5.8828125, -3.859375, -1.8359375, 0.1875, 2.2109375, 4.234375, 6.2578125, 8.28125, 10.3046875, 12.328125, 14.3515625, 16.375, 18.3984375, 20.421875, 22.4453125, 24.46875, 26.4921875, 28.515625, 30.5390625, 32.5625, 34.5859375, 36.609375, 38.6328125, 40.65625, 42.6796875, 44.703125, 46.7265625, 48.75, 50.7734375, 52.796875, 54.8203125, 56.84375, 58.8671875, 60.890625, 62.9140625, 64.9375]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 42.0, 471.0, 454.0, 44.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-128.8292999267578, -123.87491607666016, -118.9205322265625, -113.96614837646484, -109.01176452636719, -104.05738067626953, -99.10299682617188, -94.14860534667969, -89.19422912597656, -84.2398452758789, -79.28546142578125, -74.3310775756836, -69.37669372558594, -64.42230987548828, -59.46792221069336, -54.5135383605957, -49.55915069580078, -44.604766845703125, -39.65038299560547, -34.69599914550781, -29.741613388061523, -24.787229537963867, -19.832843780517578, -14.878459930419922, -9.924076080322266, -4.969691753387451, -0.015307426452636719, 4.939077377319336, 9.893461227416992, 14.847845077514648, 19.802230834960938, 24.756614685058594, 29.71099853515625, 34.665382385253906, 39.61976623535156, 44.57415008544922, 49.528533935546875, 54.48291778564453, 59.43730545043945, 64.39169311523438, 69.3460693359375, 74.30045318603516, 79.25483703613281, 84.20922088623047, 89.16360473632812, 94.11798858642578, 99.07237243652344, 104.02676391601562, 108.98114776611328, 113.93553161621094, 118.8899154663086, 123.84429931640625, 128.79869079589844, 133.75306701660156, 138.70745849609375, 143.66183471679688, 148.61622619628906, 153.57061767578125, 158.52499389648438, 163.47938537597656, 168.4337615966797, 173.38815307617188, 178.342529296875, 183.2969207763672, 188.2512969970703]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 1.0, 5.0, 8.0, 7.0, 8.0, 10.0, 11.0, 19.0, 10.0, 13.0, 13.0, 18.0, 21.0, 26.0, 27.0, 29.0, 22.0, 35.0, 28.0, 27.0, 31.0, 32.0, 38.0, 36.0, 29.0, 37.0, 32.0, 30.0, 46.0, 29.0, 37.0, 25.0, 21.0, 28.0, 21.0, 17.0, 25.0, 20.0, 12.0, 17.0, 20.0, 12.0, 14.0, 11.0, 7.0, 4.0, 7.0, 7.0, 4.0, 3.0, 4.0, 1.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-59.55815124511719, -57.63398742675781, -55.70982360839844, -53.78565979003906, -51.86149978637695, -49.93733596801758, -48.0131721496582, -46.08900833129883, -44.16484832763672, -42.240684509277344, -40.31652069091797, -38.392356872558594, -36.468196868896484, -34.54403305053711, -32.619869232177734, -30.69570541381836, -28.771541595458984, -26.84737777709961, -24.923215866088867, -22.999052047729492, -21.07489013671875, -19.150726318359375, -17.2265625, -15.302399635314941, -13.378236770629883, -11.454073905944824, -9.529911041259766, -7.605747222900391, -5.681584358215332, -3.7574214935302734, -1.8332576751708984, 0.09090518951416016, 2.0150680541992188, 3.9392311573028564, 5.863394260406494, 7.787557601928711, 9.71172046661377, 11.635883331298828, 13.560047149658203, 15.484210014343262, 17.40837287902832, 19.332536697387695, 21.256698608398438, 23.180862426757812, 25.105026245117188, 27.02918815612793, 28.953351974487305, 30.877513885498047, 32.80167770385742, 34.7258415222168, 36.65000534057617, 38.57416534423828, 40.498329162597656, 42.42249298095703, 44.346656799316406, 46.27082061767578, 48.194984436035156, 50.11914825439453, 52.043312072753906, 53.96747589111328, 55.89163589477539, 57.815799713134766, 59.73996353149414, 61.664127349853516, 63.588287353515625]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 9.0, 7.0, 4.0, 7.0, 6.0, 12.0, 9.0, 11.0, 18.0, 20.0, 27.0, 27.0, 26.0, 28.0, 35.0, 32.0, 36.0, 43.0, 43.0, 52.0, 39.0, 37.0, 37.0, 62.0, 34.0, 38.0, 31.0, 39.0, 34.0, 29.0, 33.0, 20.0, 20.0, 17.0, 18.0, 14.0, 9.0, 12.0, 6.0, 4.0, 5.0, 1.0, 4.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.046875, -8.7479248046875, -8.448974609375, -8.1500244140625, -7.85107421875, -7.5521240234375, -7.253173828125, -6.9542236328125, -6.6552734375, -6.3563232421875, -6.057373046875, -5.7584228515625, -5.45947265625, -5.1605224609375, -4.861572265625, -4.5626220703125, -4.263671875, -3.9647216796875, -3.665771484375, -3.3668212890625, -3.06787109375, -2.7689208984375, -2.469970703125, -2.1710205078125, -1.8720703125, -1.5731201171875, -1.274169921875, -0.9752197265625, -0.67626953125, -0.3773193359375, -0.078369140625, 0.2205810546875, 0.51953125, 0.8184814453125, 1.117431640625, 1.4163818359375, 1.71533203125, 2.0142822265625, 2.313232421875, 2.6121826171875, 2.9111328125, 3.2100830078125, 3.509033203125, 3.8079833984375, 4.10693359375, 4.4058837890625, 4.704833984375, 5.0037841796875, 5.302734375, 5.6016845703125, 5.900634765625, 6.1995849609375, 6.49853515625, 6.7974853515625, 7.096435546875, 7.3953857421875, 7.6943359375, 7.9932861328125, 8.292236328125, 8.5911865234375, 8.89013671875, 9.1890869140625, 9.488037109375, 9.7869873046875, 10.0859375]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 0.0, 1.0, 6.0, 11.0, 8.0, 10.0, 13.0, 11.0, 18.0, 20.0, 18.0, 25.0, 50.0, 46.0, 66.0, 162.0, 318.0, 685.0, 2039.0, 7001.0, 36784.0, 612072.0, 3101198.0, 395110.0, 29288.0, 6170.0, 1808.0, 657.0, 256.0, 106.0, 67.0, 51.0, 42.0, 30.0, 33.0, 17.0, 16.0, 11.0, 9.0, 9.0, 5.0, 6.0, 5.0, 10.0, 0.0, 6.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-25.6875, -24.8955078125, -24.103515625, -23.3115234375, -22.51953125, -21.7275390625, -20.935546875, -20.1435546875, -19.3515625, -18.5595703125, -17.767578125, -16.9755859375, -16.18359375, -15.3916015625, -14.599609375, -13.8076171875, -13.015625, -12.2236328125, -11.431640625, -10.6396484375, -9.84765625, -9.0556640625, -8.263671875, -7.4716796875, -6.6796875, -5.8876953125, -5.095703125, -4.3037109375, -3.51171875, -2.7197265625, -1.927734375, -1.1357421875, -0.34375, 0.4482421875, 1.240234375, 2.0322265625, 2.82421875, 3.6162109375, 4.408203125, 5.2001953125, 5.9921875, 6.7841796875, 7.576171875, 8.3681640625, 9.16015625, 9.9521484375, 10.744140625, 11.5361328125, 12.328125, 13.1201171875, 13.912109375, 14.7041015625, 15.49609375, 16.2880859375, 17.080078125, 17.8720703125, 18.6640625, 19.4560546875, 20.248046875, 21.0400390625, 21.83203125, 22.6240234375, 23.416015625, 24.2080078125, 25.0]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 2.0, 11.0, 18.0, 11.0, 17.0, 23.0, 40.0, 59.0, 95.0, 131.0, 168.0, 272.0, 395.0, 559.0, 620.0, 531.0, 362.0, 254.0, 153.0, 128.0, 78.0, 44.0, 37.0, 24.0, 12.0, 11.0, 10.0, 6.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.65625, -21.02685546875, -20.3974609375, -19.76806640625, -19.138671875, -18.50927734375, -17.8798828125, -17.25048828125, -16.62109375, -15.99169921875, -15.3623046875, -14.73291015625, -14.103515625, -13.47412109375, -12.8447265625, -12.21533203125, -11.5859375, -10.95654296875, -10.3271484375, -9.69775390625, -9.068359375, -8.43896484375, -7.8095703125, -7.18017578125, -6.55078125, -5.92138671875, -5.2919921875, -4.66259765625, -4.033203125, -3.40380859375, -2.7744140625, -2.14501953125, -1.515625, -0.88623046875, -0.2568359375, 0.37255859375, 1.001953125, 1.63134765625, 2.2607421875, 2.89013671875, 3.51953125, 4.14892578125, 4.7783203125, 5.40771484375, 6.037109375, 6.66650390625, 7.2958984375, 7.92529296875, 8.5546875, 9.18408203125, 9.8134765625, 10.44287109375, 11.072265625, 11.70166015625, 12.3310546875, 12.96044921875, 13.58984375, 14.21923828125, 14.8486328125, 15.47802734375, 16.107421875, 16.73681640625, 17.3662109375, 17.99560546875, 18.625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 8.0, 9.0, 12.0, 11.0, 9.0, 27.0, 36.0, 39.0, 66.0, 78.0, 102.0, 141.0, 240.0, 354.0, 942.0, 6287.0, 773787.0, 3397200.0, 12376.0, 1244.0, 471.0, 247.0, 170.0, 111.0, 85.0, 51.0, 48.0, 42.0, 23.0, 19.0, 14.0, 10.0, 9.0, 5.0, 2.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-90.5625, -88.18603515625, -85.8095703125, -83.43310546875, -81.056640625, -78.68017578125, -76.3037109375, -73.92724609375, -71.55078125, -69.17431640625, -66.7978515625, -64.42138671875, -62.044921875, -59.66845703125, -57.2919921875, -54.91552734375, -52.5390625, -50.16259765625, -47.7861328125, -45.40966796875, -43.033203125, -40.65673828125, -38.2802734375, -35.90380859375, -33.52734375, -31.15087890625, -28.7744140625, -26.39794921875, -24.021484375, -21.64501953125, -19.2685546875, -16.89208984375, -14.515625, -12.13916015625, -9.7626953125, -7.38623046875, -5.009765625, -2.63330078125, -0.2568359375, 2.11962890625, 4.49609375, 6.87255859375, 9.2490234375, 11.62548828125, 14.001953125, 16.37841796875, 18.7548828125, 21.13134765625, 23.5078125, 25.88427734375, 28.2607421875, 30.63720703125, 33.013671875, 35.39013671875, 37.7666015625, 40.14306640625, 42.51953125, 44.89599609375, 47.2724609375, 49.64892578125, 52.025390625, 54.40185546875, 56.7783203125, 59.15478515625, 61.53125]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 11.0, 31.0, 74.0, 155.0, 248.0, 251.0, 146.0, 64.0, 16.0, 10.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-162.1055450439453, -158.2458953857422, -154.38623046875, -150.52658081054688, -146.6669158935547, -142.80726623535156, -138.94760131835938, -135.08795166015625, -131.22830200195312, -127.36864471435547, -123.50898742675781, -119.64933776855469, -115.78968048095703, -111.93002319335938, -108.07036590576172, -104.21070861816406, -100.3510513305664, -96.49139404296875, -92.6317367553711, -88.77207946777344, -84.91242980957031, -81.05277252197266, -77.193115234375, -73.33345794677734, -69.47380065917969, -65.61414337158203, -61.75448989868164, -57.894832611083984, -54.035179138183594, -50.17552185058594, -46.31586456298828, -42.456207275390625, -38.5965576171875, -34.736900329589844, -30.877246856689453, -27.017589569091797, -23.157934188842773, -19.29827880859375, -15.438621520996094, -11.57896614074707, -7.719310760498047, -3.8596549034118652, 9.5367431640625e-07, 3.8596572875976562, 7.71931266784668, 11.578968048095703, 15.43862533569336, 19.298280715942383, 23.157936096191406, 27.01759147644043, 30.877246856689453, 34.73690414428711, 38.5965576171875, 42.456214904785156, 46.31587219238281, 50.17552947998047, 54.03518295288086, 57.894840240478516, 61.754493713378906, 65.61415100097656, 69.47380828857422, 73.33346557617188, 77.193115234375, 81.05277252197266, 84.91242980957031]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 11.0, 4.0, 6.0, 9.0, 11.0, 9.0, 23.0, 16.0, 22.0, 25.0, 26.0, 37.0, 32.0, 27.0, 38.0, 39.0, 40.0, 43.0, 30.0, 43.0, 46.0, 47.0, 55.0, 47.0, 43.0, 37.0, 40.0, 31.0, 25.0, 23.0, 12.0, 17.0, 13.0, 11.0, 11.0, 18.0, 12.0, 4.0, 3.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.865867614746094, -52.09005355834961, -50.31423568725586, -48.538421630859375, -46.76260757446289, -44.98678970336914, -43.210975646972656, -41.435157775878906, -39.65934371948242, -37.88352966308594, -36.10771179199219, -34.3318977355957, -32.55608367919922, -30.78026580810547, -29.004451751708984, -27.228635787963867, -25.452821731567383, -23.677005767822266, -21.90119171142578, -20.125375747680664, -18.349559783935547, -16.573745727539062, -14.797929763793945, -13.022113800048828, -11.246298789978027, -9.470483779907227, -7.694667816162109, -5.918852806091309, -4.14303731918335, -2.3672218322753906, -0.5914068222045898, 1.1844091415405273, 2.960224151611328, 4.736039638519287, 6.511855125427246, 8.287670135498047, 10.063486099243164, 11.839301109313965, 13.615116119384766, 15.390932083129883, 17.166748046875, 18.942564010620117, 20.7183780670166, 22.49419403076172, 24.270009994506836, 26.045825958251953, 27.821640014648438, 29.597455978393555, 31.37327003479004, 33.149085998535156, 34.92490005493164, 36.700714111328125, 38.476531982421875, 40.25234603881836, 42.028160095214844, 43.803977966308594, 45.57979202270508, 47.35560607910156, 49.13142395019531, 50.9072380065918, 52.68305206298828, 54.45886993408203, 56.234683990478516, 58.010498046875, 59.78631591796875]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 6.0, 10.0, 6.0, 15.0, 10.0, 15.0, 9.0, 15.0, 20.0, 17.0, 24.0, 27.0, 19.0, 21.0, 30.0, 31.0, 35.0, 31.0, 33.0, 47.0, 40.0, 38.0, 35.0, 42.0, 41.0, 47.0, 33.0, 37.0, 40.0, 38.0, 23.0, 23.0, 29.0, 13.0, 13.0, 18.0, 13.0, 14.0, 9.0, 10.0, 6.0, 5.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.921875, -9.634521484375, -9.34716796875, -9.059814453125, -8.7724609375, -8.485107421875, -8.19775390625, -7.910400390625, -7.623046875, -7.335693359375, -7.04833984375, -6.760986328125, -6.4736328125, -6.186279296875, -5.89892578125, -5.611572265625, -5.32421875, -5.036865234375, -4.74951171875, -4.462158203125, -4.1748046875, -3.887451171875, -3.60009765625, -3.312744140625, -3.025390625, -2.738037109375, -2.45068359375, -2.163330078125, -1.8759765625, -1.588623046875, -1.30126953125, -1.013916015625, -0.7265625, -0.439208984375, -0.15185546875, 0.135498046875, 0.4228515625, 0.710205078125, 0.99755859375, 1.284912109375, 1.572265625, 1.859619140625, 2.14697265625, 2.434326171875, 2.7216796875, 3.009033203125, 3.29638671875, 3.583740234375, 3.87109375, 4.158447265625, 4.44580078125, 4.733154296875, 5.0205078125, 5.307861328125, 5.59521484375, 5.882568359375, 6.169921875, 6.457275390625, 6.74462890625, 7.031982421875, 7.3193359375, 7.606689453125, 7.89404296875, 8.181396484375, 8.46875]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 0.0, 6.0, 9.0, 11.0, 12.0, 26.0, 33.0, 55.0, 80.0, 122.0, 198.0, 299.0, 437.0, 652.0, 980.0, 1390.0, 2107.0, 3334.0, 4769.0, 7394.0, 11065.0, 17093.0, 26534.0, 41011.0, 64601.0, 103356.0, 165459.0, 212187.0, 140626.0, 88323.0, 55046.0, 35440.0, 22600.0, 14491.0, 9617.0, 6478.0, 4192.0, 2797.0, 1917.0, 1267.0, 830.0, 544.0, 359.0, 279.0, 182.0, 122.0, 68.0, 54.0, 49.0, 23.0, 19.0, 10.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2763671875, -1.234283447265625, -1.19219970703125, -1.150115966796875, -1.1080322265625, -1.065948486328125, -1.02386474609375, -0.981781005859375, -0.939697265625, -0.897613525390625, -0.85552978515625, -0.813446044921875, -0.7713623046875, -0.729278564453125, -0.68719482421875, -0.645111083984375, -0.60302734375, -0.560943603515625, -0.51885986328125, -0.476776123046875, -0.4346923828125, -0.392608642578125, -0.35052490234375, -0.308441162109375, -0.266357421875, -0.224273681640625, -0.18218994140625, -0.140106201171875, -0.0980224609375, -0.055938720703125, -0.01385498046875, 0.028228759765625, 0.0703125, 0.112396240234375, 0.15447998046875, 0.196563720703125, 0.2386474609375, 0.280731201171875, 0.32281494140625, 0.364898681640625, 0.406982421875, 0.449066162109375, 0.49114990234375, 0.533233642578125, 0.5753173828125, 0.617401123046875, 0.65948486328125, 0.701568603515625, 0.74365234375, 0.785736083984375, 0.82781982421875, 0.869903564453125, 0.9119873046875, 0.954071044921875, 0.99615478515625, 1.038238525390625, 1.080322265625, 1.122406005859375, 1.16448974609375, 1.206573486328125, 1.2486572265625, 1.290740966796875, 1.33282470703125, 1.374908447265625, 1.4169921875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 9.0, 9.0, 4.0, 10.0, 14.0, 16.0, 22.0, 13.0, 20.0, 19.0, 26.0, 38.0, 31.0, 36.0, 48.0, 45.0, 42.0, 52.0, 40.0, 1079.0, 43.0, 41.0, 32.0, 35.0, 24.0, 36.0, 28.0, 27.0, 25.0, 31.0, 29.0, 17.0, 13.0, 14.0, 8.0, 10.0, 8.0, 11.0, 4.0, 4.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.96484375, -5.765380859375, -5.56591796875, -5.366455078125, -5.1669921875, -4.967529296875, -4.76806640625, -4.568603515625, -4.369140625, -4.169677734375, -3.97021484375, -3.770751953125, -3.5712890625, -3.371826171875, -3.17236328125, -2.972900390625, -2.7734375, -2.573974609375, -2.37451171875, -2.175048828125, -1.9755859375, -1.776123046875, -1.57666015625, -1.377197265625, -1.177734375, -0.978271484375, -0.77880859375, -0.579345703125, -0.3798828125, -0.180419921875, 0.01904296875, 0.218505859375, 0.41796875, 0.617431640625, 0.81689453125, 1.016357421875, 1.2158203125, 1.415283203125, 1.61474609375, 1.814208984375, 2.013671875, 2.213134765625, 2.41259765625, 2.612060546875, 2.8115234375, 3.010986328125, 3.21044921875, 3.409912109375, 3.609375, 3.808837890625, 4.00830078125, 4.207763671875, 4.4072265625, 4.606689453125, 4.80615234375, 5.005615234375, 5.205078125, 5.404541015625, 5.60400390625, 5.803466796875, 6.0029296875, 6.202392578125, 6.40185546875, 6.601318359375, 6.80078125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 8.0, 7.0, 17.0, 23.0, 45.0, 55.0, 79.0, 108.0, 213.0, 284.0, 517.0, 747.0, 1124.0, 1723.0, 2702.0, 4272.0, 6803.0, 10780.0, 16974.0, 26766.0, 42282.0, 68353.0, 108503.0, 171609.0, 1256187.0, 139284.0, 88107.0, 55507.0, 34449.0, 21652.0, 13749.0, 8725.0, 5563.0, 3518.0, 2296.0, 1520.0, 886.0, 588.0, 365.0, 242.0, 196.0, 102.0, 69.0, 56.0, 27.0, 16.0, 15.0, 9.0, 7.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.2880859375, -1.2469024658203125, -1.205718994140625, -1.1645355224609375, -1.12335205078125, -1.0821685791015625, -1.040985107421875, -0.9998016357421875, -0.9586181640625, -0.9174346923828125, -0.876251220703125, -0.8350677490234375, -0.79388427734375, -0.7527008056640625, -0.711517333984375, -0.6703338623046875, -0.629150390625, -0.5879669189453125, -0.546783447265625, -0.5055999755859375, -0.46441650390625, -0.4232330322265625, -0.382049560546875, -0.3408660888671875, -0.2996826171875, -0.2584991455078125, -0.217315673828125, -0.1761322021484375, -0.13494873046875, -0.0937652587890625, -0.052581787109375, -0.0113983154296875, 0.02978515625, 0.0709686279296875, 0.112152099609375, 0.1533355712890625, 0.19451904296875, 0.2357025146484375, 0.276885986328125, 0.3180694580078125, 0.3592529296875, 0.4004364013671875, 0.441619873046875, 0.4828033447265625, 0.52398681640625, 0.5651702880859375, 0.606353759765625, 0.6475372314453125, 0.688720703125, 0.7299041748046875, 0.771087646484375, 0.8122711181640625, 0.85345458984375, 0.8946380615234375, 0.935821533203125, 0.9770050048828125, 1.0181884765625, 1.0593719482421875, 1.100555419921875, 1.1417388916015625, 1.18292236328125, 1.2241058349609375, 1.265289306640625, 1.3064727783203125, 1.34765625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 6.0, 3.0, 2.0, 4.0, 4.0, 9.0, 7.0, 8.0, 10.0, 15.0, 31.0, 29.0, 41.0, 65.0, 65.0, 73.0, 80.0, 85.0, 100.0, 70.0, 67.0, 52.0, 41.0, 38.0, 24.0, 18.0, 9.0, 14.0, 15.0, 7.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0036334991455078125, -0.003529101610183716, -0.003424704074859619, -0.0033203065395355225, -0.0032159090042114258, -0.003111511468887329, -0.0030071139335632324, -0.0029027163982391357, -0.002798318862915039, -0.0026939213275909424, -0.0025895237922668457, -0.002485126256942749, -0.0023807287216186523, -0.0022763311862945557, -0.002171933650970459, -0.0020675361156463623, -0.0019631385803222656, -0.001858741044998169, -0.0017543435096740723, -0.0016499459743499756, -0.001545548439025879, -0.0014411509037017822, -0.0013367533683776855, -0.0012323558330535889, -0.0011279582977294922, -0.0010235607624053955, -0.0009191632270812988, -0.0008147656917572021, -0.0007103681564331055, -0.0006059706211090088, -0.0005015730857849121, -0.00039717555046081543, -0.00029277801513671875, -0.00018838047981262207, -8.398294448852539e-05, 2.041459083557129e-05, 0.00012481212615966797, 0.00022920966148376465, 0.00033360719680786133, 0.000438004732131958, 0.0005424022674560547, 0.0006467998027801514, 0.000751197338104248, 0.0008555948734283447, 0.0009599924087524414, 0.001064389944076538, 0.0011687874794006348, 0.0012731850147247314, 0.0013775825500488281, 0.0014819800853729248, 0.0015863776206970215, 0.0016907751560211182, 0.0017951726913452148, 0.0018995702266693115, 0.002003967761993408, 0.002108365297317505, 0.0022127628326416016, 0.0023171603679656982, 0.002421557903289795, 0.0025259554386138916, 0.0026303529739379883, 0.002734750509262085, 0.0028391480445861816, 0.0029435455799102783, 0.003047943115234375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 5.0, 2.0, 8.0, 14.0, 20.0, 14.0, 23.0, 28.0, 43.0, 54.0, 96.0, 147.0, 252.0, 687.0, 48673.0, 996295.0, 1241.0, 337.0, 190.0, 122.0, 75.0, 56.0, 39.0, 29.0, 20.0, 22.0, 10.0, 4.0, 11.0, 6.0, 6.0, 9.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.059783935546875, -0.057584285736083984, -0.05538463592529297, -0.05318498611450195, -0.05098533630371094, -0.04878568649291992, -0.046586036682128906, -0.04438638687133789, -0.042186737060546875, -0.03998708724975586, -0.037787437438964844, -0.03558778762817383, -0.03338813781738281, -0.031188488006591797, -0.02898883819580078, -0.026789188385009766, -0.02458953857421875, -0.022389888763427734, -0.02019023895263672, -0.017990589141845703, -0.015790939331054688, -0.013591289520263672, -0.011391639709472656, -0.00919198989868164, -0.006992340087890625, -0.004792690277099609, -0.0025930404663085938, -0.0003933906555175781, 0.0018062591552734375, 0.004005908966064453, 0.006205558776855469, 0.008405208587646484, 0.0106048583984375, 0.012804508209228516, 0.015004158020019531, 0.017203807830810547, 0.019403457641601562, 0.021603107452392578, 0.023802757263183594, 0.02600240707397461, 0.028202056884765625, 0.03040170669555664, 0.032601356506347656, 0.03480100631713867, 0.03700065612792969, 0.0392003059387207, 0.04139995574951172, 0.043599605560302734, 0.04579925537109375, 0.047998905181884766, 0.05019855499267578, 0.0523982048034668, 0.05459785461425781, 0.05679750442504883, 0.058997154235839844, 0.06119680404663086, 0.06339645385742188, 0.06559610366821289, 0.0677957534790039, 0.06999540328979492, 0.07219505310058594, 0.07439470291137695, 0.07659435272216797, 0.07879400253295898, 0.08099365234375]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 13.0, 503.0, 488.0, 15.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011714515276253223, -0.0007818718440830708, -0.00039229216054081917, -2.712476998567581e-06, 0.000386867206543684, 0.0007764468900859356, 0.0011660265736281872, 0.0015556062571704388, 0.0019451859407126904, 0.002334765624254942, 0.0027243453077971935, 0.003113924991339445, 0.0035035046748816967, 0.0038930843584239483, 0.0042826640419662, 0.0046722437255084515, 0.005061823409050703, 0.005451403092592955, 0.005840982776135206, 0.006230562459677458, 0.006620142143219709, 0.007009721826761961, 0.007399301510304213, 0.007788881193846464, 0.008178461343050003, 0.008568041026592255, 0.008957620710134506, 0.009347200393676758, 0.00973678007721901, 0.010126359760761261, 0.010515939444303513, 0.010905519127845764, 0.011295098811388016, 0.011684678494930267, 0.012074258178472519, 0.01246383786201477, 0.012853417545557022, 0.013242997229099274, 0.013632576912641525, 0.014022156596183777, 0.014411736279726028, 0.01480131596326828, 0.015190895646810532, 0.015580475330352783, 0.015970055013895035, 0.016359634697437286, 0.016749214380979538, 0.01713879406452179, 0.01752837374806404, 0.017917953431606293, 0.018307533115148544, 0.018697112798690796, 0.019086692482233047, 0.0194762721657753, 0.01986585184931755, 0.020255431532859802, 0.020645011216402054, 0.021034590899944305, 0.021424170583486557, 0.02181375026702881, 0.02220332995057106, 0.022592909634113312, 0.022982489317655563, 0.023372069001197815, 0.023761648684740067]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 3.0, 0.0, 3.0, 5.0, 4.0, 4.0, 6.0, 9.0, 10.0, 4.0, 8.0, 9.0, 9.0, 16.0, 17.0, 24.0, 19.0, 17.0, 30.0, 25.0, 30.0, 25.0, 30.0, 45.0, 45.0, 42.0, 40.0, 42.0, 40.0, 41.0, 38.0, 37.0, 32.0, 43.0, 31.0, 35.0, 28.0, 24.0, 18.0, 13.0, 22.0, 10.0, 13.0, 9.0, 9.0, 12.0, 11.0, 6.0, 5.0, 2.0, 2.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012637972831726074, -0.001223200000822544, -0.0011826027184724808, -0.0011420054361224174, -0.0011014081537723541, -0.0010608108714222908, -0.0010202135890722275, -0.0009796163067221642, -0.0009390190243721008, -0.0008984217420220375, -0.0008578244596719742, -0.0008172271773219109, -0.0007766298949718475, -0.0007360326126217842, -0.0006954353302717209, -0.0006548380479216576, -0.0006142407655715942, -0.0005736434832215309, -0.0005330462008714676, -0.0004924489185214043, -0.00045185163617134094, -0.0004112543538212776, -0.0003706570714712143, -0.00033005978912115097, -0.00028946250677108765, -0.0002488652244210243, -0.000208267942070961, -0.00016767065972089767, -0.00012707337737083435, -8.647609502077103e-05, -4.58788126707077e-05, -5.281530320644379e-06, 3.5315752029418945e-05, 7.591303437948227e-05, 0.0001165103167295456, 0.00015710759907960892, 0.00019770488142967224, 0.00023830216377973557, 0.0002788994461297989, 0.0003194967284798622, 0.00036009401082992554, 0.00040069129317998886, 0.0004412885755300522, 0.0004818858578801155, 0.0005224831402301788, 0.0005630804225802422, 0.0006036777049303055, 0.0006442749872803688, 0.0006848722696304321, 0.0007254695519804955, 0.0007660668343305588, 0.0008066641166806221, 0.0008472613990306854, 0.0008878586813807487, 0.0009284559637308121, 0.0009690532460808754, 0.0010096505284309387, 0.001050247810781002, 0.0010908450931310654, 0.0011314423754811287, 0.001172039657831192, 0.0012126369401812553, 0.0012532342225313187, 0.001293831504881382, 0.0013344287872314453]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 6.0, 10.0, 6.0, 15.0, 10.0, 15.0, 9.0, 15.0, 20.0, 17.0, 24.0, 27.0, 19.0, 21.0, 30.0, 31.0, 35.0, 31.0, 33.0, 47.0, 40.0, 38.0, 35.0, 42.0, 41.0, 47.0, 33.0, 37.0, 40.0, 38.0, 23.0, 23.0, 29.0, 13.0, 13.0, 18.0, 13.0, 14.0, 9.0, 10.0, 6.0, 5.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.921875, -9.634521484375, -9.34716796875, -9.059814453125, -8.7724609375, -8.485107421875, -8.19775390625, -7.910400390625, -7.623046875, -7.335693359375, -7.04833984375, -6.760986328125, -6.4736328125, -6.186279296875, -5.89892578125, -5.611572265625, -5.32421875, -5.036865234375, -4.74951171875, -4.462158203125, -4.1748046875, -3.887451171875, -3.60009765625, -3.312744140625, -3.025390625, -2.738037109375, -2.45068359375, -2.163330078125, -1.8759765625, -1.588623046875, -1.30126953125, -1.013916015625, -0.7265625, -0.439208984375, -0.15185546875, 0.135498046875, 0.4228515625, 0.710205078125, 0.99755859375, 1.284912109375, 1.572265625, 1.859619140625, 2.14697265625, 2.434326171875, 2.7216796875, 3.009033203125, 3.29638671875, 3.583740234375, 3.87109375, 4.158447265625, 4.44580078125, 4.733154296875, 5.0205078125, 5.307861328125, 5.59521484375, 5.882568359375, 6.169921875, 6.457275390625, 6.74462890625, 7.031982421875, 7.3193359375, 7.606689453125, 7.89404296875, 8.181396484375, 8.46875]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 4.0, 2.0, 4.0, 11.0, 8.0, 13.0, 30.0, 28.0, 31.0, 29.0, 48.0, 52.0, 72.0, 89.0, 142.0, 193.0, 249.0, 304.0, 434.0, 636.0, 1263.0, 3553.0, 14187.0, 80078.0, 832710.0, 91245.0, 15553.0, 3854.0, 1238.0, 667.0, 441.0, 350.0, 262.0, 178.0, 162.0, 104.0, 74.0, 52.0, 49.0, 38.0, 23.0, 27.0, 18.0, 10.0, 14.0, 10.0, 4.0, 6.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-25.078125, -24.351806640625, -23.62548828125, -22.899169921875, -22.1728515625, -21.446533203125, -20.72021484375, -19.993896484375, -19.267578125, -18.541259765625, -17.81494140625, -17.088623046875, -16.3623046875, -15.635986328125, -14.90966796875, -14.183349609375, -13.45703125, -12.730712890625, -12.00439453125, -11.278076171875, -10.5517578125, -9.825439453125, -9.09912109375, -8.372802734375, -7.646484375, -6.920166015625, -6.19384765625, -5.467529296875, -4.7412109375, -4.014892578125, -3.28857421875, -2.562255859375, -1.8359375, -1.109619140625, -0.38330078125, 0.343017578125, 1.0693359375, 1.795654296875, 2.52197265625, 3.248291015625, 3.974609375, 4.700927734375, 5.42724609375, 6.153564453125, 6.8798828125, 7.606201171875, 8.33251953125, 9.058837890625, 9.78515625, 10.511474609375, 11.23779296875, 11.964111328125, 12.6904296875, 13.416748046875, 14.14306640625, 14.869384765625, 15.595703125, 16.322021484375, 17.04833984375, 17.774658203125, 18.5009765625, 19.227294921875, 19.95361328125, 20.679931640625, 21.40625]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 4.0, 7.0, 5.0, 8.0, 6.0, 11.0, 10.0, 20.0, 17.0, 20.0, 21.0, 22.0, 34.0, 41.0, 26.0, 41.0, 50.0, 54.0, 61.0, 180.0, 1741.0, 192.0, 71.0, 57.0, 50.0, 39.0, 37.0, 35.0, 32.0, 26.0, 22.0, 22.0, 10.0, 14.0, 20.0, 10.0, 9.0, 8.0, 5.0, 1.0, 5.0, 1.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.875, -28.984375, -28.09375, -27.203125, -26.3125, -25.421875, -24.53125, -23.640625, -22.75, -21.859375, -20.96875, -20.078125, -19.1875, -18.296875, -17.40625, -16.515625, -15.625, -14.734375, -13.84375, -12.953125, -12.0625, -11.171875, -10.28125, -9.390625, -8.5, -7.609375, -6.71875, -5.828125, -4.9375, -4.046875, -3.15625, -2.265625, -1.375, -0.484375, 0.40625, 1.296875, 2.1875, 3.078125, 3.96875, 4.859375, 5.75, 6.640625, 7.53125, 8.421875, 9.3125, 10.203125, 11.09375, 11.984375, 12.875, 13.765625, 14.65625, 15.546875, 16.4375, 17.328125, 18.21875, 19.109375, 20.0, 20.890625, 21.78125, 22.671875, 23.5625, 24.453125, 25.34375, 26.234375, 27.125]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 2.0, 5.0, 6.0, 2.0, 9.0, 13.0, 14.0, 20.0, 16.0, 19.0, 20.0, 32.0, 43.0, 41.0, 46.0, 89.0, 102.0, 192.0, 356.0, 1327.0, 31649.0, 3090045.0, 19573.0, 1078.0, 345.0, 185.0, 116.0, 66.0, 57.0, 36.0, 32.0, 33.0, 30.0, 16.0, 25.0, 12.0, 10.0, 13.0, 4.0, 5.0, 10.0, 5.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.1875, -72.7177734375, -70.248046875, -67.7783203125, -65.30859375, -62.8388671875, -60.369140625, -57.8994140625, -55.4296875, -52.9599609375, -50.490234375, -48.0205078125, -45.55078125, -43.0810546875, -40.611328125, -38.1416015625, -35.671875, -33.2021484375, -30.732421875, -28.2626953125, -25.79296875, -23.3232421875, -20.853515625, -18.3837890625, -15.9140625, -13.4443359375, -10.974609375, -8.5048828125, -6.03515625, -3.5654296875, -1.095703125, 1.3740234375, 3.84375, 6.3134765625, 8.783203125, 11.2529296875, 13.72265625, 16.1923828125, 18.662109375, 21.1318359375, 23.6015625, 26.0712890625, 28.541015625, 31.0107421875, 33.48046875, 35.9501953125, 38.419921875, 40.8896484375, 43.359375, 45.8291015625, 48.298828125, 50.7685546875, 53.23828125, 55.7080078125, 58.177734375, 60.6474609375, 63.1171875, 65.5869140625, 68.056640625, 70.5263671875, 72.99609375, 75.4658203125, 77.935546875, 80.4052734375, 82.875]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 19.0, 121.0, 321.0, 377.0, 129.0, 32.0, 9.0, 4.0, 1.0, 1.0], "bins": [-157.57447814941406, -154.81683349609375, -152.05917358398438, -149.30152893066406, -146.54388427734375, -143.78622436523438, -141.02857971191406, -138.27093505859375, -135.51327514648438, -132.75563049316406, -129.9979705810547, -127.24032592773438, -124.48267364501953, -121.72502136230469, -118.96737670898438, -116.20972442626953, -113.45207977294922, -110.69442749023438, -107.93678283691406, -105.17913055419922, -102.42147827148438, -99.66383361816406, -96.90618133544922, -94.14852905273438, -91.39088439941406, -88.63323211669922, -85.8755874633789, -83.11793518066406, -80.36028289794922, -77.60263061523438, -74.84498596191406, -72.08733367919922, -69.3296890258789, -66.57203674316406, -63.814388275146484, -61.056739807128906, -58.29908752441406, -55.541439056396484, -52.783790588378906, -50.02613830566406, -47.268489837646484, -44.510841369628906, -41.75318908691406, -38.995540618896484, -36.237892150878906, -33.48023986816406, -30.722591400146484, -27.964941024780273, -25.207290649414062, -22.44964027404785, -19.69198989868164, -16.934341430664062, -14.176691055297852, -11.41904067993164, -8.661392211914062, -5.903741836547852, -3.1460914611816406, -0.3884415626525879, 2.369208335876465, 5.126857757568359, 7.88450813293457, 10.642158508300781, 13.39980697631836, 16.15745735168457, 18.91510772705078]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 10.0, 5.0, 17.0, 20.0, 15.0, 14.0, 31.0, 34.0, 29.0, 36.0, 36.0, 46.0, 55.0, 36.0, 42.0, 48.0, 47.0, 58.0, 46.0, 34.0, 47.0, 33.0, 32.0, 34.0, 32.0, 24.0, 22.0, 28.0, 19.0, 14.0, 12.0, 12.0, 6.0, 7.0, 3.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-83.14183807373047, -80.67510986328125, -78.2083740234375, -75.74164581298828, -73.27491760253906, -70.80818176269531, -68.3414535522461, -65.87472534179688, -63.407989501953125, -60.94125747680664, -58.47452926635742, -56.00779724121094, -53.54106521606445, -51.07433319091797, -48.60760498046875, -46.140872955322266, -43.67414474487305, -41.20741271972656, -38.740684509277344, -36.27395248413086, -33.807220458984375, -31.340490341186523, -28.873760223388672, -26.407028198242188, -23.940298080444336, -21.473567962646484, -19.0068359375, -16.54010581970215, -14.07337474822998, -11.606643676757812, -9.139913558959961, -6.673181533813477, -4.206451416015625, -1.7397205829620361, 0.7270102500915527, 3.1937408447265625, 5.6604719161987305, 8.127202987670898, 10.59393310546875, 13.060665130615234, 15.527395248413086, 17.994125366210938, 20.460857391357422, 22.927587509155273, 25.394317626953125, 27.86104965209961, 30.32777976989746, 32.79450988769531, 35.2612419128418, 37.72797393798828, 40.1947021484375, 42.661434173583984, 45.12816619873047, 47.59489440917969, 50.06162643432617, 52.528358459472656, 54.995086669921875, 57.46181869506836, 59.92854690551758, 62.39527893066406, 64.86200714111328, 67.32874298095703, 69.79547119140625, 72.26220703125, 74.72893524169922]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 5.0, 9.0, 8.0, 14.0, 19.0, 14.0, 16.0, 17.0, 18.0, 23.0, 32.0, 25.0, 29.0, 27.0, 34.0, 29.0, 24.0, 51.0, 49.0, 47.0, 53.0, 60.0, 50.0, 41.0, 44.0, 37.0, 26.0, 29.0, 32.0, 20.0, 20.0, 15.0, 10.0, 20.0, 10.0, 10.0, 5.0, 10.0, 8.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.015625, -10.695068359375, -10.37451171875, -10.053955078125, -9.7333984375, -9.412841796875, -9.09228515625, -8.771728515625, -8.451171875, -8.130615234375, -7.81005859375, -7.489501953125, -7.1689453125, -6.848388671875, -6.52783203125, -6.207275390625, -5.88671875, -5.566162109375, -5.24560546875, -4.925048828125, -4.6044921875, -4.283935546875, -3.96337890625, -3.642822265625, -3.322265625, -3.001708984375, -2.68115234375, -2.360595703125, -2.0400390625, -1.719482421875, -1.39892578125, -1.078369140625, -0.7578125, -0.437255859375, -0.11669921875, 0.203857421875, 0.5244140625, 0.844970703125, 1.16552734375, 1.486083984375, 1.806640625, 2.127197265625, 2.44775390625, 2.768310546875, 3.0888671875, 3.409423828125, 3.72998046875, 4.050537109375, 4.37109375, 4.691650390625, 5.01220703125, 5.332763671875, 5.6533203125, 5.973876953125, 6.29443359375, 6.614990234375, 6.935546875, 7.256103515625, 7.57666015625, 7.897216796875, 8.2177734375, 8.538330078125, 8.85888671875, 9.179443359375, 9.5]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 5.0, 5.0, 11.0, 12.0, 7.0, 17.0, 22.0, 19.0, 40.0, 48.0, 75.0, 94.0, 130.0, 176.0, 301.0, 493.0, 1083.0, 2876.0, 9142.0, 44582.0, 702334.0, 2995714.0, 393973.0, 31358.0, 7145.0, 2367.0, 918.0, 470.0, 280.0, 164.0, 114.0, 87.0, 49.0, 51.0, 32.0, 19.0, 19.0, 11.0, 15.0, 8.0, 7.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.296875, -26.50341796875, -25.7099609375, -24.91650390625, -24.123046875, -23.32958984375, -22.5361328125, -21.74267578125, -20.94921875, -20.15576171875, -19.3623046875, -18.56884765625, -17.775390625, -16.98193359375, -16.1884765625, -15.39501953125, -14.6015625, -13.80810546875, -13.0146484375, -12.22119140625, -11.427734375, -10.63427734375, -9.8408203125, -9.04736328125, -8.25390625, -7.46044921875, -6.6669921875, -5.87353515625, -5.080078125, -4.28662109375, -3.4931640625, -2.69970703125, -1.90625, -1.11279296875, -0.3193359375, 0.47412109375, 1.267578125, 2.06103515625, 2.8544921875, 3.64794921875, 4.44140625, 5.23486328125, 6.0283203125, 6.82177734375, 7.615234375, 8.40869140625, 9.2021484375, 9.99560546875, 10.7890625, 11.58251953125, 12.3759765625, 13.16943359375, 13.962890625, 14.75634765625, 15.5498046875, 16.34326171875, 17.13671875, 17.93017578125, 18.7236328125, 19.51708984375, 20.310546875, 21.10400390625, 21.8974609375, 22.69091796875, 23.484375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 9.0, 16.0, 17.0, 34.0, 64.0, 105.0, 204.0, 316.0, 551.0, 787.0, 767.0, 530.0, 259.0, 170.0, 92.0, 62.0, 33.0, 30.0, 19.0, 9.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.015625, -23.154052734375, -22.29248046875, -21.430908203125, -20.5693359375, -19.707763671875, -18.84619140625, -17.984619140625, -17.123046875, -16.261474609375, -15.39990234375, -14.538330078125, -13.6767578125, -12.815185546875, -11.95361328125, -11.092041015625, -10.23046875, -9.368896484375, -8.50732421875, -7.645751953125, -6.7841796875, -5.922607421875, -5.06103515625, -4.199462890625, -3.337890625, -2.476318359375, -1.61474609375, -0.753173828125, 0.1083984375, 0.969970703125, 1.83154296875, 2.693115234375, 3.5546875, 4.416259765625, 5.27783203125, 6.139404296875, 7.0009765625, 7.862548828125, 8.72412109375, 9.585693359375, 10.447265625, 11.308837890625, 12.17041015625, 13.031982421875, 13.8935546875, 14.755126953125, 15.61669921875, 16.478271484375, 17.33984375, 18.201416015625, 19.06298828125, 19.924560546875, 20.7861328125, 21.647705078125, 22.50927734375, 23.370849609375, 24.232421875, 25.093994140625, 25.95556640625, 26.817138671875, 27.6787109375, 28.540283203125, 29.40185546875, 30.263427734375, 31.125]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 7.0, 14.0, 19.0, 19.0, 22.0, 38.0, 38.0, 79.0, 101.0, 133.0, 203.0, 339.0, 734.0, 2516.0, 28444.0, 3683215.0, 467066.0, 8506.0, 1403.0, 553.0, 282.0, 162.0, 114.0, 84.0, 45.0, 39.0, 31.0, 19.0, 20.0, 10.0, 7.0, 8.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-73.75, -71.630859375, -69.51171875, -67.392578125, -65.2734375, -63.154296875, -61.03515625, -58.916015625, -56.796875, -54.677734375, -52.55859375, -50.439453125, -48.3203125, -46.201171875, -44.08203125, -41.962890625, -39.84375, -37.724609375, -35.60546875, -33.486328125, -31.3671875, -29.248046875, -27.12890625, -25.009765625, -22.890625, -20.771484375, -18.65234375, -16.533203125, -14.4140625, -12.294921875, -10.17578125, -8.056640625, -5.9375, -3.818359375, -1.69921875, 0.419921875, 2.5390625, 4.658203125, 6.77734375, 8.896484375, 11.015625, 13.134765625, 15.25390625, 17.373046875, 19.4921875, 21.611328125, 23.73046875, 25.849609375, 27.96875, 30.087890625, 32.20703125, 34.326171875, 36.4453125, 38.564453125, 40.68359375, 42.802734375, 44.921875, 47.041015625, 49.16015625, 51.279296875, 53.3984375, 55.517578125, 57.63671875, 59.755859375, 61.875]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 10.0, 347.0, 639.0, 20.0, 0.0, 0.0, 1.0], "bins": [-955.713134765625, -939.5426025390625, -923.3720703125, -907.2015380859375, -891.031005859375, -874.8604736328125, -858.68994140625, -842.5194091796875, -826.348876953125, -810.1783447265625, -794.0078125, -777.8372802734375, -761.666748046875, -745.4962158203125, -729.32568359375, -713.1551513671875, -696.984619140625, -680.8140869140625, -664.6435546875, -648.4730224609375, -632.302490234375, -616.1319580078125, -599.96142578125, -583.7908935546875, -567.6203002929688, -551.4497680664062, -535.2792358398438, -519.1087036132812, -502.93817138671875, -486.76763916015625, -470.59710693359375, -454.42657470703125, -438.2560119628906, -422.0854797363281, -405.9149475097656, -389.7444152832031, -373.5738830566406, -357.4033508300781, -341.2327880859375, -325.062255859375, -308.8917236328125, -292.72119140625, -276.5506591796875, -260.380126953125, -244.2095947265625, -228.0390625, -211.86851501464844, -195.69798278808594, -179.5274658203125, -163.35693359375, -147.1864013671875, -131.015869140625, -114.84532928466797, -98.67479705810547, -82.50425720214844, -66.33372497558594, -50.163185119628906, -33.992652893066406, -17.82211685180664, -1.651580810546875, 14.518951416015625, 30.689483642578125, 46.860023498535156, 63.030555725097656, 79.20108795166016]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 8.0, 8.0, 16.0, 17.0, 7.0, 13.0, 17.0, 29.0, 22.0, 21.0, 25.0, 31.0, 29.0, 30.0, 41.0, 45.0, 43.0, 40.0, 45.0, 34.0, 42.0, 41.0, 41.0, 34.0, 45.0, 31.0, 32.0, 19.0, 31.0, 19.0, 19.0, 21.0, 18.0, 16.0, 15.0, 12.0, 8.0, 6.0, 6.0, 4.0, 5.0, 5.0, 9.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.43505859375, -46.72454071044922, -45.0140266418457, -43.30350875854492, -41.59299087524414, -39.882476806640625, -38.171958923339844, -36.46144104003906, -34.75092315673828, -33.0404052734375, -31.32988929748535, -29.619373321533203, -27.908855438232422, -26.198339462280273, -24.487823486328125, -22.777305603027344, -21.066791534423828, -19.35627555847168, -17.6457576751709, -15.93524169921875, -14.224724769592285, -12.51420783996582, -10.803691864013672, -9.093174934387207, -7.382658004760742, -5.672141075134277, -3.9616246223449707, -2.251108169555664, -0.5405912399291992, 1.1699256896972656, 2.880441665649414, 4.590958595275879, 6.301475524902344, 8.011992454528809, 9.722509384155273, 11.433025360107422, 13.143542289733887, 14.854059219360352, 16.5645751953125, 18.27509307861328, 19.98560905456543, 21.696125030517578, 23.40664291381836, 25.117158889770508, 26.827674865722656, 28.538192749023438, 30.248708724975586, 31.959224700927734, 33.669742584228516, 35.3802604675293, 37.09077453613281, 38.801292419433594, 40.511810302734375, 42.222328186035156, 43.93284225463867, 45.64336013793945, 47.35387420654297, 49.06439208984375, 50.774906158447266, 52.48542404174805, 54.19594192504883, 55.906455993652344, 57.616973876953125, 59.327491760253906, 61.03800964355469]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 4.0, 2.0, 4.0, 7.0, 9.0, 17.0, 13.0, 16.0, 22.0, 17.0, 25.0, 38.0, 29.0, 36.0, 37.0, 38.0, 43.0, 58.0, 47.0, 44.0, 47.0, 55.0, 51.0, 50.0, 38.0, 38.0, 33.0, 27.0, 26.0, 24.0, 19.0, 27.0, 16.0, 12.0, 9.0, 5.0, 9.0, 2.0, 6.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.171875, -12.781982421875, -12.39208984375, -12.002197265625, -11.6123046875, -11.222412109375, -10.83251953125, -10.442626953125, -10.052734375, -9.662841796875, -9.27294921875, -8.883056640625, -8.4931640625, -8.103271484375, -7.71337890625, -7.323486328125, -6.93359375, -6.543701171875, -6.15380859375, -5.763916015625, -5.3740234375, -4.984130859375, -4.59423828125, -4.204345703125, -3.814453125, -3.424560546875, -3.03466796875, -2.644775390625, -2.2548828125, -1.864990234375, -1.47509765625, -1.085205078125, -0.6953125, -0.305419921875, 0.08447265625, 0.474365234375, 0.8642578125, 1.254150390625, 1.64404296875, 2.033935546875, 2.423828125, 2.813720703125, 3.20361328125, 3.593505859375, 3.9833984375, 4.373291015625, 4.76318359375, 5.153076171875, 5.54296875, 5.932861328125, 6.32275390625, 6.712646484375, 7.1025390625, 7.492431640625, 7.88232421875, 8.272216796875, 8.662109375, 9.052001953125, 9.44189453125, 9.831787109375, 10.2216796875, 10.611572265625, 11.00146484375, 11.391357421875, 11.78125]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 12.0, 16.0, 16.0, 18.0, 34.0, 49.0, 74.0, 114.0, 161.0, 250.0, 294.0, 474.0, 667.0, 883.0, 1306.0, 1933.0, 2638.0, 4054.0, 6149.0, 9040.0, 13995.0, 20733.0, 32112.0, 49117.0, 76438.0, 122291.0, 194058.0, 185837.0, 115655.0, 72732.0, 46896.0, 30442.0, 19860.0, 13222.0, 8711.0, 5776.0, 3817.0, 2733.0, 1792.0, 1255.0, 894.0, 608.0, 397.0, 296.0, 237.0, 138.0, 112.0, 69.0, 50.0, 41.0, 37.0, 20.0, 10.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.501953125, -1.45635986328125, -1.4107666015625, -1.36517333984375, -1.319580078125, -1.27398681640625, -1.2283935546875, -1.18280029296875, -1.13720703125, -1.09161376953125, -1.0460205078125, -1.00042724609375, -0.954833984375, -0.90924072265625, -0.8636474609375, -0.81805419921875, -0.7724609375, -0.72686767578125, -0.6812744140625, -0.63568115234375, -0.590087890625, -0.54449462890625, -0.4989013671875, -0.45330810546875, -0.40771484375, -0.36212158203125, -0.3165283203125, -0.27093505859375, -0.225341796875, -0.17974853515625, -0.1341552734375, -0.08856201171875, -0.04296875, 0.00262451171875, 0.0482177734375, 0.09381103515625, 0.139404296875, 0.18499755859375, 0.2305908203125, 0.27618408203125, 0.32177734375, 0.36737060546875, 0.4129638671875, 0.45855712890625, 0.504150390625, 0.54974365234375, 0.5953369140625, 0.64093017578125, 0.6865234375, 0.73211669921875, 0.7777099609375, 0.82330322265625, 0.868896484375, 0.91448974609375, 0.9600830078125, 1.00567626953125, 1.05126953125, 1.09686279296875, 1.1424560546875, 1.18804931640625, 1.233642578125, 1.27923583984375, 1.3248291015625, 1.37042236328125, 1.416015625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 4.0, 8.0, 5.0, 10.0, 10.0, 11.0, 19.0, 13.0, 18.0, 21.0, 21.0, 26.0, 30.0, 30.0, 31.0, 35.0, 42.0, 36.0, 40.0, 33.0, 1065.0, 38.0, 40.0, 39.0, 41.0, 36.0, 50.0, 28.0, 37.0, 27.0, 24.0, 27.0, 10.0, 17.0, 15.0, 14.0, 10.0, 10.0, 14.0, 16.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.9140625, -5.71533203125, -5.5166015625, -5.31787109375, -5.119140625, -4.92041015625, -4.7216796875, -4.52294921875, -4.32421875, -4.12548828125, -3.9267578125, -3.72802734375, -3.529296875, -3.33056640625, -3.1318359375, -2.93310546875, -2.734375, -2.53564453125, -2.3369140625, -2.13818359375, -1.939453125, -1.74072265625, -1.5419921875, -1.34326171875, -1.14453125, -0.94580078125, -0.7470703125, -0.54833984375, -0.349609375, -0.15087890625, 0.0478515625, 0.24658203125, 0.4453125, 0.64404296875, 0.8427734375, 1.04150390625, 1.240234375, 1.43896484375, 1.6376953125, 1.83642578125, 2.03515625, 2.23388671875, 2.4326171875, 2.63134765625, 2.830078125, 3.02880859375, 3.2275390625, 3.42626953125, 3.625, 3.82373046875, 4.0224609375, 4.22119140625, 4.419921875, 4.61865234375, 4.8173828125, 5.01611328125, 5.21484375, 5.41357421875, 5.6123046875, 5.81103515625, 6.009765625, 6.20849609375, 6.4072265625, 6.60595703125, 6.8046875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 6.0, 3.0, 7.0, 8.0, 15.0, 23.0, 26.0, 51.0, 69.0, 99.0, 160.0, 233.0, 336.0, 477.0, 648.0, 1033.0, 1635.0, 2292.0, 3556.0, 5312.0, 8088.0, 12724.0, 19916.0, 31327.0, 49623.0, 79181.0, 123660.0, 1154455.0, 266695.0, 122198.0, 77339.0, 48870.0, 30911.0, 19822.0, 12677.0, 7944.0, 5230.0, 3567.0, 2269.0, 1517.0, 1024.0, 688.0, 446.0, 324.0, 203.0, 152.0, 86.0, 75.0, 52.0, 32.0, 25.0, 10.0, 14.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.3095703125, -1.267303466796875, -1.22503662109375, -1.182769775390625, -1.1405029296875, -1.098236083984375, -1.05596923828125, -1.013702392578125, -0.971435546875, -0.929168701171875, -0.88690185546875, -0.844635009765625, -0.8023681640625, -0.760101318359375, -0.71783447265625, -0.675567626953125, -0.63330078125, -0.591033935546875, -0.54876708984375, -0.506500244140625, -0.4642333984375, -0.421966552734375, -0.37969970703125, -0.337432861328125, -0.295166015625, -0.252899169921875, -0.21063232421875, -0.168365478515625, -0.1260986328125, -0.083831787109375, -0.04156494140625, 0.000701904296875, 0.04296875, 0.085235595703125, 0.12750244140625, 0.169769287109375, 0.2120361328125, 0.254302978515625, 0.29656982421875, 0.338836669921875, 0.381103515625, 0.423370361328125, 0.46563720703125, 0.507904052734375, 0.5501708984375, 0.592437744140625, 0.63470458984375, 0.676971435546875, 0.71923828125, 0.761505126953125, 0.80377197265625, 0.846038818359375, 0.8883056640625, 0.930572509765625, 0.97283935546875, 1.015106201171875, 1.057373046875, 1.099639892578125, 1.14190673828125, 1.184173583984375, 1.2264404296875, 1.268707275390625, 1.31097412109375, 1.353240966796875, 1.3955078125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 3.0, 5.0, 6.0, 9.0, 9.0, 10.0, 30.0, 25.0, 27.0, 35.0, 27.0, 42.0, 38.0, 60.0, 63.0, 66.0, 72.0, 70.0, 57.0, 58.0, 53.0, 35.0, 33.0, 28.0, 29.0, 18.0, 24.0, 12.0, 14.0, 8.0, 9.0, 6.0, 2.0, 5.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.00247955322265625, -0.0024029910564422607, -0.0023264288902282715, -0.0022498667240142822, -0.002173304557800293, -0.0020967423915863037, -0.0020201802253723145, -0.0019436180591583252, -0.001867055892944336, -0.0017904937267303467, -0.0017139315605163574, -0.0016373693943023682, -0.001560807228088379, -0.0014842450618743896, -0.0014076828956604004, -0.0013311207294464111, -0.0012545585632324219, -0.0011779963970184326, -0.0011014342308044434, -0.001024872064590454, -0.0009483098983764648, -0.0008717477321624756, -0.0007951855659484863, -0.0007186233997344971, -0.0006420612335205078, -0.0005654990673065186, -0.0004889369010925293, -0.00041237473487854004, -0.0003358125686645508, -0.0002592504024505615, -0.00018268823623657227, -0.00010612607002258301, -2.956390380859375e-05, 4.699826240539551e-05, 0.00012356042861938477, 0.00020012259483337402, 0.0002766847610473633, 0.00035324692726135254, 0.0004298090934753418, 0.0005063712596893311, 0.0005829334259033203, 0.0006594955921173096, 0.0007360577583312988, 0.0008126199245452881, 0.0008891820907592773, 0.0009657442569732666, 0.0010423064231872559, 0.0011188685894012451, 0.0011954307556152344, 0.0012719929218292236, 0.0013485550880432129, 0.0014251172542572021, 0.0015016794204711914, 0.0015782415866851807, 0.00165480375289917, 0.0017313659191131592, 0.0018079280853271484, 0.0018844902515411377, 0.001961052417755127, 0.002037614583969116, 0.0021141767501831055, 0.0021907389163970947, 0.002267301082611084, 0.0023438632488250732, 0.0024204254150390625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 1.0, 4.0, 3.0, 8.0, 8.0, 10.0, 14.0, 14.0, 22.0, 21.0, 28.0, 42.0, 54.0, 71.0, 102.0, 158.0, 253.0, 531.0, 1812.0, 982875.0, 60642.0, 856.0, 380.0, 181.0, 128.0, 77.0, 63.0, 54.0, 32.0, 25.0, 27.0, 10.0, 10.0, 11.0, 10.0, 5.0, 7.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.060272216796875, -0.05853986740112305, -0.056807518005371094, -0.05507516860961914, -0.05334281921386719, -0.051610469818115234, -0.04987812042236328, -0.04814577102661133, -0.046413421630859375, -0.04468107223510742, -0.04294872283935547, -0.041216373443603516, -0.03948402404785156, -0.03775167465209961, -0.036019325256347656, -0.0342869758605957, -0.03255462646484375, -0.030822277069091797, -0.029089927673339844, -0.02735757827758789, -0.025625228881835938, -0.023892879486083984, -0.02216053009033203, -0.020428180694580078, -0.018695831298828125, -0.016963481903076172, -0.015231132507324219, -0.013498783111572266, -0.011766433715820312, -0.01003408432006836, -0.008301734924316406, -0.006569385528564453, -0.0048370361328125, -0.003104686737060547, -0.0013723373413085938, 0.0003600120544433594, 0.0020923614501953125, 0.0038247108459472656, 0.005557060241699219, 0.007289409637451172, 0.009021759033203125, 0.010754108428955078, 0.012486457824707031, 0.014218807220458984, 0.015951156616210938, 0.01768350601196289, 0.019415855407714844, 0.021148204803466797, 0.02288055419921875, 0.024612903594970703, 0.026345252990722656, 0.02807760238647461, 0.029809951782226562, 0.031542301177978516, 0.03327465057373047, 0.03500699996948242, 0.036739349365234375, 0.03847169876098633, 0.04020404815673828, 0.041936397552490234, 0.04366874694824219, 0.04540109634399414, 0.047133445739746094, 0.04886579513549805, 0.05059814453125]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 38.0, 244.0, 482.0, 209.0, 38.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0028597526252269745, -0.002674409653991461, -0.002489066682755947, -0.0023037237115204334, -0.0021183807402849197, -0.0019330378854647279, -0.001747695030644536, -0.0015623520594090223, -0.0013770090881735086, -0.001191666116937995, -0.0010063231457024813, -0.0008209802908822894, -0.0006356373196467757, -0.00045029434841126204, -0.0002649514935910702, -7.960852235555649e-05, 0.0001057344488799572, 0.00029107739101164043, 0.00047642033314332366, 0.0006617632461711764, 0.0008471062174066901, 0.0010324491886422038, 0.0012177920434623957, 0.0014031350146979094, 0.001588477985933423, 0.0017738209571689367, 0.0019591639284044504, 0.0021445066668093204, 0.002329849638044834, 0.002515192609280348, 0.0027005355805158615, 0.002885878551751375, 0.003071221522986889, 0.0032565644942224026, 0.0034419074654579163, 0.00362725043669343, 0.0038125934079289436, 0.003997936379164457, 0.004183279350399971, 0.004368621855974197, 0.004553965292870998, 0.004739308264106512, 0.004924651235342026, 0.0051099942065775394, 0.005295337177813053, 0.005480680149048567, 0.0056660231202840805, 0.005851365625858307, 0.006036708597093821, 0.006222051568329334, 0.006407394539564848, 0.006592737510800362, 0.006778080482035875, 0.006963423453271389, 0.007148765958845615, 0.007334109395742416, 0.007519451901316643, 0.0077047948725521564, 0.00789013784378767, 0.008075480349361897, 0.008260823786258698, 0.008446166291832924, 0.008631509728729725, 0.008816852234303951, 0.009002195671200752]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 3.0, 7.0, 6.0, 8.0, 8.0, 13.0, 13.0, 7.0, 16.0, 17.0, 24.0, 24.0, 30.0, 32.0, 22.0, 35.0, 42.0, 33.0, 28.0, 34.0, 48.0, 38.0, 48.0, 41.0, 33.0, 39.0, 37.0, 37.0, 32.0, 32.0, 25.0, 24.0, 20.0, 22.0, 24.0, 11.0, 15.0, 16.0, 15.0, 8.0, 4.0, 5.0, 3.0, 5.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.0012595653533935547, -0.0012222090736031532, -0.0011848527938127518, -0.0011474965140223503, -0.0011101402342319489, -0.0010727839544415474, -0.001035427674651146, -0.0009980713948607445, -0.000960715115070343, -0.0009233588352799416, -0.0008860025554895401, -0.0008486462756991386, -0.0008112899959087372, -0.0007739337161183357, -0.0007365774363279343, -0.0006992211565375328, -0.0006618648767471313, -0.0006245085969567299, -0.0005871523171663284, -0.000549796037375927, -0.0005124397575855255, -0.00047508347779512405, -0.0004377271980047226, -0.00040037091821432114, -0.0003630146384239197, -0.0003256583586335182, -0.00028830207884311676, -0.0002509457990527153, -0.00021358951926231384, -0.00017623323947191238, -0.00013887695968151093, -0.00010152067989110947, -6.416440010070801e-05, -2.680812031030655e-05, 1.054815948009491e-05, 4.790443927049637e-05, 8.526071906089783e-05, 0.00012261699885129929, 0.00015997327864170074, 0.0001973295584321022, 0.00023468583822250366, 0.0002720421180129051, 0.0003093983978033066, 0.00034675467759370804, 0.0003841109573841095, 0.00042146723717451096, 0.0004588235169649124, 0.0004961797967553139, 0.0005335360765457153, 0.0005708923563361168, 0.0006082486361265182, 0.0006456049159169197, 0.0006829611957073212, 0.0007203174754977226, 0.0007576737552881241, 0.0007950300350785255, 0.000832386314868927, 0.0008697425946593285, 0.0009070988744497299, 0.0009444551542401314, 0.0009818114340305328, 0.0010191677138209343, 0.0010565239936113358, 0.0010938802734017372, 0.0011312365531921387]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 4.0, 2.0, 4.0, 7.0, 9.0, 17.0, 13.0, 16.0, 22.0, 17.0, 25.0, 38.0, 29.0, 36.0, 37.0, 38.0, 43.0, 58.0, 47.0, 44.0, 47.0, 55.0, 51.0, 50.0, 38.0, 38.0, 33.0, 27.0, 26.0, 24.0, 19.0, 27.0, 16.0, 12.0, 9.0, 5.0, 9.0, 2.0, 6.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.171875, -12.781982421875, -12.39208984375, -12.002197265625, -11.6123046875, -11.222412109375, -10.83251953125, -10.442626953125, -10.052734375, -9.662841796875, -9.27294921875, -8.883056640625, -8.4931640625, -8.103271484375, -7.71337890625, -7.323486328125, -6.93359375, -6.543701171875, -6.15380859375, -5.763916015625, -5.3740234375, -4.984130859375, -4.59423828125, -4.204345703125, -3.814453125, -3.424560546875, -3.03466796875, -2.644775390625, -2.2548828125, -1.864990234375, -1.47509765625, -1.085205078125, -0.6953125, -0.305419921875, 0.08447265625, 0.474365234375, 0.8642578125, 1.254150390625, 1.64404296875, 2.033935546875, 2.423828125, 2.813720703125, 3.20361328125, 3.593505859375, 3.9833984375, 4.373291015625, 4.76318359375, 5.153076171875, 5.54296875, 5.932861328125, 6.32275390625, 6.712646484375, 7.1025390625, 7.492431640625, 7.88232421875, 8.272216796875, 8.662109375, 9.052001953125, 9.44189453125, 9.831787109375, 10.2216796875, 10.611572265625, 11.00146484375, 11.391357421875, 11.78125]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 3.0, 5.0, 10.0, 16.0, 18.0, 23.0, 29.0, 52.0, 61.0, 75.0, 123.0, 154.0, 324.0, 636.0, 1221.0, 3184.0, 8592.0, 25904.0, 86328.0, 400235.0, 395655.0, 85708.0, 25699.0, 8614.0, 3117.0, 1293.0, 583.0, 299.0, 173.0, 128.0, 78.0, 53.0, 41.0, 38.0, 17.0, 23.0, 6.0, 14.0, 6.0, 4.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-17.09375, -16.5909423828125, -16.088134765625, -15.5853271484375, -15.08251953125, -14.5797119140625, -14.076904296875, -13.5740966796875, -13.0712890625, -12.5684814453125, -12.065673828125, -11.5628662109375, -11.06005859375, -10.5572509765625, -10.054443359375, -9.5516357421875, -9.048828125, -8.5460205078125, -8.043212890625, -7.5404052734375, -7.03759765625, -6.5347900390625, -6.031982421875, -5.5291748046875, -5.0263671875, -4.5235595703125, -4.020751953125, -3.5179443359375, -3.01513671875, -2.5123291015625, -2.009521484375, -1.5067138671875, -1.00390625, -0.5010986328125, 0.001708984375, 0.5045166015625, 1.00732421875, 1.5101318359375, 2.012939453125, 2.5157470703125, 3.0185546875, 3.5213623046875, 4.024169921875, 4.5269775390625, 5.02978515625, 5.5325927734375, 6.035400390625, 6.5382080078125, 7.041015625, 7.5438232421875, 8.046630859375, 8.5494384765625, 9.05224609375, 9.5550537109375, 10.057861328125, 10.5606689453125, 11.0634765625, 11.5662841796875, 12.069091796875, 12.5718994140625, 13.07470703125, 13.5775146484375, 14.080322265625, 14.5831298828125, 15.0859375]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 1.0, 4.0, 6.0, 10.0, 5.0, 2.0, 9.0, 10.0, 8.0, 8.0, 15.0, 18.0, 17.0, 19.0, 18.0, 22.0, 23.0, 33.0, 28.0, 32.0, 49.0, 47.0, 53.0, 92.0, 178.0, 1580.0, 244.0, 103.0, 69.0, 42.0, 36.0, 28.0, 20.0, 26.0, 24.0, 24.0, 28.0, 16.0, 22.0, 15.0, 18.0, 6.0, 7.0, 10.0, 13.0, 6.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.59375, -24.7294921875, -23.865234375, -23.0009765625, -22.13671875, -21.2724609375, -20.408203125, -19.5439453125, -18.6796875, -17.8154296875, -16.951171875, -16.0869140625, -15.22265625, -14.3583984375, -13.494140625, -12.6298828125, -11.765625, -10.9013671875, -10.037109375, -9.1728515625, -8.30859375, -7.4443359375, -6.580078125, -5.7158203125, -4.8515625, -3.9873046875, -3.123046875, -2.2587890625, -1.39453125, -0.5302734375, 0.333984375, 1.1982421875, 2.0625, 2.9267578125, 3.791015625, 4.6552734375, 5.51953125, 6.3837890625, 7.248046875, 8.1123046875, 8.9765625, 9.8408203125, 10.705078125, 11.5693359375, 12.43359375, 13.2978515625, 14.162109375, 15.0263671875, 15.890625, 16.7548828125, 17.619140625, 18.4833984375, 19.34765625, 20.2119140625, 21.076171875, 21.9404296875, 22.8046875, 23.6689453125, 24.533203125, 25.3974609375, 26.26171875, 27.1259765625, 27.990234375, 28.8544921875, 29.71875]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 4.0, 6.0, 7.0, 9.0, 2.0, 11.0, 18.0, 30.0, 20.0, 36.0, 34.0, 73.0, 64.0, 112.0, 146.0, 198.0, 320.0, 628.0, 2268.0, 26725.0, 2303653.0, 790290.0, 17700.0, 1741.0, 544.0, 283.0, 197.0, 137.0, 107.0, 86.0, 54.0, 43.0, 30.0, 28.0, 19.0, 13.0, 22.0, 10.0, 9.0, 4.0, 5.0, 3.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.0, -40.5966796875, -39.193359375, -37.7900390625, -36.38671875, -34.9833984375, -33.580078125, -32.1767578125, -30.7734375, -29.3701171875, -27.966796875, -26.5634765625, -25.16015625, -23.7568359375, -22.353515625, -20.9501953125, -19.546875, -18.1435546875, -16.740234375, -15.3369140625, -13.93359375, -12.5302734375, -11.126953125, -9.7236328125, -8.3203125, -6.9169921875, -5.513671875, -4.1103515625, -2.70703125, -1.3037109375, 0.099609375, 1.5029296875, 2.90625, 4.3095703125, 5.712890625, 7.1162109375, 8.51953125, 9.9228515625, 11.326171875, 12.7294921875, 14.1328125, 15.5361328125, 16.939453125, 18.3427734375, 19.74609375, 21.1494140625, 22.552734375, 23.9560546875, 25.359375, 26.7626953125, 28.166015625, 29.5693359375, 30.97265625, 32.3759765625, 33.779296875, 35.1826171875, 36.5859375, 37.9892578125, 39.392578125, 40.7958984375, 42.19921875, 43.6025390625, 45.005859375, 46.4091796875, 47.8125]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 212.0, 785.0, 19.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-571.7947387695312, -561.2528076171875, -550.7108154296875, -540.1688842773438, -529.6268920898438, -519.0849609375, -508.54296875, -498.00103759765625, -487.4590759277344, -476.9171142578125, -466.3751525878906, -455.83319091796875, -445.2912292480469, -434.749267578125, -424.20733642578125, -413.6653747558594, -403.1234130859375, -392.5814514160156, -382.03948974609375, -371.4975280761719, -360.95556640625, -350.41363525390625, -339.87164306640625, -329.3297119140625, -318.7877197265625, -308.2457580566406, -297.70379638671875, -287.1618347167969, -276.619873046875, -266.07794189453125, -255.5359649658203, -244.9940185546875, -234.45208740234375, -223.91012573242188, -213.3681640625, -202.82620239257812, -192.2842559814453, -181.74229431152344, -171.20033264160156, -160.65838623046875, -150.1164093017578, -139.57444763183594, -129.03248596191406, -118.49053192138672, -107.94857788085938, -97.4066162109375, -86.86465454101562, -76.32270050048828, -65.7807388305664, -55.2387809753418, -44.69682312011719, -34.15486145019531, -23.612903594970703, -13.070945739746094, -2.5289840698242188, 8.012969970703125, 18.554931640625, 29.09688949584961, 39.63884735107422, 50.180809020996094, 60.7227668762207, 71.26472473144531, 81.80668640136719, 92.34864044189453, 102.8906021118164]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 5.0, 8.0, 12.0, 7.0, 18.0, 10.0, 12.0, 14.0, 17.0, 19.0, 18.0, 29.0, 27.0, 21.0, 39.0, 29.0, 52.0, 28.0, 45.0, 49.0, 42.0, 41.0, 34.0, 36.0, 40.0, 43.0, 39.0, 26.0, 27.0, 31.0, 24.0, 31.0, 17.0, 15.0, 14.0, 14.0, 16.0, 12.0, 10.0, 5.0, 4.0, 4.0, 3.0, 2.0, 8.0, 2.0, 3.0, 0.0, 2.0, 3.0, 0.0, 2.0], "bins": [-67.27494812011719, -65.1795883178711, -63.084232330322266, -60.98887634277344, -58.89352035522461, -56.79816436767578, -54.70280456542969, -52.60744857788086, -50.51209259033203, -48.4167366027832, -46.32137680053711, -44.22602081298828, -42.13066482543945, -40.035308837890625, -37.93994903564453, -35.8445930480957, -33.74923324584961, -31.65387535095215, -29.55851936340332, -27.46316146850586, -25.36780548095703, -23.27244758605957, -21.17708969116211, -19.08173370361328, -16.98637580871582, -14.891018867492676, -12.795661926269531, -10.70030403137207, -8.604947090148926, -6.509590148925781, -4.41423225402832, -2.318875312805176, -0.22351837158203125, 1.8718388080596924, 3.967195987701416, 6.062553405761719, 8.157910346984863, 10.253267288208008, 12.348625183105469, 14.443982124328613, 16.539339065551758, 18.63469696044922, 20.730052947998047, 22.825410842895508, 24.92076873779297, 27.016124725341797, 29.111482620239258, 31.20684051513672, 33.30219650268555, 35.397552490234375, 37.49291229248047, 39.5882682800293, 41.683624267578125, 43.77898406982422, 45.87434005737305, 47.969696044921875, 50.06505584716797, 52.1604118347168, 54.25577163696289, 56.35112762451172, 58.44648361206055, 60.541839599609375, 62.63719940185547, 64.73255920410156, 66.82791137695312]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 5.0, 4.0, 12.0, 12.0, 11.0, 21.0, 8.0, 34.0, 18.0, 20.0, 30.0, 41.0, 38.0, 35.0, 46.0, 48.0, 39.0, 36.0, 59.0, 50.0, 49.0, 54.0, 47.0, 34.0, 30.0, 34.0, 16.0, 28.0, 28.0, 24.0, 23.0, 9.0, 13.0, 13.0, 5.0, 10.0, 5.0, 4.0, 1.0, 1.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-13.3046875, -12.91943359375, -12.5341796875, -12.14892578125, -11.763671875, -11.37841796875, -10.9931640625, -10.60791015625, -10.22265625, -9.83740234375, -9.4521484375, -9.06689453125, -8.681640625, -8.29638671875, -7.9111328125, -7.52587890625, -7.140625, -6.75537109375, -6.3701171875, -5.98486328125, -5.599609375, -5.21435546875, -4.8291015625, -4.44384765625, -4.05859375, -3.67333984375, -3.2880859375, -2.90283203125, -2.517578125, -2.13232421875, -1.7470703125, -1.36181640625, -0.9765625, -0.59130859375, -0.2060546875, 0.17919921875, 0.564453125, 0.94970703125, 1.3349609375, 1.72021484375, 2.10546875, 2.49072265625, 2.8759765625, 3.26123046875, 3.646484375, 4.03173828125, 4.4169921875, 4.80224609375, 5.1875, 5.57275390625, 5.9580078125, 6.34326171875, 6.728515625, 7.11376953125, 7.4990234375, 7.88427734375, 8.26953125, 8.65478515625, 9.0400390625, 9.42529296875, 9.810546875, 10.19580078125, 10.5810546875, 10.96630859375, 11.3515625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 7.0, 4.0, 10.0, 9.0, 15.0, 12.0, 24.0, 17.0, 21.0, 33.0, 50.0, 72.0, 132.0, 350.0, 1223.0, 4552.0, 26972.0, 791875.0, 3219900.0, 134142.0, 11212.0, 2456.0, 612.0, 245.0, 108.0, 63.0, 37.0, 31.0, 20.0, 15.0, 9.0, 13.0, 13.0, 8.0, 6.0, 4.0, 5.0, 3.0, 3.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.96875, -33.81396484375, -32.6591796875, -31.50439453125, -30.349609375, -29.19482421875, -28.0400390625, -26.88525390625, -25.73046875, -24.57568359375, -23.4208984375, -22.26611328125, -21.111328125, -19.95654296875, -18.8017578125, -17.64697265625, -16.4921875, -15.33740234375, -14.1826171875, -13.02783203125, -11.873046875, -10.71826171875, -9.5634765625, -8.40869140625, -7.25390625, -6.09912109375, -4.9443359375, -3.78955078125, -2.634765625, -1.47998046875, -0.3251953125, 0.82958984375, 1.984375, 3.13916015625, 4.2939453125, 5.44873046875, 6.603515625, 7.75830078125, 8.9130859375, 10.06787109375, 11.22265625, 12.37744140625, 13.5322265625, 14.68701171875, 15.841796875, 16.99658203125, 18.1513671875, 19.30615234375, 20.4609375, 21.61572265625, 22.7705078125, 23.92529296875, 25.080078125, 26.23486328125, 27.3896484375, 28.54443359375, 29.69921875, 30.85400390625, 32.0087890625, 33.16357421875, 34.318359375, 35.47314453125, 36.6279296875, 37.78271484375, 38.9375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 8.0, 9.0, 18.0, 9.0, 15.0, 17.0, 26.0, 37.0, 45.0, 82.0, 101.0, 152.0, 233.0, 394.0, 591.0, 609.0, 611.0, 408.0, 253.0, 144.0, 97.0, 69.0, 42.0, 36.0, 21.0, 16.0, 10.0, 8.0, 7.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.71875, -24.09326171875, -23.4677734375, -22.84228515625, -22.216796875, -21.59130859375, -20.9658203125, -20.34033203125, -19.71484375, -19.08935546875, -18.4638671875, -17.83837890625, -17.212890625, -16.58740234375, -15.9619140625, -15.33642578125, -14.7109375, -14.08544921875, -13.4599609375, -12.83447265625, -12.208984375, -11.58349609375, -10.9580078125, -10.33251953125, -9.70703125, -9.08154296875, -8.4560546875, -7.83056640625, -7.205078125, -6.57958984375, -5.9541015625, -5.32861328125, -4.703125, -4.07763671875, -3.4521484375, -2.82666015625, -2.201171875, -1.57568359375, -0.9501953125, -0.32470703125, 0.30078125, 0.92626953125, 1.5517578125, 2.17724609375, 2.802734375, 3.42822265625, 4.0537109375, 4.67919921875, 5.3046875, 5.93017578125, 6.5556640625, 7.18115234375, 7.806640625, 8.43212890625, 9.0576171875, 9.68310546875, 10.30859375, 10.93408203125, 11.5595703125, 12.18505859375, 12.810546875, 13.43603515625, 14.0615234375, 14.68701171875, 15.3125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 6.0, 2.0, 1.0, 1.0, 11.0, 6.0, 9.0, 8.0, 14.0, 17.0, 23.0, 35.0, 54.0, 111.0, 151.0, 279.0, 588.0, 1420.0, 5363.0, 29450.0, 318200.0, 3553644.0, 252934.0, 24811.0, 4632.0, 1308.0, 481.0, 275.0, 153.0, 68.0, 66.0, 44.0, 33.0, 22.0, 16.0, 8.0, 11.0, 14.0, 7.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-34.84375, -33.736328125, -32.62890625, -31.521484375, -30.4140625, -29.306640625, -28.19921875, -27.091796875, -25.984375, -24.876953125, -23.76953125, -22.662109375, -21.5546875, -20.447265625, -19.33984375, -18.232421875, -17.125, -16.017578125, -14.91015625, -13.802734375, -12.6953125, -11.587890625, -10.48046875, -9.373046875, -8.265625, -7.158203125, -6.05078125, -4.943359375, -3.8359375, -2.728515625, -1.62109375, -0.513671875, 0.59375, 1.701171875, 2.80859375, 3.916015625, 5.0234375, 6.130859375, 7.23828125, 8.345703125, 9.453125, 10.560546875, 11.66796875, 12.775390625, 13.8828125, 14.990234375, 16.09765625, 17.205078125, 18.3125, 19.419921875, 20.52734375, 21.634765625, 22.7421875, 23.849609375, 24.95703125, 26.064453125, 27.171875, 28.279296875, 29.38671875, 30.494140625, 31.6015625, 32.708984375, 33.81640625, 34.923828125, 36.03125]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 8.0, 22.0, 50.0, 130.0, 226.0, 231.0, 179.0, 103.0, 28.0, 19.0, 8.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-173.52529907226562, -170.01736450195312, -166.50941467285156, -163.00148010253906, -159.4935302734375, -155.985595703125, -152.47764587402344, -148.96971130371094, -145.46176147460938, -141.95382690429688, -138.4458770751953, -134.9379425048828, -131.42999267578125, -127.92205047607422, -124.41410827636719, -120.90617370605469, -117.39823150634766, -113.89028930664062, -110.3823471069336, -106.87440490722656, -103.36646270751953, -99.8585205078125, -96.3505859375, -92.84263610839844, -89.33470153808594, -85.8267593383789, -82.31881713867188, -78.81087493896484, -75.30293273925781, -71.79499053955078, -68.28704833984375, -64.77911376953125, -61.27117156982422, -57.76322937011719, -54.255287170410156, -50.747344970703125, -47.239402770996094, -43.73146057128906, -40.2235221862793, -36.715579986572266, -33.207637786865234, -29.699695587158203, -26.191753387451172, -22.683813095092773, -19.175870895385742, -15.667928695678711, -12.159988403320312, -8.652046203613281, -5.14410400390625, -1.636162281036377, 1.871779441833496, 5.379720687866211, 8.887662887573242, 12.395605087280273, 15.903545379638672, 19.411487579345703, 22.919429779052734, 26.427371978759766, 29.935314178466797, 33.44325256347656, 36.951194763183594, 40.459136962890625, 43.967079162597656, 47.47502136230469, 50.98296356201172]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 2.0, 8.0, 4.0, 7.0, 14.0, 12.0, 13.0, 27.0, 26.0, 22.0, 32.0, 30.0, 36.0, 35.0, 43.0, 50.0, 43.0, 47.0, 41.0, 39.0, 44.0, 56.0, 40.0, 40.0, 40.0, 28.0, 32.0, 32.0, 26.0, 21.0, 16.0, 15.0, 17.0, 14.0, 12.0, 10.0, 11.0, 7.0, 4.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-57.31184005737305, -55.43180847167969, -53.551780700683594, -51.671749114990234, -49.79172134399414, -47.91168975830078, -46.03166198730469, -44.15163040161133, -42.27159881591797, -40.39156723022461, -38.511539459228516, -36.631507873535156, -34.75148010253906, -32.8714485168457, -30.991418838500977, -29.11138916015625, -27.231361389160156, -25.35133171081543, -23.471302032470703, -21.591270446777344, -19.71124267578125, -17.83121109008789, -15.951181411743164, -14.071151733398438, -12.191122055053711, -10.311092376708984, -8.431062698364258, -6.551032066345215, -4.671002388000488, -2.7909727096557617, -0.9109420776367188, 0.9690876007080078, 2.8491134643554688, 4.729143142700195, 6.60917329788208, 8.489203453063965, 10.369233131408691, 12.249262809753418, 14.129293441772461, 16.009323120117188, 17.889352798461914, 19.76938247680664, 21.649412155151367, 23.529441833496094, 25.409473419189453, 27.289501190185547, 29.169532775878906, 31.049562454223633, 32.92959213256836, 34.80962371826172, 36.68965148925781, 38.56968307495117, 40.449710845947266, 42.329742431640625, 44.20977020263672, 46.08980178833008, 47.96983337402344, 49.8498649597168, 51.72989273071289, 53.60992431640625, 55.489952087402344, 57.3699836730957, 59.25001525878906, 61.130043029785156, 63.01007080078125]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 3.0, 1.0, 3.0, 11.0, 4.0, 10.0, 15.0, 13.0, 12.0, 19.0, 28.0, 21.0, 21.0, 33.0, 22.0, 29.0, 32.0, 35.0, 48.0, 44.0, 41.0, 38.0, 48.0, 44.0, 41.0, 44.0, 39.0, 40.0, 28.0, 25.0, 22.0, 29.0, 24.0, 24.0, 19.0, 16.0, 16.0, 12.0, 4.0, 17.0, 6.0, 7.0, 7.0, 2.0, 3.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-11.2109375, -10.8543701171875, -10.497802734375, -10.1412353515625, -9.78466796875, -9.4281005859375, -9.071533203125, -8.7149658203125, -8.3583984375, -8.0018310546875, -7.645263671875, -7.2886962890625, -6.93212890625, -6.5755615234375, -6.218994140625, -5.8624267578125, -5.505859375, -5.1492919921875, -4.792724609375, -4.4361572265625, -4.07958984375, -3.7230224609375, -3.366455078125, -3.0098876953125, -2.6533203125, -2.2967529296875, -1.940185546875, -1.5836181640625, -1.22705078125, -0.8704833984375, -0.513916015625, -0.1573486328125, 0.19921875, 0.5557861328125, 0.912353515625, 1.2689208984375, 1.62548828125, 1.9820556640625, 2.338623046875, 2.6951904296875, 3.0517578125, 3.4083251953125, 3.764892578125, 4.1214599609375, 4.47802734375, 4.8345947265625, 5.191162109375, 5.5477294921875, 5.904296875, 6.2608642578125, 6.617431640625, 6.9739990234375, 7.33056640625, 7.6871337890625, 8.043701171875, 8.4002685546875, 8.7568359375, 9.1134033203125, 9.469970703125, 9.8265380859375, 10.18310546875, 10.5396728515625, 10.896240234375, 11.2528076171875, 11.609375]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 6.0, 2.0, 11.0, 11.0, 17.0, 23.0, 35.0, 55.0, 69.0, 113.0, 153.0, 201.0, 298.0, 464.0, 645.0, 1004.0, 1456.0, 2164.0, 3401.0, 5241.0, 8283.0, 13221.0, 20938.0, 34417.0, 56590.0, 96935.0, 167362.0, 232381.0, 163245.0, 94146.0, 55419.0, 33699.0, 20545.0, 12833.0, 8004.0, 5205.0, 3329.0, 2176.0, 1456.0, 952.0, 658.0, 397.0, 314.0, 237.0, 133.0, 95.0, 75.0, 43.0, 33.0, 26.0, 10.0, 13.0, 10.0, 9.0, 3.0, 2.0, 1.0, 3.0], "bins": [-1.8154296875, -1.761199951171875, -1.70697021484375, -1.652740478515625, -1.5985107421875, -1.544281005859375, -1.49005126953125, -1.435821533203125, -1.381591796875, -1.327362060546875, -1.27313232421875, -1.218902587890625, -1.1646728515625, -1.110443115234375, -1.05621337890625, -1.001983642578125, -0.94775390625, -0.893524169921875, -0.83929443359375, -0.785064697265625, -0.7308349609375, -0.676605224609375, -0.62237548828125, -0.568145751953125, -0.513916015625, -0.459686279296875, -0.40545654296875, -0.351226806640625, -0.2969970703125, -0.242767333984375, -0.18853759765625, -0.134307861328125, -0.080078125, -0.025848388671875, 0.02838134765625, 0.082611083984375, 0.1368408203125, 0.191070556640625, 0.24530029296875, 0.299530029296875, 0.353759765625, 0.407989501953125, 0.46221923828125, 0.516448974609375, 0.5706787109375, 0.624908447265625, 0.67913818359375, 0.733367919921875, 0.78759765625, 0.841827392578125, 0.89605712890625, 0.950286865234375, 1.0045166015625, 1.058746337890625, 1.11297607421875, 1.167205810546875, 1.221435546875, 1.275665283203125, 1.32989501953125, 1.384124755859375, 1.4383544921875, 1.492584228515625, 1.54681396484375, 1.601043701171875, 1.6552734375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 5.0, 8.0, 1.0, 7.0, 17.0, 5.0, 7.0, 7.0, 19.0, 26.0, 24.0, 35.0, 28.0, 34.0, 28.0, 25.0, 35.0, 38.0, 50.0, 43.0, 42.0, 1072.0, 33.0, 53.0, 60.0, 49.0, 33.0, 35.0, 24.0, 30.0, 29.0, 15.0, 23.0, 17.0, 13.0, 16.0, 10.0, 8.0, 11.0, 3.0, 3.0, 7.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.578125, -8.3406982421875, -8.103271484375, -7.8658447265625, -7.62841796875, -7.3909912109375, -7.153564453125, -6.9161376953125, -6.6787109375, -6.4412841796875, -6.203857421875, -5.9664306640625, -5.72900390625, -5.4915771484375, -5.254150390625, -5.0167236328125, -4.779296875, -4.5418701171875, -4.304443359375, -4.0670166015625, -3.82958984375, -3.5921630859375, -3.354736328125, -3.1173095703125, -2.8798828125, -2.6424560546875, -2.405029296875, -2.1676025390625, -1.93017578125, -1.6927490234375, -1.455322265625, -1.2178955078125, -0.98046875, -0.7430419921875, -0.505615234375, -0.2681884765625, -0.03076171875, 0.2066650390625, 0.444091796875, 0.6815185546875, 0.9189453125, 1.1563720703125, 1.393798828125, 1.6312255859375, 1.86865234375, 2.1060791015625, 2.343505859375, 2.5809326171875, 2.818359375, 3.0557861328125, 3.293212890625, 3.5306396484375, 3.76806640625, 4.0054931640625, 4.242919921875, 4.4803466796875, 4.7177734375, 4.9552001953125, 5.192626953125, 5.4300537109375, 5.66748046875, 5.9049072265625, 6.142333984375, 6.3797607421875, 6.6171875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 6.0, 2.0, 3.0, 8.0, 11.0, 12.0, 28.0, 37.0, 48.0, 63.0, 109.0, 160.0, 241.0, 343.0, 548.0, 782.0, 1261.0, 1837.0, 2833.0, 4263.0, 6344.0, 9724.0, 14726.0, 23056.0, 36298.0, 57566.0, 92299.0, 150842.0, 1258960.0, 162509.0, 99884.0, 62108.0, 38855.0, 24959.0, 15996.0, 10350.0, 6841.0, 4432.0, 2888.0, 1942.0, 1294.0, 926.0, 578.0, 361.0, 292.0, 171.0, 121.0, 79.0, 54.0, 35.0, 22.0, 15.0, 8.0, 15.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4296875, -1.3829345703125, -1.336181640625, -1.2894287109375, -1.24267578125, -1.1959228515625, -1.149169921875, -1.1024169921875, -1.0556640625, -1.0089111328125, -0.962158203125, -0.9154052734375, -0.86865234375, -0.8218994140625, -0.775146484375, -0.7283935546875, -0.681640625, -0.6348876953125, -0.588134765625, -0.5413818359375, -0.49462890625, -0.4478759765625, -0.401123046875, -0.3543701171875, -0.3076171875, -0.2608642578125, -0.214111328125, -0.1673583984375, -0.12060546875, -0.0738525390625, -0.027099609375, 0.0196533203125, 0.06640625, 0.1131591796875, 0.159912109375, 0.2066650390625, 0.25341796875, 0.3001708984375, 0.346923828125, 0.3936767578125, 0.4404296875, 0.4871826171875, 0.533935546875, 0.5806884765625, 0.62744140625, 0.6741943359375, 0.720947265625, 0.7677001953125, 0.814453125, 0.8612060546875, 0.907958984375, 0.9547119140625, 1.00146484375, 1.0482177734375, 1.094970703125, 1.1417236328125, 1.1884765625, 1.2352294921875, 1.281982421875, 1.3287353515625, 1.37548828125, 1.4222412109375, 1.468994140625, 1.5157470703125, 1.5625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 3.0, 7.0, 3.0, 9.0, 12.0, 9.0, 15.0, 19.0, 31.0, 39.0, 39.0, 60.0, 49.0, 65.0, 54.0, 59.0, 67.0, 63.0, 52.0, 44.0, 54.0, 51.0, 36.0, 27.0, 24.0, 24.0, 12.0, 19.0, 13.0, 6.0, 8.0, 5.0, 3.0, 5.0, 0.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.003002166748046875, -0.002920866012573242, -0.0028395652770996094, -0.0027582645416259766, -0.0026769638061523438, -0.002595663070678711, -0.002514362335205078, -0.0024330615997314453, -0.0023517608642578125, -0.0022704601287841797, -0.002189159393310547, -0.002107858657836914, -0.0020265579223632812, -0.0019452571868896484, -0.0018639564514160156, -0.0017826557159423828, -0.00170135498046875, -0.0016200542449951172, -0.0015387535095214844, -0.0014574527740478516, -0.0013761520385742188, -0.001294851303100586, -0.0012135505676269531, -0.0011322498321533203, -0.0010509490966796875, -0.0009696483612060547, -0.0008883476257324219, -0.0008070468902587891, -0.0007257461547851562, -0.0006444454193115234, -0.0005631446838378906, -0.0004818439483642578, -0.000400543212890625, -0.0003192424774169922, -0.00023794174194335938, -0.00015664100646972656, -7.534027099609375e-05, 5.9604644775390625e-06, 8.726119995117188e-05, 0.0001685619354248047, 0.0002498626708984375, 0.0003311634063720703, 0.0004124641418457031, 0.0004937648773193359, 0.0005750656127929688, 0.0006563663482666016, 0.0007376670837402344, 0.0008189678192138672, 0.0009002685546875, 0.0009815692901611328, 0.0010628700256347656, 0.0011441707611083984, 0.0012254714965820312, 0.001306772232055664, 0.0013880729675292969, 0.0014693737030029297, 0.0015506744384765625, 0.0016319751739501953, 0.0017132759094238281, 0.001794576644897461, 0.0018758773803710938, 0.0019571781158447266, 0.0020384788513183594, 0.002119779586791992, 0.002201080322265625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 5.0, 3.0, 8.0, 6.0, 7.0, 22.0, 14.0, 22.0, 23.0, 30.0, 40.0, 51.0, 74.0, 100.0, 119.0, 186.0, 286.0, 551.0, 2066.0, 929521.0, 113110.0, 1043.0, 450.0, 227.0, 152.0, 116.0, 78.0, 70.0, 38.0, 31.0, 15.0, 16.0, 13.0, 12.0, 10.0, 11.0, 5.0, 5.0, 9.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.045013427734375, -0.0433964729309082, -0.041779518127441406, -0.04016256332397461, -0.03854560852050781, -0.036928653717041016, -0.03531169891357422, -0.03369474411010742, -0.032077789306640625, -0.030460834503173828, -0.02884387969970703, -0.027226924896240234, -0.025609970092773438, -0.02399301528930664, -0.022376060485839844, -0.020759105682373047, -0.01914215087890625, -0.017525196075439453, -0.015908241271972656, -0.01429128646850586, -0.012674331665039062, -0.011057376861572266, -0.009440422058105469, -0.007823467254638672, -0.006206512451171875, -0.004589557647705078, -0.0029726028442382812, -0.0013556480407714844, 0.0002613067626953125, 0.0018782615661621094, 0.0034952163696289062, 0.005112171173095703, 0.0067291259765625, 0.008346080780029297, 0.009963035583496094, 0.01157999038696289, 0.013196945190429688, 0.014813899993896484, 0.01643085479736328, 0.018047809600830078, 0.019664764404296875, 0.021281719207763672, 0.02289867401123047, 0.024515628814697266, 0.026132583618164062, 0.02774953842163086, 0.029366493225097656, 0.030983448028564453, 0.03260040283203125, 0.03421735763549805, 0.035834312438964844, 0.03745126724243164, 0.03906822204589844, 0.040685176849365234, 0.04230213165283203, 0.04391908645629883, 0.045536041259765625, 0.04715299606323242, 0.04876995086669922, 0.050386905670166016, 0.05200386047363281, 0.05362081527709961, 0.055237770080566406, 0.0568547248840332, 0.0584716796875]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 23.0, 159.0, 567.0, 231.0, 31.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01107342541217804, -0.010858663357794285, -0.010643900372087955, -0.0104291383177042, -0.010214376263320446, -0.009999613277614117, -0.009784851223230362, -0.009570089168846607, -0.009355326183140278, -0.009140564128756523, -0.008925801143050194, -0.008711039088666439, -0.008496277034282684, -0.008281514048576355, -0.0080667519941926, -0.007851989939808846, -0.0076372274197638035, -0.0074224648997187614, -0.007207702845335007, -0.006992940325289965, -0.006778177805244923, -0.006563415750861168, -0.006348653230816126, -0.006133890710771084, -0.005919128656387329, -0.005704366136342287, -0.005489604081958532, -0.00527484156191349, -0.005060079041868448, -0.004845316521823406, -0.0046305544674396515, -0.0044157919473946095, -0.004201029427349567, -0.003986266907304525, -0.003771504620090127, -0.0035567423328757286, -0.0033419798128306866, -0.003127217525616288, -0.00291245523840189, -0.0026976927183568478, -0.002482930663973093, -0.0022681683767586946, -0.0020534058567136526, -0.0018386435694992542, -0.001623881165869534, -0.0014091187622398138, -0.0011943564750254154, -0.0009795940713956952, -0.000764831667765975, -0.0005500692641362548, -0.0003353069187141955, -0.00012054457329213619, 9.421783033758402e-05, 0.00030898023396730423, 0.0005237425211817026, 0.0007385049248114228, 0.000953267328441143, 0.0011680297320708632, 0.0013827921357005835, 0.0015975544229149818, 0.001812316826544702, 0.0020270792301744223, 0.0022418415173888206, 0.0024566040374338627, 0.002671366324648261]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 5.0, 3.0, 4.0, 12.0, 7.0, 10.0, 11.0, 10.0, 19.0, 20.0, 20.0, 19.0, 23.0, 30.0, 39.0, 32.0, 31.0, 38.0, 37.0, 33.0, 39.0, 44.0, 28.0, 29.0, 35.0, 43.0, 34.0, 36.0, 24.0, 34.0, 36.0, 26.0, 35.0, 15.0, 20.0, 18.0, 7.0, 17.0, 14.0, 20.0, 6.0, 5.0, 6.0, 11.0, 4.0, 3.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.00114518404006958, -0.0011092368513345718, -0.0010732896625995636, -0.0010373424738645554, -0.0010013952851295471, -0.0009654480963945389, -0.0009295009076595306, -0.0008935537189245224, -0.0008576065301895142, -0.0008216593414545059, -0.0007857121527194977, -0.0007497649639844894, -0.0007138177752494812, -0.000677870586514473, -0.0006419233977794647, -0.0006059762090444565, -0.0005700290203094482, -0.00053408183157444, -0.0004981346428394318, -0.0004621874541044235, -0.0004262402653694153, -0.00039029307663440704, -0.0003543458878993988, -0.00031839869916439056, -0.0002824515104293823, -0.0002465043216943741, -0.00021055713295936584, -0.0001746099442243576, -0.00013866275548934937, -0.00010271556675434113, -6.676837801933289e-05, -3.0821189284324646e-05, 5.125999450683594e-06, 4.1073188185691833e-05, 7.702037692070007e-05, 0.00011296756565570831, 0.00014891475439071655, 0.0001848619431257248, 0.00022080913186073303, 0.00025675632059574127, 0.0002927035093307495, 0.00032865069806575775, 0.000364597886800766, 0.00040054507553577423, 0.00043649226427078247, 0.0004724394530057907, 0.000508386641740799, 0.0005443338304758072, 0.0005802810192108154, 0.0006162282079458237, 0.0006521753966808319, 0.0006881225854158401, 0.0007240697741508484, 0.0007600169628858566, 0.0007959641516208649, 0.0008319113403558731, 0.0008678585290908813, 0.0009038057178258896, 0.0009397529065608978, 0.0009757000952959061, 0.0010116472840309143, 0.0010475944727659225, 0.0010835416615009308, 0.001119488850235939, 0.0011554360389709473]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 3.0, 1.0, 3.0, 11.0, 4.0, 10.0, 15.0, 13.0, 12.0, 19.0, 28.0, 21.0, 21.0, 33.0, 22.0, 29.0, 32.0, 35.0, 48.0, 44.0, 41.0, 38.0, 48.0, 44.0, 41.0, 44.0, 39.0, 40.0, 28.0, 25.0, 22.0, 29.0, 24.0, 24.0, 19.0, 16.0, 16.0, 12.0, 4.0, 17.0, 6.0, 7.0, 7.0, 2.0, 3.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-11.2109375, -10.8543701171875, -10.497802734375, -10.1412353515625, -9.78466796875, -9.4281005859375, -9.071533203125, -8.7149658203125, -8.3583984375, -8.0018310546875, -7.645263671875, -7.2886962890625, -6.93212890625, -6.5755615234375, -6.218994140625, -5.8624267578125, -5.505859375, -5.1492919921875, -4.792724609375, -4.4361572265625, -4.07958984375, -3.7230224609375, -3.366455078125, -3.0098876953125, -2.6533203125, -2.2967529296875, -1.940185546875, -1.5836181640625, -1.22705078125, -0.8704833984375, -0.513916015625, -0.1573486328125, 0.19921875, 0.5557861328125, 0.912353515625, 1.2689208984375, 1.62548828125, 1.9820556640625, 2.338623046875, 2.6951904296875, 3.0517578125, 3.4083251953125, 3.764892578125, 4.1214599609375, 4.47802734375, 4.8345947265625, 5.191162109375, 5.5477294921875, 5.904296875, 6.2608642578125, 6.617431640625, 6.9739990234375, 7.33056640625, 7.6871337890625, 8.043701171875, 8.4002685546875, 8.7568359375, 9.1134033203125, 9.469970703125, 9.8265380859375, 10.18310546875, 10.5396728515625, 10.896240234375, 11.2528076171875, 11.609375]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 6.0, 3.0, 22.0, 10.0, 24.0, 23.0, 46.0, 54.0, 80.0, 98.0, 145.0, 241.0, 318.0, 429.0, 620.0, 989.0, 1715.0, 3290.0, 7053.0, 17460.0, 46330.0, 138051.0, 459733.0, 250180.0, 73824.0, 26794.0, 10538.0, 4539.0, 2288.0, 1174.0, 749.0, 487.0, 337.0, 266.0, 191.0, 143.0, 79.0, 70.0, 45.0, 46.0, 19.0, 18.0, 8.0, 4.0, 9.0, 8.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.015625, -12.6053466796875, -12.195068359375, -11.7847900390625, -11.37451171875, -10.9642333984375, -10.553955078125, -10.1436767578125, -9.7333984375, -9.3231201171875, -8.912841796875, -8.5025634765625, -8.09228515625, -7.6820068359375, -7.271728515625, -6.8614501953125, -6.451171875, -6.0408935546875, -5.630615234375, -5.2203369140625, -4.81005859375, -4.3997802734375, -3.989501953125, -3.5792236328125, -3.1689453125, -2.7586669921875, -2.348388671875, -1.9381103515625, -1.52783203125, -1.1175537109375, -0.707275390625, -0.2969970703125, 0.11328125, 0.5235595703125, 0.933837890625, 1.3441162109375, 1.75439453125, 2.1646728515625, 2.574951171875, 2.9852294921875, 3.3955078125, 3.8057861328125, 4.216064453125, 4.6263427734375, 5.03662109375, 5.4468994140625, 5.857177734375, 6.2674560546875, 6.677734375, 7.0880126953125, 7.498291015625, 7.9085693359375, 8.31884765625, 8.7291259765625, 9.139404296875, 9.5496826171875, 9.9599609375, 10.3702392578125, 10.780517578125, 11.1907958984375, 11.60107421875, 12.0113525390625, 12.421630859375, 12.8319091796875, 13.2421875]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 2.0, 6.0, 3.0, 5.0, 9.0, 11.0, 18.0, 13.0, 15.0, 15.0, 20.0, 24.0, 24.0, 35.0, 23.0, 27.0, 41.0, 36.0, 50.0, 65.0, 120.0, 310.0, 1564.0, 148.0, 73.0, 53.0, 45.0, 35.0, 29.0, 26.0, 20.0, 31.0, 22.0, 27.0, 20.0, 17.0, 14.0, 9.0, 7.0, 7.0, 9.0, 8.0, 5.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-27.4375, -26.634765625, -25.83203125, -25.029296875, -24.2265625, -23.423828125, -22.62109375, -21.818359375, -21.015625, -20.212890625, -19.41015625, -18.607421875, -17.8046875, -17.001953125, -16.19921875, -15.396484375, -14.59375, -13.791015625, -12.98828125, -12.185546875, -11.3828125, -10.580078125, -9.77734375, -8.974609375, -8.171875, -7.369140625, -6.56640625, -5.763671875, -4.9609375, -4.158203125, -3.35546875, -2.552734375, -1.75, -0.947265625, -0.14453125, 0.658203125, 1.4609375, 2.263671875, 3.06640625, 3.869140625, 4.671875, 5.474609375, 6.27734375, 7.080078125, 7.8828125, 8.685546875, 9.48828125, 10.291015625, 11.09375, 11.896484375, 12.69921875, 13.501953125, 14.3046875, 15.107421875, 15.91015625, 16.712890625, 17.515625, 18.318359375, 19.12109375, 19.923828125, 20.7265625, 21.529296875, 22.33203125, 23.134765625, 23.9375]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 6.0, 10.0, 14.0, 14.0, 20.0, 38.0, 27.0, 53.0, 73.0, 96.0, 163.0, 231.0, 369.0, 801.0, 5957.0, 326591.0, 2791882.0, 16797.0, 1247.0, 429.0, 271.0, 176.0, 115.0, 93.0, 60.0, 39.0, 31.0, 25.0, 15.0, 16.0, 9.0, 12.0, 4.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-61.84375, -60.0849609375, -58.326171875, -56.5673828125, -54.80859375, -53.0498046875, -51.291015625, -49.5322265625, -47.7734375, -46.0146484375, -44.255859375, -42.4970703125, -40.73828125, -38.9794921875, -37.220703125, -35.4619140625, -33.703125, -31.9443359375, -30.185546875, -28.4267578125, -26.66796875, -24.9091796875, -23.150390625, -21.3916015625, -19.6328125, -17.8740234375, -16.115234375, -14.3564453125, -12.59765625, -10.8388671875, -9.080078125, -7.3212890625, -5.5625, -3.8037109375, -2.044921875, -0.2861328125, 1.47265625, 3.2314453125, 4.990234375, 6.7490234375, 8.5078125, 10.2666015625, 12.025390625, 13.7841796875, 15.54296875, 17.3017578125, 19.060546875, 20.8193359375, 22.578125, 24.3369140625, 26.095703125, 27.8544921875, 29.61328125, 31.3720703125, 33.130859375, 34.8896484375, 36.6484375, 38.4072265625, 40.166015625, 41.9248046875, 43.68359375, 45.4423828125, 47.201171875, 48.9599609375, 50.71875]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 30.0, 221.0, 497.0, 244.0, 24.0, 1.0, 1.0], "bins": [-249.39454650878906, -245.20701599121094, -241.01947021484375, -236.83193969726562, -232.6444091796875, -228.4568634033203, -224.2693328857422, -220.08180236816406, -215.89425659179688, -211.70672607421875, -207.51918029785156, -203.33164978027344, -199.1441192626953, -194.95657348632812, -190.76904296875, -186.58151245117188, -182.39398193359375, -178.20645141601562, -174.01890563964844, -169.8313751220703, -165.6438446044922, -161.456298828125, -157.26876831054688, -153.08123779296875, -148.89369201660156, -144.70616149902344, -140.51861572265625, -136.33108520507812, -132.1435546875, -127.95600891113281, -123.76847839355469, -119.58094024658203, -115.39338684082031, -111.20584869384766, -107.01831817626953, -102.83078002929688, -98.64324188232422, -94.45570373535156, -90.26817321777344, -86.08063507080078, -81.89310455322266, -77.70556640625, -73.51803588867188, -69.33049774169922, -65.14295959472656, -60.95542526245117, -56.76789093017578, -52.580352783203125, -48.392818450927734, -44.205284118652344, -40.01774597167969, -35.8302116394043, -31.642675399780273, -27.45513916015625, -23.26760482788086, -19.080068588256836, -14.892532348632812, -10.704996109008789, -6.517460823059082, -2.329925537109375, 1.8576107025146484, 6.045146942138672, 10.232681274414062, 14.420217514038086, 18.60775375366211]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 4.0, 4.0, 7.0, 6.0, 10.0, 9.0, 12.0, 15.0, 18.0, 19.0, 34.0, 32.0, 27.0, 36.0, 33.0, 30.0, 32.0, 33.0, 34.0, 33.0, 40.0, 45.0, 41.0, 41.0, 44.0, 34.0, 42.0, 40.0, 30.0, 26.0, 25.0, 20.0, 22.0, 14.0, 14.0, 18.0, 15.0, 12.0, 9.0, 9.0, 7.0, 5.0, 5.0, 5.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-62.89476013183594, -61.11080551147461, -59.32685089111328, -57.54289245605469, -55.75893783569336, -53.97498321533203, -52.1910285949707, -50.407073974609375, -48.62311935424805, -46.83916473388672, -45.05521011352539, -43.27125549316406, -41.48729705810547, -39.70334243774414, -37.91938781738281, -36.135433197021484, -34.351478576660156, -32.56752395629883, -30.783567428588867, -28.99961280822754, -27.21565818786621, -25.43170166015625, -23.647747039794922, -21.863792419433594, -20.079833984375, -18.295879364013672, -16.51192283630371, -14.727968215942383, -12.944013595581055, -11.16005802154541, -9.376102447509766, -7.5921478271484375, -5.808193206787109, -4.024238109588623, -2.2402827739715576, -0.4563274383544922, 1.3276276588439941, 3.1115827560424805, 4.895538330078125, 6.679492950439453, 8.463448524475098, 10.247404098510742, 12.03135871887207, 13.815314292907715, 15.59926986694336, 17.383224487304688, 19.167179107666016, 20.951133728027344, 22.735090255737305, 24.519044876098633, 26.303001403808594, 28.086956024169922, 29.87091064453125, 31.654865264892578, 33.438819885253906, 35.2227783203125, 37.00673294067383, 38.790687561035156, 40.574642181396484, 42.35859680175781, 44.142555236816406, 45.926509857177734, 47.71046447753906, 49.49441909790039, 51.27837371826172]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 6.0, 6.0, 7.0, 13.0, 14.0, 15.0, 21.0, 23.0, 17.0, 21.0, 29.0, 30.0, 32.0, 37.0, 34.0, 40.0, 35.0, 48.0, 58.0, 55.0, 37.0, 36.0, 46.0, 45.0, 34.0, 33.0, 23.0, 34.0, 30.0, 24.0, 18.0, 29.0, 13.0, 9.0, 11.0, 10.0, 7.0, 7.0, 3.0, 7.0, 3.0, 2.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.21875, -11.842529296875, -11.46630859375, -11.090087890625, -10.7138671875, -10.337646484375, -9.96142578125, -9.585205078125, -9.208984375, -8.832763671875, -8.45654296875, -8.080322265625, -7.7041015625, -7.327880859375, -6.95166015625, -6.575439453125, -6.19921875, -5.822998046875, -5.44677734375, -5.070556640625, -4.6943359375, -4.318115234375, -3.94189453125, -3.565673828125, -3.189453125, -2.813232421875, -2.43701171875, -2.060791015625, -1.6845703125, -1.308349609375, -0.93212890625, -0.555908203125, -0.1796875, 0.196533203125, 0.57275390625, 0.948974609375, 1.3251953125, 1.701416015625, 2.07763671875, 2.453857421875, 2.830078125, 3.206298828125, 3.58251953125, 3.958740234375, 4.3349609375, 4.711181640625, 5.08740234375, 5.463623046875, 5.83984375, 6.216064453125, 6.59228515625, 6.968505859375, 7.3447265625, 7.720947265625, 8.09716796875, 8.473388671875, 8.849609375, 9.225830078125, 9.60205078125, 9.978271484375, 10.3544921875, 10.730712890625, 11.10693359375, 11.483154296875, 11.859375]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 6.0, 4.0, 4.0, 13.0, 12.0, 13.0, 18.0, 28.0, 27.0, 36.0, 53.0, 62.0, 92.0, 124.0, 188.0, 273.0, 335.0, 461.0, 2908.0, 4186821.0, 1144.0, 477.0, 343.0, 223.0, 165.0, 121.0, 81.0, 62.0, 48.0, 34.0, 28.0, 12.0, 11.0, 22.0, 9.0, 6.0, 8.0, 5.0, 3.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-289.5, -279.96875, -270.4375, -260.90625, -251.375, -241.84375, -232.3125, -222.78125, -213.25, -203.71875, -194.1875, -184.65625, -175.125, -165.59375, -156.0625, -146.53125, -137.0, -127.46875, -117.9375, -108.40625, -98.875, -89.34375, -79.8125, -70.28125, -60.75, -51.21875, -41.6875, -32.15625, -22.625, -13.09375, -3.5625, 5.96875, 15.5, 25.03125, 34.5625, 44.09375, 53.625, 63.15625, 72.6875, 82.21875, 91.75, 101.28125, 110.8125, 120.34375, 129.875, 139.40625, 148.9375, 158.46875, 168.0, 177.53125, 187.0625, 196.59375, 206.125, 215.65625, 225.1875, 234.71875, 244.25, 253.78125, 263.3125, 272.84375, 282.375, 291.90625, 301.4375, 310.96875, 320.5]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 12.0, 16.0, 37.0, 46.0, 66.0, 144.0, 312.0, 771.0, 1212.0, 801.0, 306.0, 157.0, 82.0, 41.0, 35.0, 16.0, 15.0, 4.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.0, -29.87353515625, -28.7470703125, -27.62060546875, -26.494140625, -25.36767578125, -24.2412109375, -23.11474609375, -21.98828125, -20.86181640625, -19.7353515625, -18.60888671875, -17.482421875, -16.35595703125, -15.2294921875, -14.10302734375, -12.9765625, -11.85009765625, -10.7236328125, -9.59716796875, -8.470703125, -7.34423828125, -6.2177734375, -5.09130859375, -3.96484375, -2.83837890625, -1.7119140625, -0.58544921875, 0.541015625, 1.66748046875, 2.7939453125, 3.92041015625, 5.046875, 6.17333984375, 7.2998046875, 8.42626953125, 9.552734375, 10.67919921875, 11.8056640625, 12.93212890625, 14.05859375, 15.18505859375, 16.3115234375, 17.43798828125, 18.564453125, 19.69091796875, 20.8173828125, 21.94384765625, 23.0703125, 24.19677734375, 25.3232421875, 26.44970703125, 27.576171875, 28.70263671875, 29.8291015625, 30.95556640625, 32.08203125, 33.20849609375, 34.3349609375, 35.46142578125, 36.587890625, 37.71435546875, 38.8408203125, 39.96728515625, 41.09375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 4.0, 6.0, 9.0, 13.0, 12.0, 16.0, 20.0, 20.0, 22.0, 25.0, 34.0, 51.0, 60.0, 70.0, 137.0, 383.0, 5507.0, 4171130.0, 15705.0, 549.0, 156.0, 65.0, 62.0, 40.0, 33.0, 24.0, 22.0, 20.0, 28.0, 17.0, 9.0, 8.0, 7.0, 6.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-170.875, -166.072265625, -161.26953125, -156.466796875, -151.6640625, -146.861328125, -142.05859375, -137.255859375, -132.453125, -127.650390625, -122.84765625, -118.044921875, -113.2421875, -108.439453125, -103.63671875, -98.833984375, -94.03125, -89.228515625, -84.42578125, -79.623046875, -74.8203125, -70.017578125, -65.21484375, -60.412109375, -55.609375, -50.806640625, -46.00390625, -41.201171875, -36.3984375, -31.595703125, -26.79296875, -21.990234375, -17.1875, -12.384765625, -7.58203125, -2.779296875, 2.0234375, 6.826171875, 11.62890625, 16.431640625, 21.234375, 26.037109375, 30.83984375, 35.642578125, 40.4453125, 45.248046875, 50.05078125, 54.853515625, 59.65625, 64.458984375, 69.26171875, 74.064453125, 78.8671875, 83.669921875, 88.47265625, 93.275390625, 98.078125, 102.880859375, 107.68359375, 112.486328125, 117.2890625, 122.091796875, 126.89453125, 131.697265625, 136.5]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 17.0, 40.0, 180.0, 319.0, 301.0, 118.0, 32.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-126.09324645996094, -121.01203918457031, -115.93083190917969, -110.84961700439453, -105.7684097290039, -100.68720245361328, -95.60598754882812, -90.5247802734375, -85.44357299804688, -80.36236572265625, -75.28115844726562, -70.19994354248047, -65.11873626708984, -60.03752899169922, -54.95631790161133, -49.87510681152344, -44.79389953613281, -39.71269226074219, -34.6314811706543, -29.55027198791504, -24.46906280517578, -19.387853622436523, -14.306644439697266, -9.225433349609375, -4.14422607421875, 0.9369831085205078, 6.018192291259766, 11.099401473999023, 16.18061065673828, 21.26181983947754, 26.343029022216797, 31.424240112304688, 36.50544738769531, 41.58665466308594, 46.66786575317383, 51.74907684326172, 56.830284118652344, 61.91149139404297, 66.99270629882812, 72.07391357421875, 77.15512084960938, 82.236328125, 87.31753540039062, 92.39875030517578, 97.4799575805664, 102.56116485595703, 107.64237976074219, 112.72358703613281, 117.80479431152344, 122.88600158691406, 127.96720886230469, 133.0484161376953, 138.129638671875, 143.21084594726562, 148.29205322265625, 153.37326049804688, 158.4544677734375, 163.53567504882812, 168.61688232421875, 173.69808959960938, 178.779296875, 183.8605194091797, 188.9417266845703, 194.02293395996094, 199.10414123535156]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 4.0, 10.0, 6.0, 7.0, 13.0, 9.0, 21.0, 24.0, 20.0, 15.0, 35.0, 30.0, 33.0, 44.0, 47.0, 46.0, 34.0, 41.0, 48.0, 51.0, 44.0, 36.0, 37.0, 26.0, 45.0, 39.0, 23.0, 26.0, 28.0, 24.0, 24.0, 24.0, 18.0, 17.0, 10.0, 8.0, 9.0, 8.0, 7.0, 1.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-60.21525573730469, -58.28989028930664, -56.364524841308594, -54.43915939331055, -52.5137939453125, -50.58842468261719, -48.66305923461914, -46.737693786621094, -44.81232833862305, -42.886962890625, -40.96159744262695, -39.036231994628906, -37.110862731933594, -35.18550109863281, -33.2601318359375, -31.334766387939453, -29.409400939941406, -27.48403549194336, -25.558670043945312, -23.633302688598633, -21.707937240600586, -19.78257179260254, -17.85720443725586, -15.931838989257812, -14.006473541259766, -12.081108093261719, -10.155741691589355, -8.230375289916992, -6.305009841918945, -4.379644393920898, -2.454277992248535, -0.5289115905761719, 1.396453857421875, 3.32181978225708, 5.247185707092285, 7.17255163192749, 9.097917556762695, 11.023283004760742, 12.948649406433105, 14.874015808105469, 16.799381256103516, 18.724746704101562, 20.65011215209961, 22.57547950744629, 24.500844955444336, 26.426210403442383, 28.351577758789062, 30.27694320678711, 32.202308654785156, 34.1276741027832, 36.05303955078125, 37.9784049987793, 39.903770446777344, 41.829139709472656, 43.7545051574707, 45.67987060546875, 47.6052360534668, 49.530601501464844, 51.45596694946289, 53.38133239746094, 55.30670166015625, 57.23206329345703, 59.157432556152344, 61.08279800415039, 63.00816345214844]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 2.0, 2.0, 4.0, 3.0, 8.0, 4.0, 4.0, 10.0, 7.0, 15.0, 21.0, 15.0, 18.0, 16.0, 25.0, 18.0, 26.0, 20.0, 27.0, 36.0, 24.0, 42.0, 40.0, 53.0, 32.0, 49.0, 33.0, 49.0, 31.0, 31.0, 39.0, 28.0, 27.0, 34.0, 25.0, 28.0, 23.0, 14.0, 19.0, 11.0, 22.0, 15.0, 12.0, 11.0, 7.0, 9.0, 4.0, 5.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0], "bins": [-9.3046875, -8.9827880859375, -8.660888671875, -8.3389892578125, -8.01708984375, -7.6951904296875, -7.373291015625, -7.0513916015625, -6.7294921875, -6.4075927734375, -6.085693359375, -5.7637939453125, -5.44189453125, -5.1199951171875, -4.798095703125, -4.4761962890625, -4.154296875, -3.8323974609375, -3.510498046875, -3.1885986328125, -2.86669921875, -2.5447998046875, -2.222900390625, -1.9010009765625, -1.5791015625, -1.2572021484375, -0.935302734375, -0.6134033203125, -0.29150390625, 0.0303955078125, 0.352294921875, 0.6741943359375, 0.99609375, 1.3179931640625, 1.639892578125, 1.9617919921875, 2.28369140625, 2.6055908203125, 2.927490234375, 3.2493896484375, 3.5712890625, 3.8931884765625, 4.215087890625, 4.5369873046875, 4.85888671875, 5.1807861328125, 5.502685546875, 5.8245849609375, 6.146484375, 6.4683837890625, 6.790283203125, 7.1121826171875, 7.43408203125, 7.7559814453125, 8.077880859375, 8.3997802734375, 8.7216796875, 9.0435791015625, 9.365478515625, 9.6873779296875, 10.00927734375, 10.3311767578125, 10.653076171875, 10.9749755859375, 11.296875]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 9.0, 10.0, 14.0, 22.0, 30.0, 57.0, 65.0, 120.0, 184.0, 282.0, 457.0, 816.0, 1287.0, 2349.0, 4101.0, 7127.0, 13172.0, 24340.0, 46690.0, 91519.0, 181940.0, 295030.0, 183914.0, 92618.0, 47368.0, 24522.0, 13407.0, 7265.0, 4092.0, 2302.0, 1369.0, 784.0, 479.0, 311.0, 179.0, 104.0, 86.0, 53.0, 28.0, 21.0, 11.0, 7.0, 3.0, 6.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.09765625, -2.028900146484375, -1.96014404296875, -1.891387939453125, -1.8226318359375, -1.753875732421875, -1.68511962890625, -1.616363525390625, -1.547607421875, -1.478851318359375, -1.41009521484375, -1.341339111328125, -1.2725830078125, -1.203826904296875, -1.13507080078125, -1.066314697265625, -0.99755859375, -0.928802490234375, -0.86004638671875, -0.791290283203125, -0.7225341796875, -0.653778076171875, -0.58502197265625, -0.516265869140625, -0.447509765625, -0.378753662109375, -0.30999755859375, -0.241241455078125, -0.1724853515625, -0.103729248046875, -0.03497314453125, 0.033782958984375, 0.1025390625, 0.171295166015625, 0.24005126953125, 0.308807373046875, 0.3775634765625, 0.446319580078125, 0.51507568359375, 0.583831787109375, 0.652587890625, 0.721343994140625, 0.79010009765625, 0.858856201171875, 0.9276123046875, 0.996368408203125, 1.06512451171875, 1.133880615234375, 1.20263671875, 1.271392822265625, 1.34014892578125, 1.408905029296875, 1.4776611328125, 1.546417236328125, 1.61517333984375, 1.683929443359375, 1.752685546875, 1.821441650390625, 1.89019775390625, 1.958953857421875, 2.0277099609375, 2.096466064453125, 2.16522216796875, 2.233978271484375, 2.302734375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 1.0, 5.0, 6.0, 7.0, 10.0, 16.0, 11.0, 13.0, 15.0, 26.0, 31.0, 35.0, 41.0, 34.0, 33.0, 47.0, 37.0, 45.0, 50.0, 1078.0, 40.0, 48.0, 57.0, 45.0, 22.0, 42.0, 39.0, 38.0, 28.0, 28.0, 29.0, 14.0, 10.0, 10.0, 8.0, 10.0, 8.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.90625, -7.641845703125, -7.37744140625, -7.113037109375, -6.8486328125, -6.584228515625, -6.31982421875, -6.055419921875, -5.791015625, -5.526611328125, -5.26220703125, -4.997802734375, -4.7333984375, -4.468994140625, -4.20458984375, -3.940185546875, -3.67578125, -3.411376953125, -3.14697265625, -2.882568359375, -2.6181640625, -2.353759765625, -2.08935546875, -1.824951171875, -1.560546875, -1.296142578125, -1.03173828125, -0.767333984375, -0.5029296875, -0.238525390625, 0.02587890625, 0.290283203125, 0.5546875, 0.819091796875, 1.08349609375, 1.347900390625, 1.6123046875, 1.876708984375, 2.14111328125, 2.405517578125, 2.669921875, 2.934326171875, 3.19873046875, 3.463134765625, 3.7275390625, 3.991943359375, 4.25634765625, 4.520751953125, 4.78515625, 5.049560546875, 5.31396484375, 5.578369140625, 5.8427734375, 6.107177734375, 6.37158203125, 6.635986328125, 6.900390625, 7.164794921875, 7.42919921875, 7.693603515625, 7.9580078125, 8.222412109375, 8.48681640625, 8.751220703125, 9.015625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 6.0, 9.0, 16.0, 20.0, 34.0, 38.0, 68.0, 139.0, 184.0, 341.0, 539.0, 918.0, 1512.0, 2420.0, 4053.0, 6998.0, 11793.0, 19922.0, 34904.0, 60925.0, 109274.0, 197086.0, 1301775.0, 149166.0, 83046.0, 46597.0, 26851.0, 15618.0, 9292.0, 5538.0, 3249.0, 1912.0, 1125.0, 674.0, 443.0, 230.0, 166.0, 94.0, 52.0, 47.0, 29.0, 12.0, 10.0, 4.0, 5.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8974609375, -1.838653564453125, -1.77984619140625, -1.721038818359375, -1.6622314453125, -1.603424072265625, -1.54461669921875, -1.485809326171875, -1.427001953125, -1.368194580078125, -1.30938720703125, -1.250579833984375, -1.1917724609375, -1.132965087890625, -1.07415771484375, -1.015350341796875, -0.95654296875, -0.897735595703125, -0.83892822265625, -0.780120849609375, -0.7213134765625, -0.662506103515625, -0.60369873046875, -0.544891357421875, -0.486083984375, -0.427276611328125, -0.36846923828125, -0.309661865234375, -0.2508544921875, -0.192047119140625, -0.13323974609375, -0.074432373046875, -0.015625, 0.043182373046875, 0.10198974609375, 0.160797119140625, 0.2196044921875, 0.278411865234375, 0.33721923828125, 0.396026611328125, 0.454833984375, 0.513641357421875, 0.57244873046875, 0.631256103515625, 0.6900634765625, 0.748870849609375, 0.80767822265625, 0.866485595703125, 0.92529296875, 0.984100341796875, 1.04290771484375, 1.101715087890625, 1.1605224609375, 1.219329833984375, 1.27813720703125, 1.336944580078125, 1.395751953125, 1.454559326171875, 1.51336669921875, 1.572174072265625, 1.6309814453125, 1.689788818359375, 1.74859619140625, 1.807403564453125, 1.8662109375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 9.0, 11.0, 13.0, 17.0, 13.0, 26.0, 18.0, 27.0, 43.0, 50.0, 66.0, 62.0, 78.0, 83.0, 65.0, 76.0, 74.0, 46.0, 40.0, 40.0, 27.0, 29.0, 12.0, 13.0, 10.0, 8.0, 12.0, 8.0, 4.0, 2.0, 2.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.002712249755859375, -0.0026206672191619873, -0.0025290846824645996, -0.002437502145767212, -0.0023459196090698242, -0.0022543370723724365, -0.002162754535675049, -0.002071171998977661, -0.0019795894622802734, -0.0018880069255828857, -0.001796424388885498, -0.0017048418521881104, -0.0016132593154907227, -0.001521676778793335, -0.0014300942420959473, -0.0013385117053985596, -0.0012469291687011719, -0.0011553466320037842, -0.0010637640953063965, -0.0009721815586090088, -0.0008805990219116211, -0.0007890164852142334, -0.0006974339485168457, -0.000605851411819458, -0.0005142688751220703, -0.0004226863384246826, -0.0003311038017272949, -0.00023952126502990723, -0.00014793872833251953, -5.6356191635131836e-05, 3.522634506225586e-05, 0.00012680888175964355, 0.00021839141845703125, 0.00030997395515441895, 0.00040155649185180664, 0.0004931390285491943, 0.000584721565246582, 0.0006763041019439697, 0.0007678866386413574, 0.0008594691753387451, 0.0009510517120361328, 0.0010426342487335205, 0.0011342167854309082, 0.001225799322128296, 0.0013173818588256836, 0.0014089643955230713, 0.001500546932220459, 0.0015921294689178467, 0.0016837120056152344, 0.001775294542312622, 0.0018668770790100098, 0.0019584596157073975, 0.002050042152404785, 0.002141624689102173, 0.0022332072257995605, 0.0023247897624969482, 0.002416372299194336, 0.0025079548358917236, 0.0025995373725891113, 0.002691119909286499, 0.0027827024459838867, 0.0028742849826812744, 0.002965867519378662, 0.00305745005607605, 0.0031490325927734375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 7.0, 4.0, 7.0, 8.0, 6.0, 5.0, 10.0, 24.0, 14.0, 26.0, 22.0, 41.0, 63.0, 82.0, 102.0, 152.0, 217.0, 376.0, 617.0, 1405.0, 584950.0, 457275.0, 1401.0, 610.0, 358.0, 208.0, 143.0, 98.0, 72.0, 73.0, 46.0, 31.0, 33.0, 15.0, 8.0, 7.0, 5.0, 3.0, 3.0, 5.0, 4.0, 4.0, 5.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.053497314453125, -0.05196809768676758, -0.050438880920410156, -0.048909664154052734, -0.04738044738769531, -0.04585123062133789, -0.04432201385498047, -0.04279279708862305, -0.041263580322265625, -0.0397343635559082, -0.03820514678955078, -0.03667593002319336, -0.03514671325683594, -0.033617496490478516, -0.032088279724121094, -0.030559062957763672, -0.02902984619140625, -0.027500629425048828, -0.025971412658691406, -0.024442195892333984, -0.022912979125976562, -0.02138376235961914, -0.01985454559326172, -0.018325328826904297, -0.016796112060546875, -0.015266895294189453, -0.013737678527832031, -0.01220846176147461, -0.010679244995117188, -0.009150028228759766, -0.007620811462402344, -0.006091594696044922, -0.0045623779296875, -0.003033161163330078, -0.0015039443969726562, 2.5272369384765625e-05, 0.0015544891357421875, 0.0030837059020996094, 0.004612922668457031, 0.006142139434814453, 0.007671356201171875, 0.009200572967529297, 0.010729789733886719, 0.01225900650024414, 0.013788223266601562, 0.015317440032958984, 0.016846656799316406, 0.018375873565673828, 0.01990509033203125, 0.021434307098388672, 0.022963523864746094, 0.024492740631103516, 0.026021957397460938, 0.02755117416381836, 0.02908039093017578, 0.030609607696533203, 0.032138824462890625, 0.03366804122924805, 0.03519725799560547, 0.03672647476196289, 0.03825569152832031, 0.039784908294677734, 0.041314125061035156, 0.04284334182739258, 0.04437255859375]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 12.0, 100.0, 471.0, 371.0, 58.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008021735586225986, -0.007834665477275848, -0.007647596299648285, -0.007460526656359434, -0.007273457013070583, -0.007086386904120445, -0.0068993172608315945, -0.006712247617542744, -0.006525177974253893, -0.006338108330965042, -0.006151038687676191, -0.0059639690443873405, -0.0057768989354372025, -0.005589829292148352, -0.005402759648859501, -0.00521569000557065, -0.005028620362281799, -0.0048415507189929485, -0.004654481075704098, -0.004467411432415247, -0.004280341789126396, -0.004093271680176258, -0.0039062020368874073, -0.0037191323935985565, -0.0035320627503097057, -0.003344993107020855, -0.003157923463732004, -0.0029708535876125097, -0.002783783944323659, -0.002596714301034808, -0.0024096444249153137, -0.002222574781626463, -0.002035504672676325, -0.001848435029387474, -0.0016613652696833014, -0.0014742955099791288, -0.001287225866690278, -0.0011001562234014273, -0.0009130864636972547, -0.000726016703993082, -0.0005389470607042313, -0.00035187735920771956, -0.00016480765771120787, 2.226204378530383e-05, 0.00020933174528181553, 0.0003964014467783272, 0.0005834711482748389, 0.0007705409079790115, 0.0009576105512678623, 0.001144680194556713, 0.0013317499542608857, 0.0015188197139650583, 0.0017058893572539091, 0.00189295900054276, 0.0020800288766622543, 0.002267098519951105, 0.002454168163239956, 0.0026412378065288067, 0.0028283074498176575, 0.003015377325937152, 0.0032024469692260027, 0.0033895166125148535, 0.003576586488634348, 0.0037636561319231987, 0.0039507257752120495]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 5.0, 6.0, 8.0, 6.0, 10.0, 14.0, 15.0, 8.0, 18.0, 24.0, 19.0, 28.0, 31.0, 36.0, 40.0, 50.0, 36.0, 48.0, 54.0, 52.0, 61.0, 47.0, 42.0, 44.0, 35.0, 35.0, 35.0, 36.0, 26.0, 25.0, 13.0, 22.0, 10.0, 15.0, 14.0, 7.0, 10.0, 5.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00129777193069458, -0.0012513287365436554, -0.0012048855423927307, -0.001158442348241806, -0.0011119991540908813, -0.0010655559599399567, -0.001019112765789032, -0.0009726695716381073, -0.0009262263774871826, -0.0008797831833362579, -0.0008333399891853333, -0.0007868967950344086, -0.0007404536008834839, -0.0006940104067325592, -0.0006475672125816345, -0.0006011240184307098, -0.0005546808242797852, -0.0005082376301288605, -0.0004617944359779358, -0.0004153512418270111, -0.0003689080476760864, -0.00032246485352516174, -0.00027602165937423706, -0.00022957846522331238, -0.0001831352710723877, -0.000136692076921463, -9.024888277053833e-05, -4.380568861961365e-05, 2.637505531311035e-06, 4.908069968223572e-05, 9.55238938331604e-05, 0.00014196708798408508, 0.00018841028213500977, 0.00023485347628593445, 0.00028129667043685913, 0.0003277398645877838, 0.0003741830587387085, 0.0004206262528896332, 0.00046706944704055786, 0.0005135126411914825, 0.0005599558353424072, 0.0006063990294933319, 0.0006528422236442566, 0.0006992854177951813, 0.000745728611946106, 0.0007921718060970306, 0.0008386150002479553, 0.00088505819439888, 0.0009315013885498047, 0.0009779445827007294, 0.001024387776851654, 0.0010708309710025787, 0.0011172741651535034, 0.001163717359304428, 0.0012101605534553528, 0.0012566037476062775, 0.0013030469417572021, 0.0013494901359081268, 0.0013959333300590515, 0.0014423765242099762, 0.0014888197183609009, 0.0015352629125118256, 0.0015817061066627502, 0.001628149300813675, 0.0016745924949645996]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 2.0, 2.0, 4.0, 3.0, 8.0, 4.0, 4.0, 10.0, 7.0, 15.0, 21.0, 15.0, 18.0, 16.0, 25.0, 18.0, 26.0, 20.0, 27.0, 36.0, 24.0, 42.0, 40.0, 53.0, 32.0, 49.0, 33.0, 49.0, 31.0, 31.0, 39.0, 28.0, 27.0, 34.0, 25.0, 28.0, 23.0, 14.0, 19.0, 11.0, 22.0, 15.0, 12.0, 11.0, 7.0, 9.0, 4.0, 5.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0], "bins": [-9.3046875, -8.9827880859375, -8.660888671875, -8.3389892578125, -8.01708984375, -7.6951904296875, -7.373291015625, -7.0513916015625, -6.7294921875, -6.4075927734375, -6.085693359375, -5.7637939453125, -5.44189453125, -5.1199951171875, -4.798095703125, -4.4761962890625, -4.154296875, -3.8323974609375, -3.510498046875, -3.1885986328125, -2.86669921875, -2.5447998046875, -2.222900390625, -1.9010009765625, -1.5791015625, -1.2572021484375, -0.935302734375, -0.6134033203125, -0.29150390625, 0.0303955078125, 0.352294921875, 0.6741943359375, 0.99609375, 1.3179931640625, 1.639892578125, 1.9617919921875, 2.28369140625, 2.6055908203125, 2.927490234375, 3.2493896484375, 3.5712890625, 3.8931884765625, 4.215087890625, 4.5369873046875, 4.85888671875, 5.1807861328125, 5.502685546875, 5.8245849609375, 6.146484375, 6.4683837890625, 6.790283203125, 7.1121826171875, 7.43408203125, 7.7559814453125, 8.077880859375, 8.3997802734375, 8.7216796875, 9.0435791015625, 9.365478515625, 9.6873779296875, 10.00927734375, 10.3311767578125, 10.653076171875, 10.9749755859375, 11.296875]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 5.0, 1.0, 5.0, 8.0, 7.0, 12.0, 12.0, 19.0, 23.0, 40.0, 44.0, 56.0, 99.0, 94.0, 150.0, 196.0, 298.0, 377.0, 443.0, 612.0, 819.0, 1154.0, 1891.0, 4145.0, 14035.0, 71630.0, 419636.0, 433038.0, 74598.0, 14326.0, 4291.0, 2002.0, 1165.0, 851.0, 598.0, 466.0, 388.0, 266.0, 179.0, 157.0, 106.0, 83.0, 71.0, 46.0, 29.0, 22.0, 17.0, 19.0, 10.0, 10.0, 5.0, 6.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-18.609375, -18.00927734375, -17.4091796875, -16.80908203125, -16.208984375, -15.60888671875, -15.0087890625, -14.40869140625, -13.80859375, -13.20849609375, -12.6083984375, -12.00830078125, -11.408203125, -10.80810546875, -10.2080078125, -9.60791015625, -9.0078125, -8.40771484375, -7.8076171875, -7.20751953125, -6.607421875, -6.00732421875, -5.4072265625, -4.80712890625, -4.20703125, -3.60693359375, -3.0068359375, -2.40673828125, -1.806640625, -1.20654296875, -0.6064453125, -0.00634765625, 0.59375, 1.19384765625, 1.7939453125, 2.39404296875, 2.994140625, 3.59423828125, 4.1943359375, 4.79443359375, 5.39453125, 5.99462890625, 6.5947265625, 7.19482421875, 7.794921875, 8.39501953125, 8.9951171875, 9.59521484375, 10.1953125, 10.79541015625, 11.3955078125, 11.99560546875, 12.595703125, 13.19580078125, 13.7958984375, 14.39599609375, 14.99609375, 15.59619140625, 16.1962890625, 16.79638671875, 17.396484375, 17.99658203125, 18.5966796875, 19.19677734375, 19.796875]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 3.0, 4.0, 6.0, 2.0, 7.0, 11.0, 11.0, 17.0, 19.0, 16.0, 21.0, 26.0, 26.0, 31.0, 38.0, 43.0, 54.0, 80.0, 107.0, 404.0, 1504.0, 126.0, 73.0, 55.0, 58.0, 42.0, 40.0, 32.0, 23.0, 25.0, 35.0, 17.0, 23.0, 11.0, 14.0, 6.0, 10.0, 5.0, 2.0, 7.0, 4.0, 3.0, 5.0, 1.0, 5.0, 2.0, 0.0, 1.0, 2.0], "bins": [-31.046875, -30.1611328125, -29.275390625, -28.3896484375, -27.50390625, -26.6181640625, -25.732421875, -24.8466796875, -23.9609375, -23.0751953125, -22.189453125, -21.3037109375, -20.41796875, -19.5322265625, -18.646484375, -17.7607421875, -16.875, -15.9892578125, -15.103515625, -14.2177734375, -13.33203125, -12.4462890625, -11.560546875, -10.6748046875, -9.7890625, -8.9033203125, -8.017578125, -7.1318359375, -6.24609375, -5.3603515625, -4.474609375, -3.5888671875, -2.703125, -1.8173828125, -0.931640625, -0.0458984375, 0.83984375, 1.7255859375, 2.611328125, 3.4970703125, 4.3828125, 5.2685546875, 6.154296875, 7.0400390625, 7.92578125, 8.8115234375, 9.697265625, 10.5830078125, 11.46875, 12.3544921875, 13.240234375, 14.1259765625, 15.01171875, 15.8974609375, 16.783203125, 17.6689453125, 18.5546875, 19.4404296875, 20.326171875, 21.2119140625, 22.09765625, 22.9833984375, 23.869140625, 24.7548828125, 25.640625]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 3.0, 7.0, 9.0, 7.0, 9.0, 14.0, 13.0, 9.0, 17.0, 23.0, 25.0, 36.0, 42.0, 53.0, 87.0, 140.0, 194.0, 356.0, 585.0, 1367.0, 52055.0, 3085553.0, 3103.0, 830.0, 412.0, 226.0, 151.0, 107.0, 58.0, 43.0, 45.0, 32.0, 15.0, 10.0, 9.0, 10.0, 6.0, 10.0, 6.0, 6.0, 3.0, 9.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0], "bins": [-115.875, -112.7646484375, -109.654296875, -106.5439453125, -103.43359375, -100.3232421875, -97.212890625, -94.1025390625, -90.9921875, -87.8818359375, -84.771484375, -81.6611328125, -78.55078125, -75.4404296875, -72.330078125, -69.2197265625, -66.109375, -62.9990234375, -59.888671875, -56.7783203125, -53.66796875, -50.5576171875, -47.447265625, -44.3369140625, -41.2265625, -38.1162109375, -35.005859375, -31.8955078125, -28.78515625, -25.6748046875, -22.564453125, -19.4541015625, -16.34375, -13.2333984375, -10.123046875, -7.0126953125, -3.90234375, -0.7919921875, 2.318359375, 5.4287109375, 8.5390625, 11.6494140625, 14.759765625, 17.8701171875, 20.98046875, 24.0908203125, 27.201171875, 30.3115234375, 33.421875, 36.5322265625, 39.642578125, 42.7529296875, 45.86328125, 48.9736328125, 52.083984375, 55.1943359375, 58.3046875, 61.4150390625, 64.525390625, 67.6357421875, 70.74609375, 73.8564453125, 76.966796875, 80.0771484375, 83.1875]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 50.0, 329.0, 527.0, 104.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-155.00137329101562, -148.02281188964844, -141.0442352294922, -134.065673828125, -127.08710479736328, -120.10853576660156, -113.12997436523438, -106.15140533447266, -99.17283630371094, -92.19426727294922, -85.21570587158203, -78.23713684082031, -71.2585678100586, -64.27999877929688, -57.30143737792969, -50.32286834716797, -43.34430694580078, -36.36574172973633, -29.38717269897461, -22.408607482910156, -15.43004035949707, -8.451473236083984, -1.4729080200195312, 5.5056610107421875, 12.48422622680664, 19.462793350219727, 26.441360473632812, 33.419925689697266, 40.39849090576172, 47.37705993652344, 54.35562515258789, 61.33419418334961, 68.31275939941406, 75.29132843017578, 82.26988983154297, 89.24845886230469, 96.2270278930664, 103.20559692382812, 110.18415832519531, 117.16272735595703, 124.14129638671875, 131.11985778808594, 138.0984344482422, 145.07699584960938, 152.05555725097656, 159.0341339111328, 166.0126953125, 172.99127197265625, 179.96981811523438, 186.94837951660156, 193.9269561767578, 200.905517578125, 207.8840789794922, 214.86265563964844, 221.84121704101562, 228.81979370117188, 235.79835510253906, 242.77691650390625, 249.7554931640625, 256.73406982421875, 263.7126159667969, 270.6911926269531, 277.66973876953125, 284.6483154296875, 291.62689208984375]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 5.0, 5.0, 13.0, 13.0, 16.0, 8.0, 18.0, 9.0, 20.0, 28.0, 16.0, 25.0, 21.0, 28.0, 38.0, 26.0, 30.0, 42.0, 48.0, 43.0, 47.0, 36.0, 43.0, 40.0, 34.0, 37.0, 29.0, 40.0, 34.0, 31.0, 29.0, 30.0, 14.0, 18.0, 10.0, 20.0, 15.0, 6.0, 4.0, 4.0, 6.0, 7.0, 10.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0], "bins": [-77.30536651611328, -75.1236343383789, -72.94190979003906, -70.76017761230469, -68.57844543457031, -66.39671325683594, -64.2149887084961, -62.03325653076172, -59.851524353027344, -57.669795989990234, -55.48806381225586, -53.30633544921875, -51.124603271484375, -48.942874908447266, -46.761146545410156, -44.57941436767578, -42.39768600463867, -40.21595764160156, -38.03422546386719, -35.85249710083008, -33.6707649230957, -31.489036560058594, -29.30730628967285, -27.12557601928711, -24.943845748901367, -22.762115478515625, -20.580385208129883, -18.39865493774414, -16.21692657470703, -14.035195350646973, -11.853466033935547, -9.671735763549805, -7.4900054931640625, -5.30827522277832, -3.1265454292297363, -0.9448156356811523, 1.2369146347045898, 3.418644905090332, 5.600374221801758, 7.7821044921875, 9.963834762573242, 12.145565032958984, 14.327295303344727, 16.50902557373047, 18.690753936767578, 20.872486114501953, 23.054214477539062, 25.235944747924805, 27.417675018310547, 29.59940528869629, 31.78113555908203, 33.96286392211914, 36.144596099853516, 38.326324462890625, 40.508056640625, 42.68978500366211, 44.87151336669922, 47.05324172973633, 49.2349739074707, 51.41670227050781, 53.59843444824219, 55.7801628112793, 57.961891174316406, 60.14362335205078, 62.325355529785156]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 4.0, 3.0, 2.0, 6.0, 6.0, 5.0, 3.0, 8.0, 13.0, 17.0, 17.0, 17.0, 20.0, 19.0, 28.0, 25.0, 42.0, 27.0, 34.0, 40.0, 37.0, 35.0, 47.0, 54.0, 38.0, 36.0, 49.0, 41.0, 34.0, 27.0, 33.0, 33.0, 40.0, 24.0, 20.0, 18.0, 17.0, 15.0, 15.0, 12.0, 12.0, 8.0, 10.0, 3.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.53125, -9.181396484375, -8.83154296875, -8.481689453125, -8.1318359375, -7.781982421875, -7.43212890625, -7.082275390625, -6.732421875, -6.382568359375, -6.03271484375, -5.682861328125, -5.3330078125, -4.983154296875, -4.63330078125, -4.283447265625, -3.93359375, -3.583740234375, -3.23388671875, -2.884033203125, -2.5341796875, -2.184326171875, -1.83447265625, -1.484619140625, -1.134765625, -0.784912109375, -0.43505859375, -0.085205078125, 0.2646484375, 0.614501953125, 0.96435546875, 1.314208984375, 1.6640625, 2.013916015625, 2.36376953125, 2.713623046875, 3.0634765625, 3.413330078125, 3.76318359375, 4.113037109375, 4.462890625, 4.812744140625, 5.16259765625, 5.512451171875, 5.8623046875, 6.212158203125, 6.56201171875, 6.911865234375, 7.26171875, 7.611572265625, 7.96142578125, 8.311279296875, 8.6611328125, 9.010986328125, 9.36083984375, 9.710693359375, 10.060546875, 10.410400390625, 10.76025390625, 11.110107421875, 11.4599609375, 11.809814453125, 12.15966796875, 12.509521484375, 12.859375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 6.0, 3.0, 8.0, 10.0, 10.0, 17.0, 19.0, 18.0, 36.0, 39.0, 43.0, 68.0, 83.0, 105.0, 172.0, 266.0, 453.0, 1136.0, 3186.0, 15300.0, 227280.0, 2921422.0, 975070.0, 39895.0, 6127.0, 1786.0, 663.0, 333.0, 204.0, 131.0, 93.0, 61.0, 59.0, 43.0, 34.0, 25.0, 18.0, 12.0, 16.0, 10.0, 5.0, 6.0, 6.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-32.53125, -31.566650390625, -30.60205078125, -29.637451171875, -28.6728515625, -27.708251953125, -26.74365234375, -25.779052734375, -24.814453125, -23.849853515625, -22.88525390625, -21.920654296875, -20.9560546875, -19.991455078125, -19.02685546875, -18.062255859375, -17.09765625, -16.133056640625, -15.16845703125, -14.203857421875, -13.2392578125, -12.274658203125, -11.31005859375, -10.345458984375, -9.380859375, -8.416259765625, -7.45166015625, -6.487060546875, -5.5224609375, -4.557861328125, -3.59326171875, -2.628662109375, -1.6640625, -0.699462890625, 0.26513671875, 1.229736328125, 2.1943359375, 3.158935546875, 4.12353515625, 5.088134765625, 6.052734375, 7.017333984375, 7.98193359375, 8.946533203125, 9.9111328125, 10.875732421875, 11.84033203125, 12.804931640625, 13.76953125, 14.734130859375, 15.69873046875, 16.663330078125, 17.6279296875, 18.592529296875, 19.55712890625, 20.521728515625, 21.486328125, 22.450927734375, 23.41552734375, 24.380126953125, 25.3447265625, 26.309326171875, 27.27392578125, 28.238525390625, 29.203125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 6.0, 12.0, 19.0, 21.0, 45.0, 66.0, 73.0, 60.0, 113.0, 145.0, 214.0, 289.0, 481.0, 653.0, 559.0, 401.0, 271.0, 170.0, 118.0, 92.0, 57.0, 55.0, 42.0, 32.0, 16.0, 10.0, 18.0, 9.0, 10.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-25.953125, -25.283203125, -24.61328125, -23.943359375, -23.2734375, -22.603515625, -21.93359375, -21.263671875, -20.59375, -19.923828125, -19.25390625, -18.583984375, -17.9140625, -17.244140625, -16.57421875, -15.904296875, -15.234375, -14.564453125, -13.89453125, -13.224609375, -12.5546875, -11.884765625, -11.21484375, -10.544921875, -9.875, -9.205078125, -8.53515625, -7.865234375, -7.1953125, -6.525390625, -5.85546875, -5.185546875, -4.515625, -3.845703125, -3.17578125, -2.505859375, -1.8359375, -1.166015625, -0.49609375, 0.173828125, 0.84375, 1.513671875, 2.18359375, 2.853515625, 3.5234375, 4.193359375, 4.86328125, 5.533203125, 6.203125, 6.873046875, 7.54296875, 8.212890625, 8.8828125, 9.552734375, 10.22265625, 10.892578125, 11.5625, 12.232421875, 12.90234375, 13.572265625, 14.2421875, 14.912109375, 15.58203125, 16.251953125, 16.921875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 3.0, 7.0, 11.0, 23.0, 42.0, 71.0, 114.0, 257.0, 652.0, 2369.0, 32903.0, 4035404.0, 117573.0, 3360.0, 865.0, 293.0, 152.0, 74.0, 48.0, 23.0, 16.0, 10.0, 9.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-89.8125, -87.4248046875, -85.037109375, -82.6494140625, -80.26171875, -77.8740234375, -75.486328125, -73.0986328125, -70.7109375, -68.3232421875, -65.935546875, -63.5478515625, -61.16015625, -58.7724609375, -56.384765625, -53.9970703125, -51.609375, -49.2216796875, -46.833984375, -44.4462890625, -42.05859375, -39.6708984375, -37.283203125, -34.8955078125, -32.5078125, -30.1201171875, -27.732421875, -25.3447265625, -22.95703125, -20.5693359375, -18.181640625, -15.7939453125, -13.40625, -11.0185546875, -8.630859375, -6.2431640625, -3.85546875, -1.4677734375, 0.919921875, 3.3076171875, 5.6953125, 8.0830078125, 10.470703125, 12.8583984375, 15.24609375, 17.6337890625, 20.021484375, 22.4091796875, 24.796875, 27.1845703125, 29.572265625, 31.9599609375, 34.34765625, 36.7353515625, 39.123046875, 41.5107421875, 43.8984375, 46.2861328125, 48.673828125, 51.0615234375, 53.44921875, 55.8369140625, 58.224609375, 60.6123046875, 63.0]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 37.0, 868.0, 110.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-1249.329345703125, -1227.6512451171875, -1205.97314453125, -1184.295166015625, -1162.6170654296875, -1140.93896484375, -1119.260986328125, -1097.5828857421875, -1075.90478515625, -1054.2266845703125, -1032.548583984375, -1010.87060546875, -989.1925048828125, -967.514404296875, -945.8363647460938, -924.1583251953125, -902.480224609375, -880.8021240234375, -859.1240844726562, -837.446044921875, -815.7679443359375, -794.08984375, -772.4118041992188, -750.7337646484375, -729.0556640625, -707.3775634765625, -685.6995239257812, -664.021484375, -642.3433837890625, -620.665283203125, -598.9872436523438, -577.3092041015625, -555.631103515625, -533.9530029296875, -512.2749633789062, -490.5968933105469, -468.9188232421875, -447.2407531738281, -425.56268310546875, -403.8846130371094, -382.20654296875, -360.5284729003906, -338.85040283203125, -317.1723327636719, -295.4942626953125, -273.8161926269531, -252.13812255859375, -230.46005249023438, -208.78199768066406, -187.1039276123047, -165.4258575439453, -143.74778747558594, -122.06971740722656, -100.39164733886719, -78.71357727050781, -57.03550720214844, -35.35743713378906, -13.679367065429688, 7.9987030029296875, 29.676773071289062, 51.35484313964844, 73.03291320800781, 94.71098327636719, 116.38905334472656, 138.06712341308594]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 7.0, 5.0, 7.0, 7.0, 3.0, 8.0, 12.0, 6.0, 15.0, 13.0, 26.0, 28.0, 19.0, 32.0, 34.0, 24.0, 31.0, 35.0, 43.0, 49.0, 39.0, 41.0, 62.0, 53.0, 48.0, 35.0, 35.0, 40.0, 30.0, 22.0, 35.0, 27.0, 19.0, 21.0, 12.0, 20.0, 15.0, 13.0, 8.0, 2.0, 8.0, 4.0, 4.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-80.67355346679688, -78.47052764892578, -76.26750946044922, -74.06448364257812, -71.86146545410156, -69.65843963623047, -67.45541381835938, -65.25239562988281, -63.04936981201172, -60.84634780883789, -58.64332580566406, -56.44029998779297, -54.23727798461914, -52.03425598144531, -49.831233978271484, -47.628211975097656, -45.42518997192383, -43.22216796875, -41.01914596557617, -38.816123962402344, -36.61309814453125, -34.41007614135742, -32.207054138183594, -30.004032135009766, -27.801008224487305, -25.597986221313477, -23.394962310791016, -21.191940307617188, -18.98891830444336, -16.7858943939209, -14.58287239074707, -12.379849433898926, -10.176826477050781, -7.973803520202637, -5.77078104019165, -3.567758560180664, -1.3647356033325195, 0.838287353515625, 3.041309356689453, 5.244332313537598, 7.447355270385742, 9.650378227233887, 11.853401184082031, 14.05642318725586, 16.259445190429688, 18.46246910095215, 20.665491104125977, 22.868515014648438, 25.071537017822266, 27.274559020996094, 29.477582931518555, 31.680604934692383, 33.883628845214844, 36.08665084838867, 38.2896728515625, 40.49269485473633, 42.695716857910156, 44.898738861083984, 47.10176086425781, 49.304786682128906, 51.507808685302734, 53.71083068847656, 55.91385269165039, 58.11687469482422, 60.31990051269531]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 7.0, 3.0, 4.0, 6.0, 5.0, 10.0, 12.0, 16.0, 13.0, 13.0, 23.0, 24.0, 29.0, 38.0, 33.0, 43.0, 47.0, 44.0, 48.0, 44.0, 43.0, 34.0, 41.0, 39.0, 46.0, 44.0, 34.0, 39.0, 29.0, 41.0, 26.0, 21.0, 28.0, 15.0, 13.0, 13.0, 10.0, 10.0, 10.0, 8.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7265625, -7.43310546875, -7.1396484375, -6.84619140625, -6.552734375, -6.25927734375, -5.9658203125, -5.67236328125, -5.37890625, -5.08544921875, -4.7919921875, -4.49853515625, -4.205078125, -3.91162109375, -3.6181640625, -3.32470703125, -3.03125, -2.73779296875, -2.4443359375, -2.15087890625, -1.857421875, -1.56396484375, -1.2705078125, -0.97705078125, -0.68359375, -0.39013671875, -0.0966796875, 0.19677734375, 0.490234375, 0.78369140625, 1.0771484375, 1.37060546875, 1.6640625, 1.95751953125, 2.2509765625, 2.54443359375, 2.837890625, 3.13134765625, 3.4248046875, 3.71826171875, 4.01171875, 4.30517578125, 4.5986328125, 4.89208984375, 5.185546875, 5.47900390625, 5.7724609375, 6.06591796875, 6.359375, 6.65283203125, 6.9462890625, 7.23974609375, 7.533203125, 7.82666015625, 8.1201171875, 8.41357421875, 8.70703125, 9.00048828125, 9.2939453125, 9.58740234375, 9.880859375, 10.17431640625, 10.4677734375, 10.76123046875, 11.0546875]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 8.0, 4.0, 9.0, 14.0, 18.0, 24.0, 38.0, 52.0, 76.0, 150.0, 231.0, 384.0, 655.0, 1076.0, 1929.0, 3248.0, 5529.0, 9897.0, 17208.0, 30398.0, 54229.0, 97185.0, 177252.0, 263811.0, 171365.0, 93386.0, 52025.0, 29023.0, 16836.0, 9469.0, 5412.0, 3115.0, 1815.0, 1087.0, 635.0, 367.0, 220.0, 145.0, 81.0, 51.0, 29.0, 19.0, 13.0, 14.0, 6.0, 6.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.5927734375, -1.5437164306640625, -1.494659423828125, -1.4456024169921875, -1.39654541015625, -1.3474884033203125, -1.298431396484375, -1.2493743896484375, -1.2003173828125, -1.1512603759765625, -1.102203369140625, -1.0531463623046875, -1.00408935546875, -0.9550323486328125, -0.905975341796875, -0.8569183349609375, -0.807861328125, -0.7588043212890625, -0.709747314453125, -0.6606903076171875, -0.61163330078125, -0.5625762939453125, -0.513519287109375, -0.4644622802734375, -0.4154052734375, -0.3663482666015625, -0.317291259765625, -0.2682342529296875, -0.21917724609375, -0.1701202392578125, -0.121063232421875, -0.0720062255859375, -0.02294921875, 0.0261077880859375, 0.075164794921875, 0.1242218017578125, 0.17327880859375, 0.2223358154296875, 0.271392822265625, 0.3204498291015625, 0.3695068359375, 0.4185638427734375, 0.467620849609375, 0.5166778564453125, 0.56573486328125, 0.6147918701171875, 0.663848876953125, 0.7129058837890625, 0.761962890625, 0.8110198974609375, 0.860076904296875, 0.9091339111328125, 0.95819091796875, 1.0072479248046875, 1.056304931640625, 1.1053619384765625, 1.1544189453125, 1.2034759521484375, 1.252532958984375, 1.3015899658203125, 1.35064697265625, 1.3997039794921875, 1.448760986328125, 1.4978179931640625, 1.546875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 9.0, 9.0, 4.0, 12.0, 9.0, 18.0, 22.0, 24.0, 23.0, 17.0, 28.0, 26.0, 37.0, 30.0, 27.0, 32.0, 47.0, 28.0, 41.0, 1064.0, 34.0, 41.0, 47.0, 38.0, 36.0, 43.0, 33.0, 28.0, 30.0, 22.0, 34.0, 25.0, 15.0, 15.0, 13.0, 16.0, 10.0, 10.0, 10.0, 8.0, 5.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6171875, -4.44537353515625, -4.2735595703125, -4.10174560546875, -3.929931640625, -3.75811767578125, -3.5863037109375, -3.41448974609375, -3.24267578125, -3.07086181640625, -2.8990478515625, -2.72723388671875, -2.555419921875, -2.38360595703125, -2.2117919921875, -2.03997802734375, -1.8681640625, -1.69635009765625, -1.5245361328125, -1.35272216796875, -1.180908203125, -1.00909423828125, -0.8372802734375, -0.66546630859375, -0.49365234375, -0.32183837890625, -0.1500244140625, 0.02178955078125, 0.193603515625, 0.36541748046875, 0.5372314453125, 0.70904541015625, 0.880859375, 1.05267333984375, 1.2244873046875, 1.39630126953125, 1.568115234375, 1.73992919921875, 1.9117431640625, 2.08355712890625, 2.25537109375, 2.42718505859375, 2.5989990234375, 2.77081298828125, 2.942626953125, 3.11444091796875, 3.2862548828125, 3.45806884765625, 3.6298828125, 3.80169677734375, 3.9735107421875, 4.14532470703125, 4.317138671875, 4.48895263671875, 4.6607666015625, 4.83258056640625, 5.00439453125, 5.17620849609375, 5.3480224609375, 5.51983642578125, 5.691650390625, 5.86346435546875, 6.0352783203125, 6.20709228515625, 6.37890625]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 2.0, 3.0, 6.0, 7.0, 14.0, 20.0, 38.0, 48.0, 73.0, 100.0, 148.0, 216.0, 323.0, 461.0, 684.0, 1037.0, 1492.0, 2314.0, 3425.0, 5283.0, 8004.0, 11987.0, 18794.0, 28827.0, 45585.0, 71928.0, 113044.0, 175366.0, 1243680.0, 131286.0, 83446.0, 52886.0, 33833.0, 21450.0, 14190.0, 9228.0, 6067.0, 3902.0, 2569.0, 1726.0, 1222.0, 797.0, 542.0, 354.0, 235.0, 155.0, 110.0, 63.0, 61.0, 37.0, 15.0, 23.0, 7.0, 10.0, 7.0, 4.0, 2.0, 3.0, 0.0, 3.0], "bins": [-1.1328125, -1.09759521484375, -1.0623779296875, -1.02716064453125, -0.991943359375, -0.95672607421875, -0.9215087890625, -0.88629150390625, -0.85107421875, -0.81585693359375, -0.7806396484375, -0.74542236328125, -0.710205078125, -0.67498779296875, -0.6397705078125, -0.60455322265625, -0.5693359375, -0.53411865234375, -0.4989013671875, -0.46368408203125, -0.428466796875, -0.39324951171875, -0.3580322265625, -0.32281494140625, -0.28759765625, -0.25238037109375, -0.2171630859375, -0.18194580078125, -0.146728515625, -0.11151123046875, -0.0762939453125, -0.04107666015625, -0.005859375, 0.02935791015625, 0.0645751953125, 0.09979248046875, 0.135009765625, 0.17022705078125, 0.2054443359375, 0.24066162109375, 0.27587890625, 0.31109619140625, 0.3463134765625, 0.38153076171875, 0.416748046875, 0.45196533203125, 0.4871826171875, 0.52239990234375, 0.5576171875, 0.59283447265625, 0.6280517578125, 0.66326904296875, 0.698486328125, 0.73370361328125, 0.7689208984375, 0.80413818359375, 0.83935546875, 0.87457275390625, 0.9097900390625, 0.94500732421875, 0.980224609375, 1.01544189453125, 1.0506591796875, 1.08587646484375, 1.12109375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 7.0, 5.0, 4.0, 11.0, 17.0, 11.0, 14.0, 21.0, 25.0, 19.0, 33.0, 42.0, 40.0, 61.0, 47.0, 55.0, 55.0, 65.0, 61.0, 51.0, 52.0, 52.0, 39.0, 28.0, 35.0, 33.0, 26.0, 16.0, 17.0, 10.0, 10.0, 15.0, 6.0, 7.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002025604248046875, -0.0019669532775878906, -0.0019083023071289062, -0.0018496513366699219, -0.0017910003662109375, -0.0017323493957519531, -0.0016736984252929688, -0.0016150474548339844, -0.001556396484375, -0.0014977455139160156, -0.0014390945434570312, -0.0013804435729980469, -0.0013217926025390625, -0.0012631416320800781, -0.0012044906616210938, -0.0011458396911621094, -0.001087188720703125, -0.0010285377502441406, -0.0009698867797851562, -0.0009112358093261719, -0.0008525848388671875, -0.0007939338684082031, -0.0007352828979492188, -0.0006766319274902344, -0.00061798095703125, -0.0005593299865722656, -0.0005006790161132812, -0.0004420280456542969, -0.0003833770751953125, -0.0003247261047363281, -0.00026607513427734375, -0.00020742416381835938, -0.000148773193359375, -9.012222290039062e-05, -3.147125244140625e-05, 2.7179718017578125e-05, 8.58306884765625e-05, 0.00014448165893554688, 0.00020313262939453125, 0.0002617835998535156, 0.0003204345703125, 0.0003790855407714844, 0.00043773651123046875, 0.0004963874816894531, 0.0005550384521484375, 0.0006136894226074219, 0.0006723403930664062, 0.0007309913635253906, 0.000789642333984375, 0.0008482933044433594, 0.0009069442749023438, 0.0009655952453613281, 0.0010242462158203125, 0.0010828971862792969, 0.0011415481567382812, 0.0012001991271972656, 0.00125885009765625, 0.0013175010681152344, 0.0013761520385742188, 0.0014348030090332031, 0.0014934539794921875, 0.0015521049499511719, 0.0016107559204101562, 0.0016694068908691406, 0.001728057861328125]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 6.0, 6.0, 12.0, 14.0, 12.0, 25.0, 24.0, 33.0, 46.0, 72.0, 104.0, 131.0, 174.0, 263.0, 441.0, 773.0, 4489.0, 1029541.0, 10002.0, 913.0, 456.0, 297.0, 202.0, 132.0, 87.0, 67.0, 69.0, 31.0, 42.0, 17.0, 19.0, 10.0, 9.0, 10.0, 7.0, 2.0, 8.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.038787841796875, -0.03755903244018555, -0.036330223083496094, -0.03510141372680664, -0.03387260437011719, -0.032643795013427734, -0.03141498565673828, -0.030186176300048828, -0.028957366943359375, -0.027728557586669922, -0.02649974822998047, -0.025270938873291016, -0.024042129516601562, -0.02281332015991211, -0.021584510803222656, -0.020355701446533203, -0.01912689208984375, -0.017898082733154297, -0.016669273376464844, -0.01544046401977539, -0.014211654663085938, -0.012982845306396484, -0.011754035949707031, -0.010525226593017578, -0.009296417236328125, -0.008067607879638672, -0.006838798522949219, -0.005609989166259766, -0.0043811798095703125, -0.0031523704528808594, -0.0019235610961914062, -0.0006947517395019531, 0.0005340576171875, 0.0017628669738769531, 0.0029916763305664062, 0.004220485687255859, 0.0054492950439453125, 0.006678104400634766, 0.007906913757324219, 0.009135723114013672, 0.010364532470703125, 0.011593341827392578, 0.012822151184082031, 0.014050960540771484, 0.015279769897460938, 0.01650857925415039, 0.017737388610839844, 0.018966197967529297, 0.02019500732421875, 0.021423816680908203, 0.022652626037597656, 0.02388143539428711, 0.025110244750976562, 0.026339054107666016, 0.02756786346435547, 0.028796672821044922, 0.030025482177734375, 0.03125429153442383, 0.03248310089111328, 0.033711910247802734, 0.03494071960449219, 0.03616952896118164, 0.037398338317871094, 0.03862714767456055, 0.03985595703125]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 65.0, 662.0, 278.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0074579487554728985, -0.007230037357658148, -0.007002125959843397, -0.0067742145620286465, -0.006546303164213896, -0.006318391766399145, -0.006090480834245682, -0.005862569436430931, -0.00563465803861618, -0.00540674664080143, -0.005178835242986679, -0.004950923845171928, -0.004723012447357178, -0.004495101049542427, -0.004267189651727676, -0.004039278253912926, -0.003811366856098175, -0.0035834554582834244, -0.0033555440604686737, -0.003127632662653923, -0.0028997212648391724, -0.0026718098670244217, -0.0024438987020403147, -0.002215987304225564, -0.0019880759064108133, -0.0017601645085960627, -0.001532253110781312, -0.0013043418293818831, -0.0010764304315671325, -0.0008485190337523818, -0.000620607752352953, -0.0003926963545382023, -0.00016478542238473892, 6.312594632618129e-05, 0.0002910373150371015, 0.0005189486546441913, 0.0007468600524589419, 0.0009747714502736926, 0.0012026827316731215, 0.0014305941294878721, 0.0016585055273026228, 0.0018864169251173735, 0.002114328322932124, 0.002342239487916231, 0.002570150885730982, 0.0027980622835457325, 0.003025973681360483, 0.003253885079175234, 0.0034817964769899845, 0.003709707874804735, 0.003937619272619486, 0.0041655306704342365, 0.004393442068248987, 0.004621353466063738, 0.004849264398217201, 0.005077175796031952, 0.005305087193846703, 0.005532998591661453, 0.005760909989476204, 0.005988821387290955, 0.006216732785105705, 0.006444644182920456, 0.006672555580735207, 0.006900466978549957, 0.007128378376364708]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 6.0, 2.0, 10.0, 5.0, 16.0, 12.0, 16.0, 20.0, 24.0, 24.0, 29.0, 34.0, 34.0, 48.0, 45.0, 46.0, 53.0, 45.0, 43.0, 40.0, 47.0, 44.0, 45.0, 48.0, 34.0, 37.0, 34.0, 36.0, 23.0, 14.0, 23.0, 17.0, 13.0, 8.0, 7.0, 5.0, 6.0, 7.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0012417435646057129, -0.001206129789352417, -0.001170516014099121, -0.0011349022388458252, -0.0010992884635925293, -0.0010636746883392334, -0.0010280609130859375, -0.0009924471378326416, -0.0009568333625793457, -0.0009212195873260498, -0.0008856058120727539, -0.000849992036819458, -0.0008143782615661621, -0.0007787644863128662, -0.0007431507110595703, -0.0007075369358062744, -0.0006719231605529785, -0.0006363093852996826, -0.0006006956100463867, -0.0005650818347930908, -0.0005294680595397949, -0.000493854284286499, -0.0004582405090332031, -0.0004226267337799072, -0.00038701295852661133, -0.00035139918327331543, -0.00031578540802001953, -0.00028017163276672363, -0.00024455785751342773, -0.00020894408226013184, -0.00017333030700683594, -0.00013771653175354004, -0.00010210275650024414, -6.648898124694824e-05, -3.0875205993652344e-05, 4.738569259643555e-06, 4.035234451293945e-05, 7.596611976623535e-05, 0.00011157989501953125, 0.00014719367027282715, 0.00018280744552612305, 0.00021842122077941895, 0.00025403499603271484, 0.00028964877128601074, 0.00032526254653930664, 0.00036087632179260254, 0.00039649009704589844, 0.00043210387229919434, 0.00046771764755249023, 0.0005033314228057861, 0.000538945198059082, 0.0005745589733123779, 0.0006101727485656738, 0.0006457865238189697, 0.0006814002990722656, 0.0007170140743255615, 0.0007526278495788574, 0.0007882416248321533, 0.0008238554000854492, 0.0008594691753387451, 0.000895082950592041, 0.0009306967258453369, 0.0009663105010986328, 0.0010019242763519287, 0.0010375380516052246]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 7.0, 3.0, 4.0, 6.0, 5.0, 10.0, 12.0, 17.0, 12.0, 13.0, 23.0, 24.0, 29.0, 38.0, 33.0, 43.0, 47.0, 44.0, 48.0, 44.0, 43.0, 34.0, 41.0, 39.0, 46.0, 44.0, 34.0, 39.0, 29.0, 41.0, 26.0, 21.0, 28.0, 15.0, 13.0, 13.0, 10.0, 10.0, 10.0, 8.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7265625, -7.43310546875, -7.1396484375, -6.84619140625, -6.552734375, -6.25927734375, -5.9658203125, -5.67236328125, -5.37890625, -5.08544921875, -4.7919921875, -4.49853515625, -4.205078125, -3.91162109375, -3.6181640625, -3.32470703125, -3.03125, -2.73779296875, -2.4443359375, -2.15087890625, -1.857421875, -1.56396484375, -1.2705078125, -0.97705078125, -0.68359375, -0.39013671875, -0.0966796875, 0.19677734375, 0.490234375, 0.78369140625, 1.0771484375, 1.37060546875, 1.6640625, 1.95751953125, 2.2509765625, 2.54443359375, 2.837890625, 3.13134765625, 3.4248046875, 3.71826171875, 4.01171875, 4.30517578125, 4.5986328125, 4.89208984375, 5.185546875, 5.47900390625, 5.7724609375, 6.06591796875, 6.359375, 6.65283203125, 6.9462890625, 7.23974609375, 7.533203125, 7.82666015625, 8.1201171875, 8.41357421875, 8.70703125, 9.00048828125, 9.2939453125, 9.58740234375, 9.880859375, 10.17431640625, 10.4677734375, 10.76123046875, 11.0546875]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 5.0, 6.0, 13.0, 17.0, 34.0, 36.0, 67.0, 78.0, 101.0, 188.0, 270.0, 467.0, 664.0, 1045.0, 1604.0, 2959.0, 6359.0, 23034.0, 272233.0, 668350.0, 52175.0, 9500.0, 3847.0, 2021.0, 1236.0, 743.0, 532.0, 307.0, 211.0, 139.0, 110.0, 67.0, 39.0, 38.0, 24.0, 5.0, 4.0, 7.0, 10.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-28.5, -27.690185546875, -26.88037109375, -26.070556640625, -25.2607421875, -24.450927734375, -23.64111328125, -22.831298828125, -22.021484375, -21.211669921875, -20.40185546875, -19.592041015625, -18.7822265625, -17.972412109375, -17.16259765625, -16.352783203125, -15.54296875, -14.733154296875, -13.92333984375, -13.113525390625, -12.3037109375, -11.493896484375, -10.68408203125, -9.874267578125, -9.064453125, -8.254638671875, -7.44482421875, -6.635009765625, -5.8251953125, -5.015380859375, -4.20556640625, -3.395751953125, -2.5859375, -1.776123046875, -0.96630859375, -0.156494140625, 0.6533203125, 1.463134765625, 2.27294921875, 3.082763671875, 3.892578125, 4.702392578125, 5.51220703125, 6.322021484375, 7.1318359375, 7.941650390625, 8.75146484375, 9.561279296875, 10.37109375, 11.180908203125, 11.99072265625, 12.800537109375, 13.6103515625, 14.420166015625, 15.22998046875, 16.039794921875, 16.849609375, 17.659423828125, 18.46923828125, 19.279052734375, 20.0888671875, 20.898681640625, 21.70849609375, 22.518310546875, 23.328125]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 9.0, 11.0, 10.0, 7.0, 10.0, 13.0, 10.0, 13.0, 18.0, 28.0, 26.0, 23.0, 40.0, 60.0, 42.0, 61.0, 87.0, 182.0, 1649.0, 286.0, 94.0, 66.0, 47.0, 50.0, 38.0, 28.0, 37.0, 19.0, 25.0, 14.0, 15.0, 7.0, 5.0, 5.0, 6.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.109375, -24.26318359375, -23.4169921875, -22.57080078125, -21.724609375, -20.87841796875, -20.0322265625, -19.18603515625, -18.33984375, -17.49365234375, -16.6474609375, -15.80126953125, -14.955078125, -14.10888671875, -13.2626953125, -12.41650390625, -11.5703125, -10.72412109375, -9.8779296875, -9.03173828125, -8.185546875, -7.33935546875, -6.4931640625, -5.64697265625, -4.80078125, -3.95458984375, -3.1083984375, -2.26220703125, -1.416015625, -0.56982421875, 0.2763671875, 1.12255859375, 1.96875, 2.81494140625, 3.6611328125, 4.50732421875, 5.353515625, 6.19970703125, 7.0458984375, 7.89208984375, 8.73828125, 9.58447265625, 10.4306640625, 11.27685546875, 12.123046875, 12.96923828125, 13.8154296875, 14.66162109375, 15.5078125, 16.35400390625, 17.2001953125, 18.04638671875, 18.892578125, 19.73876953125, 20.5849609375, 21.43115234375, 22.27734375, 23.12353515625, 23.9697265625, 24.81591796875, 25.662109375, 26.50830078125, 27.3544921875, 28.20068359375, 29.046875]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 2.0, 5.0, 8.0, 11.0, 18.0, 26.0, 30.0, 46.0, 74.0, 93.0, 124.0, 231.0, 359.0, 737.0, 3243.0, 3096460.0, 41438.0, 1393.0, 505.0, 266.0, 191.0, 102.0, 83.0, 75.0, 49.0, 21.0, 32.0, 14.0, 23.0, 9.0, 4.0, 10.0, 6.0, 3.0, 7.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.4375, -94.6337890625, -91.830078125, -89.0263671875, -86.22265625, -83.4189453125, -80.615234375, -77.8115234375, -75.0078125, -72.2041015625, -69.400390625, -66.5966796875, -63.79296875, -60.9892578125, -58.185546875, -55.3818359375, -52.578125, -49.7744140625, -46.970703125, -44.1669921875, -41.36328125, -38.5595703125, -35.755859375, -32.9521484375, -30.1484375, -27.3447265625, -24.541015625, -21.7373046875, -18.93359375, -16.1298828125, -13.326171875, -10.5224609375, -7.71875, -4.9150390625, -2.111328125, 0.6923828125, 3.49609375, 6.2998046875, 9.103515625, 11.9072265625, 14.7109375, 17.5146484375, 20.318359375, 23.1220703125, 25.92578125, 28.7294921875, 31.533203125, 34.3369140625, 37.140625, 39.9443359375, 42.748046875, 45.5517578125, 48.35546875, 51.1591796875, 53.962890625, 56.7666015625, 59.5703125, 62.3740234375, 65.177734375, 67.9814453125, 70.78515625, 73.5888671875, 76.392578125, 79.1962890625, 82.0]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 12.0, 121.0, 427.0, 351.0, 87.0, 10.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-236.39105224609375, -230.99803161621094, -225.60501098632812, -220.21197509765625, -214.81895446777344, -209.42593383789062, -204.0329132080078, -198.639892578125, -193.24685668945312, -187.8538360595703, -182.4608154296875, -177.06777954101562, -171.6747589111328, -166.28173828125, -160.8887176513672, -155.49569702148438, -150.1026611328125, -144.7096405029297, -139.31661987304688, -133.923583984375, -128.5305633544922, -123.13754272460938, -117.74452209472656, -112.35149383544922, -106.95848083496094, -101.56546020507812, -96.17243194580078, -90.77941131591797, -85.38638305664062, -79.99336242675781, -74.600341796875, -69.20731353759766, -63.814292907714844, -58.421268463134766, -53.02824401855469, -47.635223388671875, -42.24219512939453, -36.84917449951172, -31.45615005493164, -26.063125610351562, -20.670101165771484, -15.277076721191406, -9.884053230285645, -4.491029739379883, 0.9019947052001953, 6.295019149780273, 11.688041687011719, 17.081066131591797, 22.474090576171875, 27.867115020751953, 33.26013946533203, 38.653160095214844, 44.04618835449219, 49.439208984375, 54.83223342895508, 60.225257873535156, 65.6182861328125, 71.01130676269531, 76.40433502197266, 81.79735565185547, 87.19038391113281, 92.58340454101562, 97.97642517089844, 103.36945343017578, 108.7624740600586]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 4.0, 4.0, 8.0, 4.0, 7.0, 12.0, 14.0, 20.0, 19.0, 17.0, 34.0, 33.0, 30.0, 37.0, 35.0, 47.0, 43.0, 48.0, 33.0, 38.0, 52.0, 30.0, 41.0, 31.0, 37.0, 32.0, 39.0, 33.0, 20.0, 33.0, 25.0, 17.0, 17.0, 29.0, 21.0, 12.0, 14.0, 10.0, 4.0, 7.0, 3.0, 7.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-67.76932525634766, -65.67735290527344, -63.58538055419922, -61.493412017822266, -59.40143966674805, -57.30946731567383, -55.217498779296875, -53.125526428222656, -51.03355407714844, -48.94158172607422, -46.849609375, -44.75764083862305, -42.66566848754883, -40.57369613647461, -38.481727600097656, -36.38975524902344, -34.29778289794922, -32.205810546875, -30.113840103149414, -28.021869659423828, -25.92989730834961, -23.83792495727539, -21.745954513549805, -19.65398406982422, -17.56201171875, -15.470040321350098, -13.378068923950195, -11.286097526550293, -9.19412612915039, -7.102154731750488, -5.010183334350586, -2.9182119369506836, -0.8262481689453125, 1.2657232284545898, 3.357694625854492, 5.4496660232543945, 7.541637420654297, 9.6336088180542, 11.725580215454102, 13.817551612854004, 15.909523010253906, 18.001495361328125, 20.09346580505371, 22.185436248779297, 24.277408599853516, 26.369380950927734, 28.46135139465332, 30.553321838378906, 32.645294189453125, 34.737266540527344, 36.82923889160156, 38.921207427978516, 41.013179779052734, 43.10515213012695, 45.197120666503906, 47.289093017578125, 49.381065368652344, 51.47303771972656, 53.56501007080078, 55.656978607177734, 57.74895095825195, 59.84092330932617, 61.932891845703125, 64.02486419677734, 66.11683654785156]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 1.0, 5.0, 1.0, 5.0, 9.0, 4.0, 7.0, 8.0, 11.0, 7.0, 8.0, 11.0, 20.0, 29.0, 22.0, 25.0, 35.0, 31.0, 36.0, 55.0, 40.0, 42.0, 52.0, 40.0, 40.0, 34.0, 41.0, 43.0, 43.0, 32.0, 25.0, 41.0, 27.0, 28.0, 30.0, 24.0, 13.0, 17.0, 17.0, 10.0, 10.0, 3.0, 8.0, 5.0, 6.0, 1.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.109375, -7.823486328125, -7.53759765625, -7.251708984375, -6.9658203125, -6.679931640625, -6.39404296875, -6.108154296875, -5.822265625, -5.536376953125, -5.25048828125, -4.964599609375, -4.6787109375, -4.392822265625, -4.10693359375, -3.821044921875, -3.53515625, -3.249267578125, -2.96337890625, -2.677490234375, -2.3916015625, -2.105712890625, -1.81982421875, -1.533935546875, -1.248046875, -0.962158203125, -0.67626953125, -0.390380859375, -0.1044921875, 0.181396484375, 0.46728515625, 0.753173828125, 1.0390625, 1.324951171875, 1.61083984375, 1.896728515625, 2.1826171875, 2.468505859375, 2.75439453125, 3.040283203125, 3.326171875, 3.612060546875, 3.89794921875, 4.183837890625, 4.4697265625, 4.755615234375, 5.04150390625, 5.327392578125, 5.61328125, 5.899169921875, 6.18505859375, 6.470947265625, 6.7568359375, 7.042724609375, 7.32861328125, 7.614501953125, 7.900390625, 8.186279296875, 8.47216796875, 8.758056640625, 9.0439453125, 9.329833984375, 9.61572265625, 9.901611328125, 10.1875]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 1.0, 6.0, 8.0, 14.0, 15.0, 21.0, 31.0, 43.0, 62.0, 74.0, 115.0, 152.0, 240.0, 373.0, 604.0, 1120.0, 2107.0, 4673.0, 15259.0, 117386.0, 1514459.0, 2284952.0, 220308.0, 20818.0, 5599.0, 2583.0, 1252.0, 752.0, 441.0, 276.0, 158.0, 104.0, 86.0, 61.0, 31.0, 28.0, 20.0, 15.0, 12.0, 14.0, 6.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.8984375, -15.2655029296875, -14.632568359375, -13.9996337890625, -13.36669921875, -12.7337646484375, -12.100830078125, -11.4678955078125, -10.8349609375, -10.2020263671875, -9.569091796875, -8.9361572265625, -8.30322265625, -7.6702880859375, -7.037353515625, -6.4044189453125, -5.771484375, -5.1385498046875, -4.505615234375, -3.8726806640625, -3.23974609375, -2.6068115234375, -1.973876953125, -1.3409423828125, -0.7080078125, -0.0750732421875, 0.557861328125, 1.1907958984375, 1.82373046875, 2.4566650390625, 3.089599609375, 3.7225341796875, 4.35546875, 4.9884033203125, 5.621337890625, 6.2542724609375, 6.88720703125, 7.5201416015625, 8.153076171875, 8.7860107421875, 9.4189453125, 10.0518798828125, 10.684814453125, 11.3177490234375, 11.95068359375, 12.5836181640625, 13.216552734375, 13.8494873046875, 14.482421875, 15.1153564453125, 15.748291015625, 16.3812255859375, 17.01416015625, 17.6470947265625, 18.280029296875, 18.9129638671875, 19.5458984375, 20.1788330078125, 20.811767578125, 21.4447021484375, 22.07763671875, 22.7105712890625, 23.343505859375, 23.9764404296875, 24.609375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 7.0, 2.0, 6.0, 21.0, 31.0, 44.0, 85.0, 196.0, 322.0, 631.0, 1025.0, 785.0, 406.0, 253.0, 125.0, 68.0, 27.0, 24.0, 11.0, 6.0, 2.0, 0.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.234375, -23.251220703125, -22.26806640625, -21.284912109375, -20.3017578125, -19.318603515625, -18.33544921875, -17.352294921875, -16.369140625, -15.385986328125, -14.40283203125, -13.419677734375, -12.4365234375, -11.453369140625, -10.47021484375, -9.487060546875, -8.50390625, -7.520751953125, -6.53759765625, -5.554443359375, -4.5712890625, -3.588134765625, -2.60498046875, -1.621826171875, -0.638671875, 0.344482421875, 1.32763671875, 2.310791015625, 3.2939453125, 4.277099609375, 5.26025390625, 6.243408203125, 7.2265625, 8.209716796875, 9.19287109375, 10.176025390625, 11.1591796875, 12.142333984375, 13.12548828125, 14.108642578125, 15.091796875, 16.074951171875, 17.05810546875, 18.041259765625, 19.0244140625, 20.007568359375, 20.99072265625, 21.973876953125, 22.95703125, 23.940185546875, 24.92333984375, 25.906494140625, 26.8896484375, 27.872802734375, 28.85595703125, 29.839111328125, 30.822265625, 31.805419921875, 32.78857421875, 33.771728515625, 34.7548828125, 35.738037109375, 36.72119140625, 37.704345703125, 38.6875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 8.0, 5.0, 11.0, 24.0, 23.0, 36.0, 85.0, 127.0, 262.0, 542.0, 1339.0, 5606.0, 3060638.0, 1118962.0, 4474.0, 1164.0, 477.0, 214.0, 114.0, 69.0, 39.0, 21.0, 8.0, 14.0, 7.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-73.5625, -71.5712890625, -69.580078125, -67.5888671875, -65.59765625, -63.6064453125, -61.615234375, -59.6240234375, -57.6328125, -55.6416015625, -53.650390625, -51.6591796875, -49.66796875, -47.6767578125, -45.685546875, -43.6943359375, -41.703125, -39.7119140625, -37.720703125, -35.7294921875, -33.73828125, -31.7470703125, -29.755859375, -27.7646484375, -25.7734375, -23.7822265625, -21.791015625, -19.7998046875, -17.80859375, -15.8173828125, -13.826171875, -11.8349609375, -9.84375, -7.8525390625, -5.861328125, -3.8701171875, -1.87890625, 0.1123046875, 2.103515625, 4.0947265625, 6.0859375, 8.0771484375, 10.068359375, 12.0595703125, 14.05078125, 16.0419921875, 18.033203125, 20.0244140625, 22.015625, 24.0068359375, 25.998046875, 27.9892578125, 29.98046875, 31.9716796875, 33.962890625, 35.9541015625, 37.9453125, 39.9365234375, 41.927734375, 43.9189453125, 45.91015625, 47.9013671875, 49.892578125, 51.8837890625, 53.875]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 36.0, 297.0, 503.0, 163.0, 14.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-347.0843505859375, -339.4287109375, -331.7730407714844, -324.1174011230469, -316.4617614746094, -308.80609130859375, -301.15045166015625, -293.49481201171875, -285.83917236328125, -278.18353271484375, -270.5278625488281, -262.8722229003906, -255.21658325195312, -247.56092834472656, -239.9052734375, -232.2496337890625, -224.59396362304688, -216.9383087158203, -209.2826690673828, -201.62701416015625, -193.97137451171875, -186.3157196044922, -178.66006469726562, -171.00442504882812, -163.34878540039062, -155.69313049316406, -148.03749084472656, -140.3818359375, -132.7261962890625, -125.07054138183594, -117.4148941040039, -109.75924682617188, -102.10359191894531, -94.44794464111328, -86.79229736328125, -79.13664245605469, -71.48099517822266, -63.825347900390625, -56.169700622558594, -48.5140495300293, -40.858402252197266, -33.202754974365234, -25.547103881835938, -17.891456604003906, -10.235807418823242, -2.580158233642578, 5.075489044189453, 12.73114013671875, 20.38678741455078, 28.042436599731445, 35.69808578491211, 43.35373306274414, 51.00938415527344, 58.66503143310547, 66.3206787109375, 73.97633361816406, 81.63197326660156, 89.2876205444336, 96.94326782226562, 104.59892272949219, 112.25457000732422, 119.91021728515625, 127.56586456298828, 135.2215118408203, 142.87716674804688]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 2.0, 6.0, 13.0, 11.0, 16.0, 24.0, 32.0, 36.0, 42.0, 42.0, 54.0, 59.0, 55.0, 55.0, 45.0, 62.0, 58.0, 54.0, 43.0, 33.0, 48.0, 36.0, 43.0, 26.0, 30.0, 17.0, 13.0, 17.0, 4.0, 8.0, 4.0, 6.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.59625244140625, -82.1253890991211, -79.6545181274414, -77.18365478515625, -74.7127914428711, -72.24192810058594, -69.77105712890625, -67.3001937866211, -64.82933044433594, -62.358463287353516, -59.88759994506836, -57.41673278808594, -54.94586944580078, -52.47500228881836, -50.00413513183594, -47.53327178955078, -45.062400817871094, -42.59153366088867, -40.120670318603516, -37.649803161621094, -35.17893981933594, -32.708072662353516, -30.237205505371094, -27.766340255737305, -25.295475006103516, -22.824609756469727, -20.353744506835938, -17.882877349853516, -15.412012100219727, -12.941146850585938, -10.470280647277832, -7.999414443969727, -5.5285491943359375, -3.0576834678649902, -0.586817741394043, 1.8840479850769043, 4.354913711547852, 6.825778961181641, 9.296645164489746, 11.767511367797852, 14.23837661743164, 16.70924186706543, 19.18010711669922, 21.65097427368164, 24.12183952331543, 26.59270477294922, 29.06357192993164, 31.53443717956543, 34.00530242919922, 36.47616958618164, 38.9470329284668, 41.41790008544922, 43.888763427734375, 46.3596305847168, 48.83049774169922, 51.301361083984375, 53.7722282409668, 56.24309539794922, 58.713958740234375, 61.1848258972168, 63.65569305419922, 66.12655639648438, 68.59741973876953, 71.06829071044922, 73.53915405273438]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 6.0, 1.0, 1.0, 3.0, 1.0, 7.0, 3.0, 10.0, 11.0, 13.0, 12.0, 13.0, 18.0, 23.0, 31.0, 26.0, 27.0, 29.0, 39.0, 41.0, 46.0, 45.0, 42.0, 54.0, 39.0, 33.0, 45.0, 41.0, 33.0, 38.0, 32.0, 41.0, 30.0, 36.0, 17.0, 27.0, 24.0, 9.0, 15.0, 13.0, 10.0, 8.0, 8.0, 3.0, 2.0, 2.0, 7.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.140625, -5.90966796875, -5.6787109375, -5.44775390625, -5.216796875, -4.98583984375, -4.7548828125, -4.52392578125, -4.29296875, -4.06201171875, -3.8310546875, -3.60009765625, -3.369140625, -3.13818359375, -2.9072265625, -2.67626953125, -2.4453125, -2.21435546875, -1.9833984375, -1.75244140625, -1.521484375, -1.29052734375, -1.0595703125, -0.82861328125, -0.59765625, -0.36669921875, -0.1357421875, 0.09521484375, 0.326171875, 0.55712890625, 0.7880859375, 1.01904296875, 1.25, 1.48095703125, 1.7119140625, 1.94287109375, 2.173828125, 2.40478515625, 2.6357421875, 2.86669921875, 3.09765625, 3.32861328125, 3.5595703125, 3.79052734375, 4.021484375, 4.25244140625, 4.4833984375, 4.71435546875, 4.9453125, 5.17626953125, 5.4072265625, 5.63818359375, 5.869140625, 6.10009765625, 6.3310546875, 6.56201171875, 6.79296875, 7.02392578125, 7.2548828125, 7.48583984375, 7.716796875, 7.94775390625, 8.1787109375, 8.40966796875, 8.640625]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 7.0, 17.0, 18.0, 13.0, 35.0, 44.0, 72.0, 115.0, 168.0, 277.0, 413.0, 562.0, 780.0, 1273.0, 1906.0, 2814.0, 4227.0, 6276.0, 9613.0, 14867.0, 22425.0, 35802.0, 57045.0, 93449.0, 151441.0, 215842.0, 160862.0, 98987.0, 61219.0, 38206.0, 24180.0, 15395.0, 10103.0, 6633.0, 4345.0, 2951.0, 2085.0, 1302.0, 923.0, 647.0, 398.0, 258.0, 205.0, 120.0, 84.0, 62.0, 34.0, 20.0, 22.0, 10.0, 1.0, 3.0, 0.0, 5.0, 1.0, 0.0, 3.0], "bins": [-0.98291015625, -0.952728271484375, -0.92254638671875, -0.892364501953125, -0.8621826171875, -0.832000732421875, -0.80181884765625, -0.771636962890625, -0.741455078125, -0.711273193359375, -0.68109130859375, -0.650909423828125, -0.6207275390625, -0.590545654296875, -0.56036376953125, -0.530181884765625, -0.5, -0.469818115234375, -0.43963623046875, -0.409454345703125, -0.3792724609375, -0.349090576171875, -0.31890869140625, -0.288726806640625, -0.258544921875, -0.228363037109375, -0.19818115234375, -0.167999267578125, -0.1378173828125, -0.107635498046875, -0.07745361328125, -0.047271728515625, -0.01708984375, 0.013092041015625, 0.04327392578125, 0.073455810546875, 0.1036376953125, 0.133819580078125, 0.16400146484375, 0.194183349609375, 0.224365234375, 0.254547119140625, 0.28472900390625, 0.314910888671875, 0.3450927734375, 0.375274658203125, 0.40545654296875, 0.435638427734375, 0.4658203125, 0.496002197265625, 0.52618408203125, 0.556365966796875, 0.5865478515625, 0.616729736328125, 0.64691162109375, 0.677093505859375, 0.707275390625, 0.737457275390625, 0.76763916015625, 0.797821044921875, 0.8280029296875, 0.858184814453125, 0.88836669921875, 0.918548583984375, 0.94873046875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 8.0, 7.0, 6.0, 8.0, 7.0, 9.0, 10.0, 12.0, 20.0, 21.0, 19.0, 28.0, 28.0, 27.0, 23.0, 43.0, 25.0, 28.0, 36.0, 39.0, 35.0, 41.0, 1057.0, 33.0, 40.0, 38.0, 40.0, 31.0, 29.0, 38.0, 35.0, 32.0, 24.0, 18.0, 16.0, 17.0, 20.0, 11.0, 12.0, 7.0, 9.0, 6.0, 9.0, 7.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-4.20703125, -4.0836181640625, -3.960205078125, -3.8367919921875, -3.71337890625, -3.5899658203125, -3.466552734375, -3.3431396484375, -3.2197265625, -3.0963134765625, -2.972900390625, -2.8494873046875, -2.72607421875, -2.6026611328125, -2.479248046875, -2.3558349609375, -2.232421875, -2.1090087890625, -1.985595703125, -1.8621826171875, -1.73876953125, -1.6153564453125, -1.491943359375, -1.3685302734375, -1.2451171875, -1.1217041015625, -0.998291015625, -0.8748779296875, -0.75146484375, -0.6280517578125, -0.504638671875, -0.3812255859375, -0.2578125, -0.1343994140625, -0.010986328125, 0.1124267578125, 0.23583984375, 0.3592529296875, 0.482666015625, 0.6060791015625, 0.7294921875, 0.8529052734375, 0.976318359375, 1.0997314453125, 1.22314453125, 1.3465576171875, 1.469970703125, 1.5933837890625, 1.716796875, 1.8402099609375, 1.963623046875, 2.0870361328125, 2.21044921875, 2.3338623046875, 2.457275390625, 2.5806884765625, 2.7041015625, 2.8275146484375, 2.950927734375, 3.0743408203125, 3.19775390625, 3.3211669921875, 3.444580078125, 3.5679931640625, 3.69140625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 6.0, 9.0, 21.0, 24.0, 43.0, 56.0, 96.0, 141.0, 204.0, 300.0, 426.0, 650.0, 871.0, 1375.0, 2031.0, 2990.0, 4499.0, 6493.0, 10018.0, 15036.0, 23051.0, 35432.0, 54516.0, 82779.0, 124564.0, 1224610.0, 168380.0, 115294.0, 76776.0, 50091.0, 32862.0, 21541.0, 14002.0, 9062.0, 6181.0, 4099.0, 2843.0, 1850.0, 1275.0, 858.0, 617.0, 352.0, 267.0, 177.0, 114.0, 81.0, 47.0, 41.0, 35.0, 19.0, 12.0, 6.0, 6.0, 3.0, 4.0, 1.0], "bins": [-0.88134765625, -0.8553543090820312, -0.8293609619140625, -0.8033676147460938, -0.777374267578125, -0.7513809204101562, -0.7253875732421875, -0.6993942260742188, -0.67340087890625, -0.6474075317382812, -0.6214141845703125, -0.5954208374023438, -0.569427490234375, -0.5434341430664062, -0.5174407958984375, -0.49144744873046875, -0.4654541015625, -0.43946075439453125, -0.4134674072265625, -0.38747406005859375, -0.361480712890625, -0.33548736572265625, -0.3094940185546875, -0.28350067138671875, -0.25750732421875, -0.23151397705078125, -0.2055206298828125, -0.17952728271484375, -0.153533935546875, -0.12754058837890625, -0.1015472412109375, -0.07555389404296875, -0.049560546875, -0.02356719970703125, 0.0024261474609375, 0.02841949462890625, 0.054412841796875, 0.08040618896484375, 0.1063995361328125, 0.13239288330078125, 0.15838623046875, 0.18437957763671875, 0.2103729248046875, 0.23636627197265625, 0.262359619140625, 0.28835296630859375, 0.3143463134765625, 0.34033966064453125, 0.3663330078125, 0.39232635498046875, 0.4183197021484375, 0.44431304931640625, 0.470306396484375, 0.49629974365234375, 0.5222930908203125, 0.5482864379882812, 0.57427978515625, 0.6002731323242188, 0.6262664794921875, 0.6522598266601562, 0.678253173828125, 0.7042465209960938, 0.7302398681640625, 0.7562332153320312, 0.7822265625]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 4.0, 5.0, 4.0, 6.0, 6.0, 11.0, 13.0, 24.0, 35.0, 42.0, 33.0, 49.0, 59.0, 56.0, 62.0, 78.0, 73.0, 68.0, 57.0, 54.0, 52.0, 38.0, 31.0, 26.0, 25.0, 16.0, 16.0, 10.0, 16.0, 4.0, 6.0, 2.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0017948150634765625, -0.0017390847206115723, -0.001683354377746582, -0.0016276240348815918, -0.0015718936920166016, -0.0015161633491516113, -0.001460433006286621, -0.0014047026634216309, -0.0013489723205566406, -0.0012932419776916504, -0.0012375116348266602, -0.00118178129196167, -0.0011260509490966797, -0.0010703206062316895, -0.0010145902633666992, -0.000958859920501709, -0.0009031295776367188, -0.0008473992347717285, -0.0007916688919067383, -0.000735938549041748, -0.0006802082061767578, -0.0006244778633117676, -0.0005687475204467773, -0.0005130171775817871, -0.0004572868347167969, -0.00040155649185180664, -0.0003458261489868164, -0.00029009580612182617, -0.00023436546325683594, -0.0001786351203918457, -0.00012290477752685547, -6.717443466186523e-05, -1.1444091796875e-05, 4.4286251068115234e-05, 0.00010001659393310547, 0.0001557469367980957, 0.00021147727966308594, 0.00026720762252807617, 0.0003229379653930664, 0.00037866830825805664, 0.0004343986511230469, 0.0004901289939880371, 0.0005458593368530273, 0.0006015896797180176, 0.0006573200225830078, 0.000713050365447998, 0.0007687807083129883, 0.0008245110511779785, 0.0008802413940429688, 0.000935971736907959, 0.0009917020797729492, 0.0010474324226379395, 0.0011031627655029297, 0.00115889310836792, 0.0012146234512329102, 0.0012703537940979004, 0.0013260841369628906, 0.0013818144798278809, 0.001437544822692871, 0.0014932751655578613, 0.0015490055084228516, 0.0016047358512878418, 0.001660466194152832, 0.0017161965370178223, 0.0017719268798828125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 8.0, 6.0, 11.0, 7.0, 16.0, 18.0, 16.0, 26.0, 43.0, 62.0, 74.0, 72.0, 118.0, 148.0, 245.0, 343.0, 541.0, 1128.0, 151675.0, 890415.0, 1530.0, 667.0, 400.0, 266.0, 164.0, 118.0, 116.0, 65.0, 68.0, 36.0, 35.0, 15.0, 20.0, 17.0, 11.0, 8.0, 10.0, 9.0, 6.0, 7.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0], "bins": [-0.0292510986328125, -0.028340578079223633, -0.027430057525634766, -0.0265195369720459, -0.02560901641845703, -0.024698495864868164, -0.023787975311279297, -0.02287745475769043, -0.021966934204101562, -0.021056413650512695, -0.020145893096923828, -0.01923537254333496, -0.018324851989746094, -0.017414331436157227, -0.01650381088256836, -0.015593290328979492, -0.014682769775390625, -0.013772249221801758, -0.01286172866821289, -0.011951208114624023, -0.011040687561035156, -0.010130167007446289, -0.009219646453857422, -0.008309125900268555, -0.0073986053466796875, -0.00648808479309082, -0.005577564239501953, -0.004667043685913086, -0.0037565231323242188, -0.0028460025787353516, -0.0019354820251464844, -0.0010249614715576172, -0.00011444091796875, 0.0007960796356201172, 0.0017066001892089844, 0.0026171207427978516, 0.0035276412963867188, 0.004438161849975586, 0.005348682403564453, 0.00625920295715332, 0.0071697235107421875, 0.008080244064331055, 0.008990764617919922, 0.009901285171508789, 0.010811805725097656, 0.011722326278686523, 0.01263284683227539, 0.013543367385864258, 0.014453887939453125, 0.015364408493041992, 0.01627492904663086, 0.017185449600219727, 0.018095970153808594, 0.01900649070739746, 0.019917011260986328, 0.020827531814575195, 0.021738052368164062, 0.02264857292175293, 0.023559093475341797, 0.024469614028930664, 0.02538013458251953, 0.0262906551361084, 0.027201175689697266, 0.028111696243286133, 0.029022216796875]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 22.0, 310.0, 585.0, 92.0, 6.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.00799393281340599, -0.007854266092181206, -0.0077146003022789955, -0.007574933581054211, -0.007435267325490713, -0.007295601069927216, -0.007155934814363718, -0.0070162685588002205, -0.006876601837575436, -0.006736935582011938, -0.0065972693264484406, -0.006457602605223656, -0.006317936349660158, -0.006178270094096661, -0.006038603838533163, -0.0058989375829696655, -0.005759270861744881, -0.005619604606181383, -0.005479938350617886, -0.005340271629393101, -0.005200605373829603, -0.005060939118266106, -0.004921272862702608, -0.0047816066071391106, -0.004641940351575613, -0.0045022740960121155, -0.004362607840448618, -0.004222941119223833, -0.0040832748636603355, -0.003943608608096838, -0.0038039423525333405, -0.0036642758641391993, -0.003524609375745058, -0.0033849431201815605, -0.0032452766317874193, -0.0031056103762239218, -0.0029659438878297806, -0.002826277632266283, -0.0026866113767027855, -0.0025469448883086443, -0.002407278399914503, -0.0022676121443510056, -0.0021279456559568644, -0.001988279400393367, -0.0018486129119992256, -0.001708946656435728, -0.0015692802844569087, -0.0014296139124780893, -0.0012899476569145918, -0.0011502812849357724, -0.001010614912956953, -0.0008709485991857946, -0.0007312822272069752, -0.0005916158552281559, -0.0004519495414569974, -0.000312283169478178, -0.00017261679749935865, -3.295044007245451e-05, 0.00010671591735444963, 0.00024638226022943854, 0.0003860486322082579, 0.0005257150041870773, 0.0006653813179582357, 0.0008050476899370551, 0.0009447140619158745]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 7.0, 3.0, 4.0, 11.0, 9.0, 10.0, 19.0, 19.0, 17.0, 18.0, 35.0, 39.0, 36.0, 36.0, 35.0, 38.0, 45.0, 51.0, 47.0, 49.0, 50.0, 41.0, 45.0, 47.0, 44.0, 37.0, 30.0, 21.0, 32.0, 25.0, 16.0, 12.0, 8.0, 15.0, 15.0, 9.0, 5.0, 9.0, 3.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0008946657180786133, -0.0008666180074214935, -0.0008385702967643738, -0.000810522586107254, -0.0007824748754501343, -0.0007544271647930145, -0.0007263794541358948, -0.000698331743478775, -0.0006702840328216553, -0.0006422363221645355, -0.0006141886115074158, -0.000586140900850296, -0.0005580931901931763, -0.0005300454795360565, -0.0005019977688789368, -0.000473950058221817, -0.00044590234756469727, -0.0004178546369075775, -0.00038980692625045776, -0.000361759215593338, -0.00033371150493621826, -0.0003056637942790985, -0.00027761608362197876, -0.000249568372964859, -0.00022152066230773926, -0.0001934729516506195, -0.00016542524099349976, -0.00013737753033638, -0.00010932981967926025, -8.12821090221405e-05, -5.323439836502075e-05, -2.5186687707901e-05, 2.86102294921875e-06, 3.09087336063385e-05, 5.895644426345825e-05, 8.7004154920578e-05, 0.00011505186557769775, 0.0001430995762348175, 0.00017114728689193726, 0.000199194997549057, 0.00022724270820617676, 0.0002552904188632965, 0.00028333812952041626, 0.000311385840177536, 0.00033943355083465576, 0.0003674812614917755, 0.00039552897214889526, 0.000423576682806015, 0.00045162439346313477, 0.0004796721041202545, 0.0005077198147773743, 0.000535767525434494, 0.0005638152360916138, 0.0005918629467487335, 0.0006199106574058533, 0.000647958368062973, 0.0006760060787200928, 0.0007040537893772125, 0.0007321015000343323, 0.000760149210691452, 0.0007881969213485718, 0.0008162446320056915, 0.0008442923426628113, 0.000872340053319931, 0.0009003877639770508]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 6.0, 1.0, 1.0, 3.0, 1.0, 7.0, 3.0, 10.0, 11.0, 13.0, 12.0, 13.0, 18.0, 23.0, 31.0, 26.0, 27.0, 29.0, 39.0, 41.0, 46.0, 45.0, 42.0, 54.0, 39.0, 33.0, 45.0, 41.0, 33.0, 38.0, 32.0, 41.0, 30.0, 37.0, 16.0, 27.0, 24.0, 9.0, 15.0, 13.0, 10.0, 8.0, 8.0, 3.0, 2.0, 2.0, 7.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.140625, -5.90966796875, -5.6787109375, -5.44775390625, -5.216796875, -4.98583984375, -4.7548828125, -4.52392578125, -4.29296875, -4.06201171875, -3.8310546875, -3.60009765625, -3.369140625, -3.13818359375, -2.9072265625, -2.67626953125, -2.4453125, -2.21435546875, -1.9833984375, -1.75244140625, -1.521484375, -1.29052734375, -1.0595703125, -0.82861328125, -0.59765625, -0.36669921875, -0.1357421875, 0.09521484375, 0.326171875, 0.55712890625, 0.7880859375, 1.01904296875, 1.25, 1.48095703125, 1.7119140625, 1.94287109375, 2.173828125, 2.40478515625, 2.6357421875, 2.86669921875, 3.09765625, 3.32861328125, 3.5595703125, 3.79052734375, 4.021484375, 4.25244140625, 4.4833984375, 4.71435546875, 4.9453125, 5.17626953125, 5.4072265625, 5.63818359375, 5.869140625, 6.10009765625, 6.3310546875, 6.56201171875, 6.79296875, 7.02392578125, 7.2548828125, 7.48583984375, 7.716796875, 7.94775390625, 8.1787109375, 8.40966796875, 8.640625]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 5.0, 8.0, 7.0, 4.0, 10.0, 17.0, 15.0, 23.0, 33.0, 44.0, 59.0, 94.0, 116.0, 180.0, 241.0, 381.0, 553.0, 946.0, 1644.0, 3580.0, 8637.0, 28345.0, 134399.0, 628501.0, 185726.0, 35539.0, 10532.0, 4121.0, 1875.0, 1057.0, 601.0, 388.0, 256.0, 165.0, 130.0, 86.0, 64.0, 52.0, 27.0, 33.0, 14.0, 9.0, 8.0, 13.0, 5.0, 2.0, 7.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.9296875, -10.5185546875, -10.107421875, -9.6962890625, -9.28515625, -8.8740234375, -8.462890625, -8.0517578125, -7.640625, -7.2294921875, -6.818359375, -6.4072265625, -5.99609375, -5.5849609375, -5.173828125, -4.7626953125, -4.3515625, -3.9404296875, -3.529296875, -3.1181640625, -2.70703125, -2.2958984375, -1.884765625, -1.4736328125, -1.0625, -0.6513671875, -0.240234375, 0.1708984375, 0.58203125, 0.9931640625, 1.404296875, 1.8154296875, 2.2265625, 2.6376953125, 3.048828125, 3.4599609375, 3.87109375, 4.2822265625, 4.693359375, 5.1044921875, 5.515625, 5.9267578125, 6.337890625, 6.7490234375, 7.16015625, 7.5712890625, 7.982421875, 8.3935546875, 8.8046875, 9.2158203125, 9.626953125, 10.0380859375, 10.44921875, 10.8603515625, 11.271484375, 11.6826171875, 12.09375, 12.5048828125, 12.916015625, 13.3271484375, 13.73828125, 14.1494140625, 14.560546875, 14.9716796875, 15.3828125]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 3.0, 5.0, 2.0, 9.0, 10.0, 8.0, 11.0, 20.0, 14.0, 21.0, 34.0, 39.0, 29.0, 56.0, 52.0, 46.0, 78.0, 184.0, 1732.0, 251.0, 81.0, 33.0, 52.0, 44.0, 43.0, 30.0, 31.0, 20.0, 21.0, 20.0, 17.0, 10.0, 7.0, 10.0, 4.0, 6.0, 6.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-21.6875, -21.060302734375, -20.43310546875, -19.805908203125, -19.1787109375, -18.551513671875, -17.92431640625, -17.297119140625, -16.669921875, -16.042724609375, -15.41552734375, -14.788330078125, -14.1611328125, -13.533935546875, -12.90673828125, -12.279541015625, -11.65234375, -11.025146484375, -10.39794921875, -9.770751953125, -9.1435546875, -8.516357421875, -7.88916015625, -7.261962890625, -6.634765625, -6.007568359375, -5.38037109375, -4.753173828125, -4.1259765625, -3.498779296875, -2.87158203125, -2.244384765625, -1.6171875, -0.989990234375, -0.36279296875, 0.264404296875, 0.8916015625, 1.518798828125, 2.14599609375, 2.773193359375, 3.400390625, 4.027587890625, 4.65478515625, 5.281982421875, 5.9091796875, 6.536376953125, 7.16357421875, 7.790771484375, 8.41796875, 9.045166015625, 9.67236328125, 10.299560546875, 10.9267578125, 11.553955078125, 12.18115234375, 12.808349609375, 13.435546875, 14.062744140625, 14.68994140625, 15.317138671875, 15.9443359375, 16.571533203125, 17.19873046875, 17.825927734375, 18.453125]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 8.0, 3.0, 0.0, 6.0, 9.0, 10.0, 6.0, 14.0, 17.0, 19.0, 22.0, 38.0, 54.0, 84.0, 102.0, 193.0, 376.0, 796.0, 5138.0, 3129949.0, 6973.0, 870.0, 402.0, 221.0, 123.0, 68.0, 55.0, 31.0, 33.0, 22.0, 8.0, 16.0, 16.0, 6.0, 5.0, 3.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-56.3125, -54.46826171875, -52.6240234375, -50.77978515625, -48.935546875, -47.09130859375, -45.2470703125, -43.40283203125, -41.55859375, -39.71435546875, -37.8701171875, -36.02587890625, -34.181640625, -32.33740234375, -30.4931640625, -28.64892578125, -26.8046875, -24.96044921875, -23.1162109375, -21.27197265625, -19.427734375, -17.58349609375, -15.7392578125, -13.89501953125, -12.05078125, -10.20654296875, -8.3623046875, -6.51806640625, -4.673828125, -2.82958984375, -0.9853515625, 0.85888671875, 2.703125, 4.54736328125, 6.3916015625, 8.23583984375, 10.080078125, 11.92431640625, 13.7685546875, 15.61279296875, 17.45703125, 19.30126953125, 21.1455078125, 22.98974609375, 24.833984375, 26.67822265625, 28.5224609375, 30.36669921875, 32.2109375, 34.05517578125, 35.8994140625, 37.74365234375, 39.587890625, 41.43212890625, 43.2763671875, 45.12060546875, 46.96484375, 48.80908203125, 50.6533203125, 52.49755859375, 54.341796875, 56.18603515625, 58.0302734375, 59.87451171875, 61.71875]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 30.0, 190.0, 546.0, 213.0, 27.0, 4.0, 2.0, 2.0], "bins": [-139.81094360351562, -137.4203338623047, -135.0297393798828, -132.63912963867188, -130.24853515625, -127.85792541503906, -125.46732330322266, -123.07672119140625, -120.68611907958984, -118.29551696777344, -115.90491485595703, -113.51431274414062, -111.12370300292969, -108.73310089111328, -106.34249877929688, -103.95189666748047, -101.56129455566406, -99.17069244384766, -96.78009033203125, -94.38948822021484, -91.99888610839844, -89.6082763671875, -87.2176742553711, -84.82707214355469, -82.43647003173828, -80.04586791992188, -77.65526580810547, -75.26466369628906, -72.87405395507812, -70.48345184326172, -68.09284973144531, -65.7022476196289, -63.311649322509766, -60.92104721069336, -58.53044128417969, -56.13983917236328, -53.749237060546875, -51.35863494873047, -48.96803283691406, -46.57742691040039, -44.186824798583984, -41.79622268676758, -39.405616760253906, -37.0150146484375, -34.624412536621094, -32.23381042480469, -29.84320640563965, -27.45260238647461, -25.062000274658203, -22.671398162841797, -20.280794143676758, -17.89019012451172, -15.499588012695312, -13.10898494720459, -10.718381881713867, -8.327777862548828, -5.937176704406738, -3.5465736389160156, -1.155970573425293, 1.2346324920654297, 3.6252355575561523, 6.015838623046875, 8.406441688537598, 10.797045707702637, 13.187647819519043]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 9.0, 3.0, 5.0, 6.0, 15.0, 10.0, 13.0, 16.0, 23.0, 23.0, 23.0, 23.0, 42.0, 24.0, 33.0, 41.0, 33.0, 38.0, 62.0, 45.0, 50.0, 51.0, 38.0, 34.0, 46.0, 28.0, 34.0, 35.0, 27.0, 23.0, 22.0, 23.0, 22.0, 13.0, 15.0, 11.0, 12.0, 11.0, 3.0, 5.0, 3.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-39.942039489746094, -38.56901168823242, -37.19598388671875, -35.822959899902344, -34.44993209838867, -33.076904296875, -31.70387840270996, -30.330852508544922, -28.95782470703125, -27.584796905517578, -26.21177101135254, -24.8387451171875, -23.465717315673828, -22.092689514160156, -20.719663619995117, -19.346637725830078, -17.973609924316406, -16.600582122802734, -15.227556228637695, -13.85452938079834, -12.481502532958984, -11.108475685119629, -9.735448837280273, -8.362421989440918, -6.9893951416015625, -5.616368293762207, -4.243341445922852, -2.870314598083496, -1.4972877502441406, -0.12426090240478516, 1.2487659454345703, 2.621792793273926, 3.9948158264160156, 5.367842674255371, 6.740869522094727, 8.113896369934082, 9.486923217773438, 10.859950065612793, 12.232976913452148, 13.606003761291504, 14.97903060913086, 16.35205841064453, 17.72508430480957, 19.09811019897461, 20.47113800048828, 21.844165802001953, 23.217191696166992, 24.59021759033203, 25.963245391845703, 27.336273193359375, 28.709299087524414, 30.082324981689453, 31.455352783203125, 32.8283805847168, 34.20140838623047, 35.574432373046875, 36.94746017456055, 38.32048797607422, 39.693511962890625, 41.0665397644043, 42.43956756591797, 43.81259536743164, 45.18562316894531, 46.55864715576172, 47.93167495727539]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 1.0, 3.0, 5.0, 6.0, 6.0, 3.0, 15.0, 15.0, 8.0, 16.0, 19.0, 24.0, 19.0, 27.0, 19.0, 29.0, 39.0, 42.0, 34.0, 38.0, 44.0, 41.0, 43.0, 45.0, 46.0, 41.0, 41.0, 48.0, 32.0, 30.0, 34.0, 31.0, 28.0, 19.0, 21.0, 20.0, 14.0, 15.0, 12.0, 2.0, 8.0, 7.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0, -7.734375, -7.46875, -7.203125, -6.9375, -6.671875, -6.40625, -6.140625, -5.875, -5.609375, -5.34375, -5.078125, -4.8125, -4.546875, -4.28125, -4.015625, -3.75, -3.484375, -3.21875, -2.953125, -2.6875, -2.421875, -2.15625, -1.890625, -1.625, -1.359375, -1.09375, -0.828125, -0.5625, -0.296875, -0.03125, 0.234375, 0.5, 0.765625, 1.03125, 1.296875, 1.5625, 1.828125, 2.09375, 2.359375, 2.625, 2.890625, 3.15625, 3.421875, 3.6875, 3.953125, 4.21875, 4.484375, 4.75, 5.015625, 5.28125, 5.546875, 5.8125, 6.078125, 6.34375, 6.609375, 6.875, 7.140625, 7.40625, 7.671875, 7.9375, 8.203125, 8.46875, 8.734375, 9.0]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 5.0, 2.0, 6.0, 11.0, 14.0, 14.0, 21.0, 31.0, 22.0, 41.0, 45.0, 61.0, 58.0, 96.0, 107.0, 146.0, 185.0, 235.0, 351.0, 530.0, 919.0, 2252.0, 14219.0, 2560446.0, 1599058.0, 10708.0, 1919.0, 849.0, 537.0, 338.0, 272.0, 169.0, 120.0, 96.0, 82.0, 57.0, 55.0, 43.0, 37.0, 22.0, 27.0, 21.0, 16.0, 16.0, 11.0, 6.0, 5.0, 6.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-46.3125, -44.765625, -43.21875, -41.671875, -40.125, -38.578125, -37.03125, -35.484375, -33.9375, -32.390625, -30.84375, -29.296875, -27.75, -26.203125, -24.65625, -23.109375, -21.5625, -20.015625, -18.46875, -16.921875, -15.375, -13.828125, -12.28125, -10.734375, -9.1875, -7.640625, -6.09375, -4.546875, -3.0, -1.453125, 0.09375, 1.640625, 3.1875, 4.734375, 6.28125, 7.828125, 9.375, 10.921875, 12.46875, 14.015625, 15.5625, 17.109375, 18.65625, 20.203125, 21.75, 23.296875, 24.84375, 26.390625, 27.9375, 29.484375, 31.03125, 32.578125, 34.125, 35.671875, 37.21875, 38.765625, 40.3125, 41.859375, 43.40625, 44.953125, 46.5, 48.046875, 49.59375, 51.140625, 52.6875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0, 7.0, 1.0, 10.0, 9.0, 23.0, 60.0, 82.0, 177.0, 335.0, 665.0, 1044.0, 776.0, 447.0, 196.0, 106.0, 67.0, 25.0, 22.0, 7.0, 8.0, 4.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-32.71875, -31.9862060546875, -31.253662109375, -30.5211181640625, -29.78857421875, -29.0560302734375, -28.323486328125, -27.5909423828125, -26.8583984375, -26.1258544921875, -25.393310546875, -24.6607666015625, -23.92822265625, -23.1956787109375, -22.463134765625, -21.7305908203125, -20.998046875, -20.2655029296875, -19.532958984375, -18.8004150390625, -18.06787109375, -17.3353271484375, -16.602783203125, -15.8702392578125, -15.1376953125, -14.4051513671875, -13.672607421875, -12.9400634765625, -12.20751953125, -11.4749755859375, -10.742431640625, -10.0098876953125, -9.27734375, -8.5447998046875, -7.812255859375, -7.0797119140625, -6.34716796875, -5.6146240234375, -4.882080078125, -4.1495361328125, -3.4169921875, -2.6844482421875, -1.951904296875, -1.2193603515625, -0.48681640625, 0.2457275390625, 0.978271484375, 1.7108154296875, 2.443359375, 3.1759033203125, 3.908447265625, 4.6409912109375, 5.37353515625, 6.1060791015625, 6.838623046875, 7.5711669921875, 8.3037109375, 9.0362548828125, 9.768798828125, 10.5013427734375, 11.23388671875, 11.9664306640625, 12.698974609375, 13.4315185546875, 14.1640625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 7.0, 10.0, 17.0, 39.0, 88.0, 166.0, 498.0, 2369.0, 40642.0, 3957252.0, 187404.0, 4612.0, 752.0, 219.0, 101.0, 46.0, 25.0, 12.0, 7.0, 8.0, 5.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.34375, -43.10009765625, -41.8564453125, -40.61279296875, -39.369140625, -38.12548828125, -36.8818359375, -35.63818359375, -34.39453125, -33.15087890625, -31.9072265625, -30.66357421875, -29.419921875, -28.17626953125, -26.9326171875, -25.68896484375, -24.4453125, -23.20166015625, -21.9580078125, -20.71435546875, -19.470703125, -18.22705078125, -16.9833984375, -15.73974609375, -14.49609375, -13.25244140625, -12.0087890625, -10.76513671875, -9.521484375, -8.27783203125, -7.0341796875, -5.79052734375, -4.546875, -3.30322265625, -2.0595703125, -0.81591796875, 0.427734375, 1.67138671875, 2.9150390625, 4.15869140625, 5.40234375, 6.64599609375, 7.8896484375, 9.13330078125, 10.376953125, 11.62060546875, 12.8642578125, 14.10791015625, 15.3515625, 16.59521484375, 17.8388671875, 19.08251953125, 20.326171875, 21.56982421875, 22.8134765625, 24.05712890625, 25.30078125, 26.54443359375, 27.7880859375, 29.03173828125, 30.275390625, 31.51904296875, 32.7626953125, 34.00634765625, 35.25]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 8.0, 11.0, 20.0, 53.0, 61.0, 106.0, 147.0, 176.0, 153.0, 100.0, 67.0, 46.0, 15.0, 14.0, 9.0, 10.0, 3.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.93859100341797, -87.90706634521484, -83.87554931640625, -79.84402465820312, -75.8125, -71.78097534179688, -67.74945068359375, -63.717933654785156, -59.68640899658203, -55.654884338378906, -51.62336349487305, -47.59184265136719, -43.56031799316406, -39.52879333496094, -35.49727249145508, -31.465749740600586, -27.434226989746094, -23.4027042388916, -19.37118148803711, -15.339658737182617, -11.308135986328125, -7.276613235473633, -3.2450904846191406, 0.7864322662353516, 4.817955017089844, 8.849477767944336, 12.881000518798828, 16.91252326965332, 20.944046020507812, 24.975568771362305, 29.007091522216797, 33.038612365722656, 37.07014465332031, 41.10166931152344, 45.1331901550293, 49.164710998535156, 53.19623565673828, 57.227760314941406, 61.259281158447266, 65.29080200195312, 69.32232666015625, 73.35385131835938, 77.3853759765625, 81.4168930053711, 85.44841766357422, 89.47994232177734, 93.51145935058594, 97.54298400878906, 101.57450866699219, 105.60603332519531, 109.63755798339844, 113.66907501220703, 117.70059967041016, 121.73212432861328, 125.76364135742188, 129.795166015625, 133.82669067382812, 137.85821533203125, 141.88973999023438, 145.9212646484375, 149.95278930664062, 153.9842987060547, 158.0158233642578, 162.04734802246094, 166.07887268066406]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 3.0, 4.0, 7.0, 10.0, 15.0, 13.0, 13.0, 12.0, 21.0, 21.0, 20.0, 24.0, 27.0, 27.0, 31.0, 40.0, 34.0, 37.0, 45.0, 38.0, 30.0, 40.0, 43.0, 45.0, 36.0, 34.0, 39.0, 37.0, 42.0, 22.0, 25.0, 22.0, 24.0, 13.0, 16.0, 18.0, 17.0, 10.0, 6.0, 13.0, 8.0, 7.0, 5.0, 2.0, 1.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-47.35752487182617, -45.88702392578125, -44.416526794433594, -42.94602584838867, -41.47552490234375, -40.005027770996094, -38.53452682495117, -37.06402587890625, -35.593528747558594, -34.12302780151367, -32.652530670166016, -31.182029724121094, -29.711528778076172, -28.241029739379883, -26.770530700683594, -25.300029754638672, -23.82952880859375, -22.35902976989746, -20.88852882385254, -19.41802978515625, -17.947528839111328, -16.47702980041504, -15.00653076171875, -13.536030769348145, -12.065530776977539, -10.595030784606934, -9.124530792236328, -7.654031753540039, -6.183531761169434, -4.713031768798828, -3.242532730102539, -1.7720327377319336, -0.3015327453613281, 1.1689670085906982, 2.6394667625427246, 4.109966278076172, 5.580466270446777, 7.050966262817383, 8.521465301513672, 9.991965293884277, 11.462465286254883, 12.932965278625488, 14.403465270996094, 15.873964309692383, 17.344463348388672, 18.814964294433594, 20.285463333129883, 21.755962371826172, 23.226463317871094, 24.696962356567383, 26.167463302612305, 27.637962341308594, 29.108463287353516, 30.578962326049805, 32.049461364746094, 33.519962310791016, 34.99046325683594, 36.46096420288086, 37.931461334228516, 39.40196228027344, 40.87246322631836, 42.34296417236328, 43.81346130371094, 45.28396224975586, 46.754459381103516]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 4.0, 2.0, 9.0, 4.0, 11.0, 9.0, 10.0, 14.0, 11.0, 21.0, 14.0, 20.0, 27.0, 29.0, 31.0, 38.0, 40.0, 25.0, 36.0, 51.0, 37.0, 38.0, 32.0, 35.0, 32.0, 44.0, 43.0, 35.0, 39.0, 39.0, 29.0, 26.0, 33.0, 15.0, 20.0, 9.0, 12.0, 13.0, 15.0, 12.0, 11.0, 8.0, 8.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-79.5, -77.1416015625, -74.783203125, -72.4248046875, -70.06640625, -67.7080078125, -65.349609375, -62.9912109375, -60.6328125, -58.2744140625, -55.916015625, -53.5576171875, -51.19921875, -48.8408203125, -46.482421875, -44.1240234375, -41.765625, -39.4072265625, -37.048828125, -34.6904296875, -32.33203125, -29.9736328125, -27.615234375, -25.2568359375, -22.8984375, -20.5400390625, -18.181640625, -15.8232421875, -13.46484375, -11.1064453125, -8.748046875, -6.3896484375, -4.03125, -1.6728515625, 0.685546875, 3.0439453125, 5.40234375, 7.7607421875, 10.119140625, 12.4775390625, 14.8359375, 17.1943359375, 19.552734375, 21.9111328125, 24.26953125, 26.6279296875, 28.986328125, 31.3447265625, 33.703125, 36.0615234375, 38.419921875, 40.7783203125, 43.13671875, 45.4951171875, 47.853515625, 50.2119140625, 52.5703125, 54.9287109375, 57.287109375, 59.6455078125, 62.00390625, 64.3623046875, 66.720703125, 69.0791015625, 71.4375]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 5.0, 8.0, 7.0, 7.0, 21.0, 19.0, 44.0, 47.0, 70.0, 112.0, 183.0, 242.0, 383.0, 551.0, 867.0, 1249.0, 1906.0, 2917.0, 4340.0, 6621.0, 10143.0, 15386.0, 23959.0, 36782.0, 56963.0, 87866.0, 139854.0, 200189.0, 163877.0, 103810.0, 66568.0, 42748.0, 27966.0, 18168.0, 11796.0, 7666.0, 5103.0, 3446.0, 2249.0, 1452.0, 998.0, 674.0, 407.0, 302.0, 203.0, 123.0, 90.0, 51.0, 46.0, 28.0, 16.0, 16.0, 5.0, 7.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0], "bins": [-9.3046875, -9.010986328125, -8.71728515625, -8.423583984375, -8.1298828125, -7.836181640625, -7.54248046875, -7.248779296875, -6.955078125, -6.661376953125, -6.36767578125, -6.073974609375, -5.7802734375, -5.486572265625, -5.19287109375, -4.899169921875, -4.60546875, -4.311767578125, -4.01806640625, -3.724365234375, -3.4306640625, -3.136962890625, -2.84326171875, -2.549560546875, -2.255859375, -1.962158203125, -1.66845703125, -1.374755859375, -1.0810546875, -0.787353515625, -0.49365234375, -0.199951171875, 0.09375, 0.387451171875, 0.68115234375, 0.974853515625, 1.2685546875, 1.562255859375, 1.85595703125, 2.149658203125, 2.443359375, 2.737060546875, 3.03076171875, 3.324462890625, 3.6181640625, 3.911865234375, 4.20556640625, 4.499267578125, 4.79296875, 5.086669921875, 5.38037109375, 5.674072265625, 5.9677734375, 6.261474609375, 6.55517578125, 6.848876953125, 7.142578125, 7.436279296875, 7.72998046875, 8.023681640625, 8.3173828125, 8.611083984375, 8.90478515625, 9.198486328125, 9.4921875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 2.0, 6.0, 3.0, 6.0, 6.0, 20.0, 15.0, 14.0, 14.0, 38.0, 28.0, 23.0, 27.0, 45.0, 43.0, 45.0, 34.0, 39.0, 36.0, 1072.0, 31.0, 47.0, 39.0, 40.0, 40.0, 35.0, 45.0, 40.0, 32.0, 34.0, 26.0, 18.0, 22.0, 17.0, 8.0, 13.0, 4.0, 8.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-52.4375, -50.68896484375, -48.9404296875, -47.19189453125, -45.443359375, -43.69482421875, -41.9462890625, -40.19775390625, -38.44921875, -36.70068359375, -34.9521484375, -33.20361328125, -31.455078125, -29.70654296875, -27.9580078125, -26.20947265625, -24.4609375, -22.71240234375, -20.9638671875, -19.21533203125, -17.466796875, -15.71826171875, -13.9697265625, -12.22119140625, -10.47265625, -8.72412109375, -6.9755859375, -5.22705078125, -3.478515625, -1.72998046875, 0.0185546875, 1.76708984375, 3.515625, 5.26416015625, 7.0126953125, 8.76123046875, 10.509765625, 12.25830078125, 14.0068359375, 15.75537109375, 17.50390625, 19.25244140625, 21.0009765625, 22.74951171875, 24.498046875, 26.24658203125, 27.9951171875, 29.74365234375, 31.4921875, 33.24072265625, 34.9892578125, 36.73779296875, 38.486328125, 40.23486328125, 41.9833984375, 43.73193359375, 45.48046875, 47.22900390625, 48.9775390625, 50.72607421875, 52.474609375, 54.22314453125, 55.9716796875, 57.72021484375, 59.46875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 14.0, 13.0, 19.0, 25.0, 27.0, 48.0, 69.0, 114.0, 182.0, 274.0, 449.0, 606.0, 936.0, 1419.0, 2306.0, 3686.0, 5574.0, 8727.0, 13899.0, 21832.0, 34849.0, 55328.0, 87384.0, 137702.0, 1249852.0, 171688.0, 110311.0, 69297.0, 44518.0, 27784.0, 17545.0, 10943.0, 7030.0, 4538.0, 2911.0, 1827.0, 1193.0, 776.0, 471.0, 328.0, 213.0, 154.0, 102.0, 53.0, 44.0, 26.0, 19.0, 12.0, 11.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.34375, -9.0399169921875, -8.736083984375, -8.4322509765625, -8.12841796875, -7.8245849609375, -7.520751953125, -7.2169189453125, -6.9130859375, -6.6092529296875, -6.305419921875, -6.0015869140625, -5.69775390625, -5.3939208984375, -5.090087890625, -4.7862548828125, -4.482421875, -4.1785888671875, -3.874755859375, -3.5709228515625, -3.26708984375, -2.9632568359375, -2.659423828125, -2.3555908203125, -2.0517578125, -1.7479248046875, -1.444091796875, -1.1402587890625, -0.83642578125, -0.5325927734375, -0.228759765625, 0.0750732421875, 0.37890625, 0.6827392578125, 0.986572265625, 1.2904052734375, 1.59423828125, 1.8980712890625, 2.201904296875, 2.5057373046875, 2.8095703125, 3.1134033203125, 3.417236328125, 3.7210693359375, 4.02490234375, 4.3287353515625, 4.632568359375, 4.9364013671875, 5.240234375, 5.5440673828125, 5.847900390625, 6.1517333984375, 6.45556640625, 6.7593994140625, 7.063232421875, 7.3670654296875, 7.6708984375, 7.9747314453125, 8.278564453125, 8.5823974609375, 8.88623046875, 9.1900634765625, 9.493896484375, 9.7977294921875, 10.1015625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 5.0, 5.0, 9.0, 12.0, 9.0, 12.0, 20.0, 33.0, 31.0, 30.0, 47.0, 50.0, 56.0, 61.0, 48.0, 54.0, 62.0, 51.0, 46.0, 38.0, 45.0, 45.0, 46.0, 37.0, 23.0, 27.0, 22.0, 14.0, 15.0, 10.0, 10.0, 7.0, 8.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.022674560546875, -0.02207040786743164, -0.02146625518798828, -0.020862102508544922, -0.020257949829101562, -0.019653797149658203, -0.019049644470214844, -0.018445491790771484, -0.017841339111328125, -0.017237186431884766, -0.016633033752441406, -0.016028881072998047, -0.015424728393554688, -0.014820575714111328, -0.014216423034667969, -0.01361227035522461, -0.01300811767578125, -0.01240396499633789, -0.011799812316894531, -0.011195659637451172, -0.010591506958007812, -0.009987354278564453, -0.009383201599121094, -0.008779048919677734, -0.008174896240234375, -0.007570743560791016, -0.006966590881347656, -0.006362438201904297, -0.0057582855224609375, -0.005154132843017578, -0.004549980163574219, -0.003945827484130859, -0.0033416748046875, -0.0027375221252441406, -0.0021333694458007812, -0.0015292167663574219, -0.0009250640869140625, -0.0003209114074707031, 0.00028324127197265625, 0.0008873939514160156, 0.001491546630859375, 0.0020956993103027344, 0.0026998519897460938, 0.003304004669189453, 0.0039081573486328125, 0.004512310028076172, 0.005116462707519531, 0.005720615386962891, 0.00632476806640625, 0.006928920745849609, 0.007533073425292969, 0.008137226104736328, 0.008741378784179688, 0.009345531463623047, 0.009949684143066406, 0.010553836822509766, 0.011157989501953125, 0.011762142181396484, 0.012366294860839844, 0.012970447540283203, 0.013574600219726562, 0.014178752899169922, 0.014782905578613281, 0.01538705825805664, 0.0159912109375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 7.0, 8.0, 9.0, 16.0, 22.0, 24.0, 55.0, 53.0, 76.0, 104.0, 156.0, 201.0, 305.0, 510.0, 1010.0, 2402.0, 8767.0, 47716.0, 351413.0, 530325.0, 84954.0, 13915.0, 3418.0, 1269.0, 649.0, 385.0, 243.0, 154.0, 116.0, 66.0, 68.0, 32.0, 27.0, 20.0, 12.0, 19.0, 12.0, 8.0, 4.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.156005859375, -0.15099716186523438, -0.14598846435546875, -0.14097976684570312, -0.1359710693359375, -0.13096237182617188, -0.12595367431640625, -0.12094497680664062, -0.115936279296875, -0.11092758178710938, -0.10591888427734375, -0.10091018676757812, -0.0959014892578125, -0.09089279174804688, -0.08588409423828125, -0.08087539672851562, -0.07586669921875, -0.07085800170898438, -0.06584930419921875, -0.060840606689453125, -0.0558319091796875, -0.050823211669921875, -0.04581451416015625, -0.040805816650390625, -0.035797119140625, -0.030788421630859375, -0.02577972412109375, -0.020771026611328125, -0.0157623291015625, -0.010753631591796875, -0.00574493408203125, -0.000736236572265625, 0.0042724609375, 0.009281158447265625, 0.01428985595703125, 0.019298553466796875, 0.0243072509765625, 0.029315948486328125, 0.03432464599609375, 0.039333343505859375, 0.044342041015625, 0.049350738525390625, 0.05435943603515625, 0.059368133544921875, 0.0643768310546875, 0.06938552856445312, 0.07439422607421875, 0.07940292358398438, 0.08441162109375, 0.08942031860351562, 0.09442901611328125, 0.09943771362304688, 0.1044464111328125, 0.10945510864257812, 0.11446380615234375, 0.11947250366210938, 0.124481201171875, 0.12948989868164062, 0.13449859619140625, 0.13950729370117188, 0.1445159912109375, 0.14952468872070312, 0.15453338623046875, 0.15954208374023438, 0.16455078125]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 11.0, 9.0, 17.0, 30.0, 38.0, 55.0, 83.0, 113.0, 131.0, 128.0, 107.0, 86.0, 68.0, 45.0, 26.0, 18.0, 12.0, 8.0, 5.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.014692848548293114, -0.014030023477971554, -0.013367198407649994, -0.012704374268651009, -0.012041548267006874, -0.011378724128007889, -0.010715899057686329, -0.010053073987364769, -0.009390248917043209, -0.00872742384672165, -0.00806459877640009, -0.007401774171739817, -0.006738949101418257, -0.006076124031096697, -0.005413299426436424, -0.004750474356114864, -0.0040876492857933044, -0.0034248242154717445, -0.0027619993779808283, -0.002099174540489912, -0.0014363494701683521, -0.0007735243998467922, -0.00011069979518651962, 0.0005521252751350403, 0.0012149503454566002, 0.0018777752993628383, 0.0025406002532690763, 0.0032034250907599926, 0.0038662501610815525, 0.004529075231403112, 0.005191899836063385, 0.005854724906384945, 0.006517549976706505, 0.007180375047028065, 0.007843200117349625, 0.00850602425634861, 0.009168850257992744, 0.00983167439699173, 0.01049449946731329, 0.01115732453763485, 0.01182014960795641, 0.01248297467827797, 0.01314579974859953, 0.01380862481892109, 0.014471448957920074, 0.015134274959564209, 0.015797099098563194, 0.01645992323756218, 0.017122749239206314, 0.0177855733782053, 0.018448399379849434, 0.01911122351884842, 0.019774049520492554, 0.02043687365949154, 0.021099697798490524, 0.02176252380013466, 0.022425349801778793, 0.02308817394077778, 0.023750999942421913, 0.0244138240814209, 0.025076650083065033, 0.025739474222064018, 0.026402298361063004, 0.027065124362707138, 0.027727948501706123]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 4.0, 2.0, 5.0, 8.0, 11.0, 11.0, 10.0, 15.0, 10.0, 23.0, 18.0, 23.0, 24.0, 29.0, 25.0, 31.0, 37.0, 37.0, 43.0, 29.0, 45.0, 41.0, 37.0, 38.0, 32.0, 36.0, 39.0, 28.0, 28.0, 25.0, 22.0, 29.0, 25.0, 22.0, 24.0, 25.0, 18.0, 10.0, 11.0, 15.0, 9.0, 7.0, 8.0, 6.0, 3.0, 9.0, 4.0, 10.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.008817911148071289, -0.008537821471691132, -0.008257731795310974, -0.007977642118930817, -0.007697552442550659, -0.007417462766170502, -0.007137373089790344, -0.006857283413410187, -0.006577193737030029, -0.006297104060649872, -0.006017014384269714, -0.005736924707889557, -0.005456835031509399, -0.005176745355129242, -0.0048966556787490845, -0.004616566002368927, -0.0043364763259887695, -0.004056386649608612, -0.0037762969732284546, -0.003496207296848297, -0.0032161176204681396, -0.002936027944087982, -0.0026559382677078247, -0.0023758485913276672, -0.0020957589149475098, -0.0018156692385673523, -0.0015355795621871948, -0.0012554898858070374, -0.0009754002094268799, -0.0006953105330467224, -0.00041522085666656494, -0.00013513118028640747, 0.00014495849609375, 0.00042504817247390747, 0.0007051378488540649, 0.0009852275252342224, 0.0012653172016143799, 0.0015454068779945374, 0.0018254965543746948, 0.0021055862307548523, 0.0023856759071350098, 0.0026657655835151672, 0.0029458552598953247, 0.003225944936275482, 0.0035060346126556396, 0.003786124289035797, 0.004066213965415955, 0.004346303641796112, 0.0046263933181762695, 0.004906482994556427, 0.0051865726709365845, 0.005466662347316742, 0.005746752023696899, 0.006026841700077057, 0.006306931376457214, 0.006587021052837372, 0.006867110729217529, 0.007147200405597687, 0.007427290081977844, 0.007707379758358002, 0.00798746943473816, 0.008267559111118317, 0.008547648787498474, 0.008827738463878632, 0.009107828140258789]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 4.0, 2.0, 9.0, 4.0, 11.0, 9.0, 10.0, 14.0, 11.0, 21.0, 14.0, 20.0, 27.0, 29.0, 32.0, 37.0, 40.0, 24.0, 37.0, 50.0, 38.0, 39.0, 31.0, 35.0, 32.0, 44.0, 42.0, 36.0, 39.0, 39.0, 30.0, 25.0, 33.0, 15.0, 20.0, 9.0, 12.0, 13.0, 15.0, 12.0, 11.0, 8.0, 8.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-79.5, -77.1416015625, -74.783203125, -72.4248046875, -70.06640625, -67.7080078125, -65.349609375, -62.9912109375, -60.6328125, -58.2744140625, -55.916015625, -53.5576171875, -51.19921875, -48.8408203125, -46.482421875, -44.1240234375, -41.765625, -39.4072265625, -37.048828125, -34.6904296875, -32.33203125, -29.9736328125, -27.615234375, -25.2568359375, -22.8984375, -20.5400390625, -18.181640625, -15.8232421875, -13.46484375, -11.1064453125, -8.748046875, -6.3896484375, -4.03125, -1.6728515625, 0.685546875, 3.0439453125, 5.40234375, 7.7607421875, 10.119140625, 12.4775390625, 14.8359375, 17.1943359375, 19.552734375, 21.9111328125, 24.26953125, 26.6279296875, 28.986328125, 31.3447265625, 33.703125, 36.0615234375, 38.419921875, 40.7783203125, 43.13671875, 45.4951171875, 47.853515625, 50.2119140625, 52.5703125, 54.9287109375, 57.287109375, 59.6455078125, 62.00390625, 64.3623046875, 66.720703125, 69.0791015625, 71.4375]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 13.0, 7.0, 12.0, 15.0, 16.0, 23.0, 38.0, 39.0, 67.0, 91.0, 132.0, 202.0, 324.0, 580.0, 1063.0, 1980.0, 3812.0, 8782.0, 25291.0, 110499.0, 571110.0, 253422.0, 45993.0, 13569.0, 5454.0, 2632.0, 1353.0, 803.0, 434.0, 255.0, 156.0, 114.0, 76.0, 54.0, 22.0, 25.0, 23.0, 21.0, 14.0, 7.0, 11.0, 4.0, 5.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-21.390625, -20.75634765625, -20.1220703125, -19.48779296875, -18.853515625, -18.21923828125, -17.5849609375, -16.95068359375, -16.31640625, -15.68212890625, -15.0478515625, -14.41357421875, -13.779296875, -13.14501953125, -12.5107421875, -11.87646484375, -11.2421875, -10.60791015625, -9.9736328125, -9.33935546875, -8.705078125, -8.07080078125, -7.4365234375, -6.80224609375, -6.16796875, -5.53369140625, -4.8994140625, -4.26513671875, -3.630859375, -2.99658203125, -2.3623046875, -1.72802734375, -1.09375, -0.45947265625, 0.1748046875, 0.80908203125, 1.443359375, 2.07763671875, 2.7119140625, 3.34619140625, 3.98046875, 4.61474609375, 5.2490234375, 5.88330078125, 6.517578125, 7.15185546875, 7.7861328125, 8.42041015625, 9.0546875, 9.68896484375, 10.3232421875, 10.95751953125, 11.591796875, 12.22607421875, 12.8603515625, 13.49462890625, 14.12890625, 14.76318359375, 15.3974609375, 16.03173828125, 16.666015625, 17.30029296875, 17.9345703125, 18.56884765625, 19.203125]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 8.0, 9.0, 13.0, 18.0, 25.0, 37.0, 36.0, 49.0, 51.0, 80.0, 69.0, 99.0, 2124.0, 74.0, 74.0, 63.0, 47.0, 44.0, 34.0, 20.0, 26.0, 11.0, 12.0, 9.0, 7.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-213.125, -206.33984375, -199.5546875, -192.76953125, -185.984375, -179.19921875, -172.4140625, -165.62890625, -158.84375, -152.05859375, -145.2734375, -138.48828125, -131.703125, -124.91796875, -118.1328125, -111.34765625, -104.5625, -97.77734375, -90.9921875, -84.20703125, -77.421875, -70.63671875, -63.8515625, -57.06640625, -50.28125, -43.49609375, -36.7109375, -29.92578125, -23.140625, -16.35546875, -9.5703125, -2.78515625, 4.0, 10.78515625, 17.5703125, 24.35546875, 31.140625, 37.92578125, 44.7109375, 51.49609375, 58.28125, 65.06640625, 71.8515625, 78.63671875, 85.421875, 92.20703125, 98.9921875, 105.77734375, 112.5625, 119.34765625, 126.1328125, 132.91796875, 139.703125, 146.48828125, 153.2734375, 160.05859375, 166.84375, 173.62890625, 180.4140625, 187.19921875, 193.984375, 200.76953125, 207.5546875, 214.33984375, 221.125]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 3.0, 6.0, 10.0, 9.0, 14.0, 16.0, 23.0, 36.0, 59.0, 80.0, 120.0, 190.0, 318.0, 627.0, 1446.0, 4216.0, 43993.0, 2984604.0, 99964.0, 6366.0, 1825.0, 773.0, 365.0, 212.0, 135.0, 99.0, 50.0, 39.0, 24.0, 22.0, 17.0, 8.0, 9.0, 3.0, 6.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-46.21875, -44.7568359375, -43.294921875, -41.8330078125, -40.37109375, -38.9091796875, -37.447265625, -35.9853515625, -34.5234375, -33.0615234375, -31.599609375, -30.1376953125, -28.67578125, -27.2138671875, -25.751953125, -24.2900390625, -22.828125, -21.3662109375, -19.904296875, -18.4423828125, -16.98046875, -15.5185546875, -14.056640625, -12.5947265625, -11.1328125, -9.6708984375, -8.208984375, -6.7470703125, -5.28515625, -3.8232421875, -2.361328125, -0.8994140625, 0.5625, 2.0244140625, 3.486328125, 4.9482421875, 6.41015625, 7.8720703125, 9.333984375, 10.7958984375, 12.2578125, 13.7197265625, 15.181640625, 16.6435546875, 18.10546875, 19.5673828125, 21.029296875, 22.4912109375, 23.953125, 25.4150390625, 26.876953125, 28.3388671875, 29.80078125, 31.2626953125, 32.724609375, 34.1865234375, 35.6484375, 37.1103515625, 38.572265625, 40.0341796875, 41.49609375, 42.9580078125, 44.419921875, 45.8818359375, 47.34375]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 10.0, 35.0, 179.0, 642.0, 111.0, 18.0, 8.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1493.390869140625, -1466.4288330078125, -1439.466796875, -1412.5047607421875, -1385.542724609375, -1358.580810546875, -1331.6187744140625, -1304.65673828125, -1277.6947021484375, -1250.732666015625, -1223.7706298828125, -1196.80859375, -1169.8466796875, -1142.8846435546875, -1115.922607421875, -1088.9605712890625, -1061.99853515625, -1035.0364990234375, -1008.074462890625, -981.1124877929688, -954.1504516601562, -927.1884155273438, -900.2264404296875, -873.264404296875, -846.3023681640625, -819.34033203125, -792.3782958984375, -765.4163208007812, -738.4542846679688, -711.4922485351562, -684.5302734375, -657.5682373046875, -630.6062622070312, -603.6442260742188, -576.6822509765625, -549.72021484375, -522.7581787109375, -495.796142578125, -468.8341369628906, -441.87213134765625, -414.91009521484375, -387.94805908203125, -360.9860534667969, -334.0240478515625, -307.06201171875, -280.0999755859375, -253.13796997070312, -226.1759490966797, -199.21392822265625, -172.2519073486328, -145.28988647460938, -118.32786560058594, -91.3658447265625, -64.40382385253906, -37.441802978515625, -10.479782104492188, 16.48223876953125, 43.44425964355469, 70.40628051757812, 97.36830139160156, 124.330322265625, 151.29234313964844, 178.25436401367188, 205.2163848876953, 232.17840576171875]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 3.0, 3.0, 7.0, 12.0, 4.0, 10.0, 13.0, 22.0, 18.0, 18.0, 24.0, 19.0, 32.0, 43.0, 44.0, 42.0, 39.0, 52.0, 58.0, 46.0, 54.0, 53.0, 44.0, 44.0, 53.0, 44.0, 24.0, 37.0, 24.0, 21.0, 19.0, 11.0, 20.0, 10.0, 10.0, 6.0, 4.0, 1.0, 7.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-214.85885620117188, -208.4850311279297, -202.11122131347656, -195.73739624023438, -189.3635711669922, -182.98974609375, -176.61593627929688, -170.2421112060547, -163.8682861328125, -157.4944610595703, -151.1206512451172, -144.746826171875, -138.3730010986328, -131.99917602539062, -125.6253662109375, -119.25154113769531, -112.87773132324219, -106.50391387939453, -100.13008880615234, -93.75627136230469, -87.3824462890625, -81.00862884521484, -74.63481140136719, -68.260986328125, -61.887168884277344, -55.51334762573242, -49.1395263671875, -42.765708923339844, -36.39188766479492, -30.01806640625, -23.644248962402344, -17.270427703857422, -10.8966064453125, -4.5227861404418945, 1.851034164428711, 8.224853515625, 14.598674774169922, 20.972496032714844, 27.3463134765625, 33.72013473510742, 40.093955993652344, 46.467777252197266, 52.84159851074219, 59.215415954589844, 65.5892333984375, 71.96305847167969, 78.33687591552734, 84.710693359375, 91.08451843261719, 97.45833587646484, 103.83216094970703, 110.20597839355469, 116.57980346679688, 122.95362091064453, 129.3274383544922, 135.70126342773438, 142.0750732421875, 148.4488983154297, 154.8227081298828, 161.196533203125, 167.5703582763672, 173.94418334960938, 180.3179931640625, 186.6918182373047, 193.06564331054688]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 8.0, 7.0, 17.0, 17.0, 24.0, 25.0, 33.0, 24.0, 46.0, 70.0, 92.0, 120.0, 168.0, 217.0, 295.0, 417.0, 640.0, 793.0, 1382.0, 1040823.0, 868.0, 637.0, 521.0, 339.0, 222.0, 187.0, 118.0, 92.0, 76.0, 57.0, 42.0, 41.0, 30.0, 21.0, 12.0, 13.0, 22.0, 11.0, 3.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-46.26725387573242, -44.62516784667969, -42.98308181762695, -41.34099578857422, -39.69891357421875, -38.05682373046875, -36.41474151611328, -34.77265548706055, -33.13056945800781, -31.488483428955078, -29.846397399902344, -28.204313278198242, -26.562227249145508, -24.920141220092773, -23.278057098388672, -21.635971069335938, -19.993885040283203, -18.35179901123047, -16.709712982177734, -15.067628860473633, -13.425542831420898, -11.783456802368164, -10.141371726989746, -8.499286651611328, -6.857200622558594, -5.215115070343018, -3.5730295181274414, -1.9309439659118652, -0.28885841369628906, 1.3532276153564453, 2.9953126907348633, 4.637397766113281, 6.27947998046875, 7.921565532684326, 9.563651084899902, 11.20573616027832, 12.847822189331055, 14.489908218383789, 16.13199234008789, 17.774078369140625, 19.41616439819336, 21.058250427246094, 22.700336456298828, 24.34242057800293, 25.984506607055664, 27.6265926361084, 29.2686767578125, 30.910762786865234, 32.55284881591797, 34.1949348449707, 35.83702087402344, 37.47910690307617, 39.121192932128906, 40.763275146484375, 42.40536117553711, 44.047447204589844, 45.68953323364258, 47.33161926269531, 48.97370529174805, 50.61579132080078, 52.25787353515625, 53.89996337890625, 55.54204559326172, 57.18413162231445, 58.82621765136719]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 12.0, 12.0, 10.0, 11.0, 31.0, 149.0, 51462728.0, 114.0, 36.0, 12.0, 5.0, 5.0, 4.0, 4.0, 6.0, 3.0, 5.0, 4.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8412.0771484375, -8002.13037109375, -7592.18359375, -7182.2373046875, -6772.2900390625, -6362.34375, -5952.39697265625, -5542.4501953125, -5132.50341796875, -4722.556640625, -4312.60986328125, -3902.663330078125, -3492.716552734375, -3082.769775390625, -2672.8232421875, -2262.87646484375, -1852.9296875, -1442.98291015625, -1033.0362548828125, -623.089599609375, -213.142822265625, 196.803955078125, 606.75048828125, 1016.697265625, 1426.64404296875, 1836.5908203125, 2246.53759765625, 2656.484130859375, 3066.430908203125, 3476.377685546875, 3886.32421875, 4296.27099609375, 4706.216796875, 5116.16357421875, 5526.1103515625, 5936.056640625, 6346.00390625, 6755.9501953125, 7165.89697265625, 7575.84375, 7985.79052734375, 8395.7373046875, 8805.68359375, 9215.630859375, 9625.5771484375, 10035.5244140625, 10445.470703125, 10855.41796875, 11265.3642578125, 11675.310546875, 12085.2578125, 12495.2041015625, 12905.1513671875, 13315.09765625, 13725.044921875, 14134.9912109375, 14544.9375, 14954.8837890625, 15364.8310546875, 15774.77734375, 16184.724609375, 16594.671875, 17004.6171875, 17414.564453125, 17824.51171875]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 0.0, 7.0, 6.0, 18.0, 19.0, 27.0, 25.0, 54.0, 90.0, 114.0, 154.0, 237.0, 296.0, 427.0, 577.0, 944.0, 1491.0, 2099.0, 3120.0, 4744.0, 7354.0, 11174.0, 17590.0, 27807.0, 42489.0, 65475.0, 100597.0, 161749.0, 266913.0, 501835.0, 3710630.0, 589430.0, 292243.0, 175108.0, 109623.0, 69264.0, 44425.0, 28995.0, 18415.0, 12532.0, 7869.0, 5245.0, 3554.0, 2236.0, 1518.0, 987.0, 600.0, 470.0, 281.0, 176.0, 114.0, 87.0, 70.0, 49.0, 29.0, 28.0, 12.0, 7.0, 6.0, 5.0, 6.0, 2.0, 6.0], "bins": [-4.98046875, -4.82275390625, -4.6650390625, -4.50732421875, -4.349609375, -4.19189453125, -4.0341796875, -3.87646484375, -3.71875, -3.56103515625, -3.4033203125, -3.24560546875, -3.087890625, -2.93017578125, -2.7724609375, -2.61474609375, -2.45703125, -2.29931640625, -2.1416015625, -1.98388671875, -1.826171875, -1.66845703125, -1.5107421875, -1.35302734375, -1.1953125, -1.03759765625, -0.8798828125, -0.72216796875, -0.564453125, -0.40673828125, -0.2490234375, -0.09130859375, 0.06640625, 0.22412109375, 0.3818359375, 0.53955078125, 0.697265625, 0.85498046875, 1.0126953125, 1.17041015625, 1.328125, 1.48583984375, 1.6435546875, 1.80126953125, 1.958984375, 2.11669921875, 2.2744140625, 2.43212890625, 2.58984375, 2.74755859375, 2.9052734375, 3.06298828125, 3.220703125, 3.37841796875, 3.5361328125, 3.69384765625, 3.8515625, 4.00927734375, 4.1669921875, 4.32470703125, 4.482421875, 4.64013671875, 4.7978515625, 4.95556640625, 5.11328125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 4.0, 5.0, 6.0, 7.0, 8.0, 13.0, 9.0, 16.0, 10.0, 15.0, 18.0, 17.0, 22.0, 23.0, 28.0, 26.0, 20.0, 33.0, 39.0, 53.0, 47.0, 74.0, 342.0, 640.0, 120.0, 41.0, 29.0, 36.0, 47.0, 32.0, 46.0, 32.0, 25.0, 20.0, 26.0, 16.0, 15.0, 14.0, 16.0, 11.0, 7.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 4.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.046875, -16.500244140625, -15.95361328125, -15.406982421875, -14.8603515625, -14.313720703125, -13.76708984375, -13.220458984375, -12.673828125, -12.127197265625, -11.58056640625, -11.033935546875, -10.4873046875, -9.940673828125, -9.39404296875, -8.847412109375, -8.30078125, -7.754150390625, -7.20751953125, -6.660888671875, -6.1142578125, -5.567626953125, -5.02099609375, -4.474365234375, -3.927734375, -3.381103515625, -2.83447265625, -2.287841796875, -1.7412109375, -1.194580078125, -0.64794921875, -0.101318359375, 0.4453125, 0.991943359375, 1.53857421875, 2.085205078125, 2.6318359375, 3.178466796875, 3.72509765625, 4.271728515625, 4.818359375, 5.364990234375, 5.91162109375, 6.458251953125, 7.0048828125, 7.551513671875, 8.09814453125, 8.644775390625, 9.19140625, 9.738037109375, 10.28466796875, 10.831298828125, 11.3779296875, 11.924560546875, 12.47119140625, 13.017822265625, 13.564453125, 14.111083984375, 14.65771484375, 15.204345703125, 15.7509765625, 16.297607421875, 16.84423828125, 17.390869140625, 17.9375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 9.0, 17.0, 21.0, 21.0, 31.0, 37.0, 67.0, 118.0, 202.0, 307.0, 399.0, 527.0, 858.0, 1326.0, 2069.0, 2933.0, 4740.0, 7505.0, 11972.0, 19286.0, 33290.0, 58605.0, 107835.0, 215257.0, 488625.0, 3906621.0, 813894.0, 293322.0, 141828.0, 74140.0, 41390.0, 24292.0, 14582.0, 9115.0, 5665.0, 3522.0, 2427.0, 1550.0, 990.0, 642.0, 448.0, 309.0, 238.0, 167.0, 81.0, 53.0, 30.0, 17.0, 24.0, 13.0, 10.0, 17.0, 2.0, 0.0, 3.0], "bins": [-7.75, -7.52667236328125, -7.3033447265625, -7.08001708984375, -6.856689453125, -6.63336181640625, -6.4100341796875, -6.18670654296875, -5.96337890625, -5.74005126953125, -5.5167236328125, -5.29339599609375, -5.070068359375, -4.84674072265625, -4.6234130859375, -4.40008544921875, -4.1767578125, -3.95343017578125, -3.7301025390625, -3.50677490234375, -3.283447265625, -3.06011962890625, -2.8367919921875, -2.61346435546875, -2.39013671875, -2.16680908203125, -1.9434814453125, -1.72015380859375, -1.496826171875, -1.27349853515625, -1.0501708984375, -0.82684326171875, -0.603515625, -0.38018798828125, -0.1568603515625, 0.06646728515625, 0.289794921875, 0.51312255859375, 0.7364501953125, 0.95977783203125, 1.18310546875, 1.40643310546875, 1.6297607421875, 1.85308837890625, 2.076416015625, 2.29974365234375, 2.5230712890625, 2.74639892578125, 2.9697265625, 3.19305419921875, 3.4163818359375, 3.63970947265625, 3.863037109375, 4.08636474609375, 4.3096923828125, 4.53302001953125, 4.75634765625, 4.97967529296875, 5.2030029296875, 5.42633056640625, 5.649658203125, 5.87298583984375, 6.0963134765625, 6.31964111328125, 6.54296875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 6.0, 3.0, 9.0, 9.0, 8.0, 12.0, 7.0, 13.0, 16.0, 14.0, 21.0, 20.0, 22.0, 25.0, 32.0, 38.0, 41.0, 50.0, 60.0, 126.0, 531.0, 391.0, 119.0, 54.0, 35.0, 38.0, 33.0, 42.0, 39.0, 40.0, 28.0, 27.0, 23.0, 20.0, 16.0, 15.0, 8.0, 7.0, 5.0, 4.0, 5.0, 6.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-11.5546875, -11.192138671875, -10.82958984375, -10.467041015625, -10.1044921875, -9.741943359375, -9.37939453125, -9.016845703125, -8.654296875, -8.291748046875, -7.92919921875, -7.566650390625, -7.2041015625, -6.841552734375, -6.47900390625, -6.116455078125, -5.75390625, -5.391357421875, -5.02880859375, -4.666259765625, -4.3037109375, -3.941162109375, -3.57861328125, -3.216064453125, -2.853515625, -2.490966796875, -2.12841796875, -1.765869140625, -1.4033203125, -1.040771484375, -0.67822265625, -0.315673828125, 0.046875, 0.409423828125, 0.77197265625, 1.134521484375, 1.4970703125, 1.859619140625, 2.22216796875, 2.584716796875, 2.947265625, 3.309814453125, 3.67236328125, 4.034912109375, 4.3974609375, 4.760009765625, 5.12255859375, 5.485107421875, 5.84765625, 6.210205078125, 6.57275390625, 6.935302734375, 7.2978515625, 7.660400390625, 8.02294921875, 8.385498046875, 8.748046875, 9.110595703125, 9.47314453125, 9.835693359375, 10.1982421875, 10.560791015625, 10.92333984375, 11.285888671875, 11.6484375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 0.0, 4.0, 0.0, 9.0, 16.0, 10.0, 10.0, 17.0, 33.0, 40.0, 31.0, 42.0, 67.0, 102.0, 145.0, 125.0, 216.0, 237.0, 307.0, 483.0, 613.0, 800.0, 1146.0, 1709.0, 2496.0, 4286.0, 7230.0, 14983.0, 35570.0, 123251.0, 5875749.0, 144795.0, 39224.0, 16203.0, 7901.0, 4494.0, 2732.0, 1709.0, 1230.0, 943.0, 611.0, 434.0, 337.0, 241.0, 220.0, 161.0, 103.0, 77.0, 82.0, 53.0, 32.0, 30.0, 14.0, 18.0, 22.0, 11.0, 10.0, 5.0, 12.0, 9.0, 8.0], "bins": [-19.125, -18.554931640625, -17.98486328125, -17.414794921875, -16.8447265625, -16.274658203125, -15.70458984375, -15.134521484375, -14.564453125, -13.994384765625, -13.42431640625, -12.854248046875, -12.2841796875, -11.714111328125, -11.14404296875, -10.573974609375, -10.00390625, -9.433837890625, -8.86376953125, -8.293701171875, -7.7236328125, -7.153564453125, -6.58349609375, -6.013427734375, -5.443359375, -4.873291015625, -4.30322265625, -3.733154296875, -3.1630859375, -2.593017578125, -2.02294921875, -1.452880859375, -0.8828125, -0.312744140625, 0.25732421875, 0.827392578125, 1.3974609375, 1.967529296875, 2.53759765625, 3.107666015625, 3.677734375, 4.247802734375, 4.81787109375, 5.387939453125, 5.9580078125, 6.528076171875, 7.09814453125, 7.668212890625, 8.23828125, 8.808349609375, 9.37841796875, 9.948486328125, 10.5185546875, 11.088623046875, 11.65869140625, 12.228759765625, 12.798828125, 13.368896484375, 13.93896484375, 14.509033203125, 15.0791015625, 15.649169921875, 16.21923828125, 16.789306640625, 17.359375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 6.0, 11.0, 9.0, 7.0, 6.0, 13.0, 22.0, 15.0, 25.0, 17.0, 19.0, 27.0, 28.0, 28.0, 29.0, 45.0, 56.0, 62.0, 108.0, 248.0, 465.0, 209.0, 95.0, 72.0, 41.0, 36.0, 33.0, 48.0, 28.0, 27.0, 30.0, 26.0, 15.0, 21.0, 12.0, 15.0, 10.0, 12.0, 13.0, 10.0, 6.0, 6.0, 4.0, 2.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.69140625, -7.46063232421875, -7.2298583984375, -6.99908447265625, -6.768310546875, -6.53753662109375, -6.3067626953125, -6.07598876953125, -5.84521484375, -5.61444091796875, -5.3836669921875, -5.15289306640625, -4.922119140625, -4.69134521484375, -4.4605712890625, -4.22979736328125, -3.9990234375, -3.76824951171875, -3.5374755859375, -3.30670166015625, -3.075927734375, -2.84515380859375, -2.6143798828125, -2.38360595703125, -2.15283203125, -1.92205810546875, -1.6912841796875, -1.46051025390625, -1.229736328125, -0.99896240234375, -0.7681884765625, -0.53741455078125, -0.306640625, -0.07586669921875, 0.1549072265625, 0.38568115234375, 0.616455078125, 0.84722900390625, 1.0780029296875, 1.30877685546875, 1.53955078125, 1.77032470703125, 2.0010986328125, 2.23187255859375, 2.462646484375, 2.69342041015625, 2.9241943359375, 3.15496826171875, 3.3857421875, 3.61651611328125, 3.8472900390625, 4.07806396484375, 4.308837890625, 4.53961181640625, 4.7703857421875, 5.00115966796875, 5.23193359375, 5.46270751953125, 5.6934814453125, 5.92425537109375, 6.155029296875, 6.38580322265625, 6.6165771484375, 6.84735107421875, 7.078125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 6.0, 5.0, 10.0, 40.0, 63.0, 115.0, 223.0, 242.0, 121.0, 77.0, 27.0, 23.0, 15.0, 12.0, 9.0, 3.0, 7.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.559688568115234, -26.752370834350586, -25.945053100585938, -25.137737274169922, -24.330419540405273, -23.523101806640625, -22.715784072875977, -21.908466339111328, -21.10114860534668, -20.29383087158203, -19.486513137817383, -18.679195404052734, -17.87187957763672, -17.06456184387207, -16.257244110107422, -15.449926376342773, -14.642609596252441, -13.835291862487793, -13.027975082397461, -12.220657348632812, -11.413339614868164, -10.606021881103516, -9.798705101013184, -8.991387367248535, -8.184070587158203, -7.376753330230713, -6.5694355964660645, -5.762118339538574, -4.954800605773926, -4.1474833488464355, -3.3401660919189453, -2.532848358154297, -1.7255306243896484, -0.9182131886482239, -0.11089575290679932, 0.6964216232299805, 1.5037391185760498, 2.311056613922119, 3.1183738708496094, 3.925691604614258, 4.733008861541748, 5.540326118469238, 6.347643852233887, 7.154961109161377, 7.962278366088867, 8.769596099853516, 9.576913833618164, 10.384231567382812, 11.191548347473145, 11.998866081237793, 12.806182861328125, 13.613500595092773, 14.420818328857422, 15.22813606262207, 16.03545379638672, 16.842769622802734, 17.650087356567383, 18.45740509033203, 19.26472282409668, 20.072040557861328, 20.879356384277344, 21.686674118041992, 22.49399185180664, 23.30130958557129, 24.108627319335938]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 4.0, 7.0, 10.0, 9.0, 10.0, 20.0, 13.0, 17.0, 24.0, 18.0, 29.0, 24.0, 29.0, 30.0, 41.0, 37.0, 43.0, 49.0, 50.0, 31.0, 45.0, 50.0, 41.0, 28.0, 52.0, 39.0, 39.0, 32.0, 36.0, 24.0, 22.0, 20.0, 11.0, 8.0, 15.0, 8.0, 11.0, 6.0, 6.0, 6.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.969585418701172, -11.603760719299316, -11.237936973571777, -10.872112274169922, -10.506288528442383, -10.140463829040527, -9.774639129638672, -9.408815383911133, -9.042990684509277, -8.677165985107422, -8.311342239379883, -7.945517539978027, -7.57969331741333, -7.213869094848633, -6.8480448722839355, -6.482220649719238, -6.116396427154541, -5.750572204589844, -5.3847479820251465, -5.018923759460449, -4.653099060058594, -4.2872748374938965, -3.921450614929199, -3.555626153945923, -3.1898019313812256, -2.8239777088165283, -2.458153247833252, -2.0923290252685547, -1.7265046834945679, -1.360680341720581, -0.9948561191558838, -0.6290316581726074, -0.26320743560791016, 0.10261687636375427, 0.4684411883354187, 0.8342654705047607, 1.2000898122787476, 1.5659141540527344, 1.9317383766174316, 2.297562837600708, 2.6633870601654053, 3.0292112827301025, 3.395035743713379, 3.760859966278076, 4.126684188842773, 4.492508888244629, 4.858332633972168, 5.224157333374023, 5.589981555938721, 5.955805778503418, 6.321630001068115, 6.6874542236328125, 7.053278923034668, 7.419103145599365, 7.7849273681640625, 8.150752067565918, 8.516575813293457, 8.882400512695312, 9.248224258422852, 9.614048957824707, 9.979872703552246, 10.345697402954102, 10.71152114868164, 11.077345848083496, 11.443170547485352]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 5.0, 2.0, 4.0, 10.0, 10.0, 19.0, 15.0, 21.0, 38.0, 40.0, 52.0, 73.0, 94.0, 109.0, 146.0, 197.0, 258.0, 315.0, 465.0, 651.0, 985.0, 1494.0, 2396.0, 4032.0, 7534.0, 15390.0, 40752.0, 3577404.0, 473719.0, 36671.0, 13747.0, 6909.0, 3680.0, 2245.0, 1445.0, 1049.0, 650.0, 448.0, 369.0, 248.0, 165.0, 129.0, 87.0, 67.0, 45.0, 30.0, 20.0, 23.0, 6.0, 9.0, 9.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0], "bins": [-0.341796875, -0.3320159912109375, -0.322235107421875, -0.3124542236328125, -0.30267333984375, -0.2928924560546875, -0.283111572265625, -0.2733306884765625, -0.2635498046875, -0.2537689208984375, -0.243988037109375, -0.2342071533203125, -0.22442626953125, -0.2146453857421875, -0.204864501953125, -0.1950836181640625, -0.185302734375, -0.1755218505859375, -0.165740966796875, -0.1559600830078125, -0.14617919921875, -0.1363983154296875, -0.126617431640625, -0.1168365478515625, -0.1070556640625, -0.0972747802734375, -0.087493896484375, -0.0777130126953125, -0.06793212890625, -0.0581512451171875, -0.048370361328125, -0.0385894775390625, -0.02880859375, -0.0190277099609375, -0.009246826171875, 0.0005340576171875, 0.01031494140625, 0.0200958251953125, 0.029876708984375, 0.0396575927734375, 0.0494384765625, 0.0592193603515625, 0.069000244140625, 0.0787811279296875, 0.08856201171875, 0.0983428955078125, 0.108123779296875, 0.1179046630859375, 0.127685546875, 0.1374664306640625, 0.147247314453125, 0.1570281982421875, 0.16680908203125, 0.1765899658203125, 0.186370849609375, 0.1961517333984375, 0.2059326171875, 0.2157135009765625, 0.225494384765625, 0.2352752685546875, 0.24505615234375, 0.2548370361328125, 0.264617919921875, 0.2743988037109375, 0.2841796875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 6.0, 9.0, 8.0, 5.0, 16.0, 19.0, 23.0, 510.0, 282.0, 31.0, 20.0, 10.0, 12.0, 10.0, 5.0, 8.0, 1.0, 4.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.038909912109375, -0.0377955436706543, -0.036681175231933594, -0.03556680679321289, -0.03445243835449219, -0.033338069915771484, -0.03222370147705078, -0.031109333038330078, -0.029994964599609375, -0.028880596160888672, -0.02776622772216797, -0.026651859283447266, -0.025537490844726562, -0.02442312240600586, -0.023308753967285156, -0.022194385528564453, -0.02108001708984375, -0.019965648651123047, -0.018851280212402344, -0.01773691177368164, -0.016622543334960938, -0.015508174896240234, -0.014393806457519531, -0.013279438018798828, -0.012165069580078125, -0.011050701141357422, -0.009936332702636719, -0.008821964263916016, -0.0077075958251953125, -0.006593227386474609, -0.005478858947753906, -0.004364490509033203, -0.0032501220703125, -0.002135753631591797, -0.0010213851928710938, 9.298324584960938e-05, 0.0012073516845703125, 0.0023217201232910156, 0.0034360885620117188, 0.004550457000732422, 0.005664825439453125, 0.006779193878173828, 0.007893562316894531, 0.009007930755615234, 0.010122299194335938, 0.01123666763305664, 0.012351036071777344, 0.013465404510498047, 0.01457977294921875, 0.015694141387939453, 0.016808509826660156, 0.01792287826538086, 0.019037246704101562, 0.020151615142822266, 0.02126598358154297, 0.022380352020263672, 0.023494720458984375, 0.024609088897705078, 0.02572345733642578, 0.026837825775146484, 0.027952194213867188, 0.02906656265258789, 0.030180931091308594, 0.0312952995300293, 0.03240966796875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 1.0, 8.0, 13.0, 14.0, 16.0, 21.0, 23.0, 27.0, 51.0, 62.0, 103.0, 139.0, 249.0, 460.0, 1074.0, 3074.0, 12072.0, 60596.0, 848251.0, 3146459.0, 96679.0, 17528.0, 4555.0, 1552.0, 539.0, 255.0, 141.0, 75.0, 65.0, 44.0, 41.0, 22.0, 23.0, 14.0, 10.0, 9.0, 6.0, 1.0, 4.0, 5.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.51904296875, -0.5046730041503906, -0.49030303955078125, -0.4759330749511719, -0.4615631103515625, -0.4471931457519531, -0.43282318115234375, -0.4184532165527344, -0.404083251953125, -0.3897132873535156, -0.37534332275390625, -0.3609733581542969, -0.3466033935546875, -0.3322334289550781, -0.31786346435546875, -0.3034934997558594, -0.28912353515625, -0.2747535705566406, -0.26038360595703125, -0.24601364135742188, -0.2316436767578125, -0.21727371215820312, -0.20290374755859375, -0.18853378295898438, -0.174163818359375, -0.15979385375976562, -0.14542388916015625, -0.13105392456054688, -0.1166839599609375, -0.10231399536132812, -0.08794403076171875, -0.07357406616210938, -0.0592041015625, -0.044834136962890625, -0.03046417236328125, -0.016094207763671875, -0.0017242431640625, 0.012645721435546875, 0.02701568603515625, 0.041385650634765625, 0.055755615234375, 0.07012557983398438, 0.08449554443359375, 0.09886550903320312, 0.1132354736328125, 0.12760543823242188, 0.14197540283203125, 0.15634536743164062, 0.17071533203125, 0.18508529663085938, 0.19945526123046875, 0.21382522583007812, 0.2281951904296875, 0.24256515502929688, 0.25693511962890625, 0.2713050842285156, 0.285675048828125, 0.3000450134277344, 0.31441497802734375, 0.3287849426269531, 0.3431549072265625, 0.3575248718261719, 0.37189483642578125, 0.3862648010253906, 0.400634765625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 8.0, 9.0, 5.0, 11.0, 16.0, 14.0, 15.0, 22.0, 29.0, 44.0, 45.0, 73.0, 79.0, 94.0, 111.0, 184.0, 267.0, 573.0, 1177.0, 423.0, 213.0, 150.0, 97.0, 83.0, 76.0, 46.0, 52.0, 30.0, 27.0, 27.0, 17.0, 12.0, 16.0, 11.0, 4.0, 4.0, 5.0, 2.0, 8.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.08258056640625, -0.0803070068359375, -0.078033447265625, -0.0757598876953125, -0.073486328125, -0.0712127685546875, -0.068939208984375, -0.0666656494140625, -0.06439208984375, -0.0621185302734375, -0.059844970703125, -0.0575714111328125, -0.0552978515625, -0.0530242919921875, -0.050750732421875, -0.0484771728515625, -0.04620361328125, -0.0439300537109375, -0.041656494140625, -0.0393829345703125, -0.037109375, -0.0348358154296875, -0.032562255859375, -0.0302886962890625, -0.02801513671875, -0.0257415771484375, -0.023468017578125, -0.0211944580078125, -0.0189208984375, -0.0166473388671875, -0.014373779296875, -0.0121002197265625, -0.00982666015625, -0.0075531005859375, -0.005279541015625, -0.0030059814453125, -0.000732421875, 0.0015411376953125, 0.003814697265625, 0.0060882568359375, 0.00836181640625, 0.0106353759765625, 0.012908935546875, 0.0151824951171875, 0.0174560546875, 0.0197296142578125, 0.022003173828125, 0.0242767333984375, 0.02655029296875, 0.0288238525390625, 0.031097412109375, 0.0333709716796875, 0.03564453125, 0.0379180908203125, 0.040191650390625, 0.0424652099609375, 0.04473876953125, 0.0470123291015625, 0.049285888671875, 0.0515594482421875, 0.0538330078125, 0.0561065673828125, 0.058380126953125, 0.0606536865234375, 0.06292724609375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 7.0, 5.0, 12.0, 9.0, 14.0, 26.0, 47.0, 116.0, 201.0, 259.0, 121.0, 78.0, 39.0, 25.0, 22.0, 8.0, 9.0, 4.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4893340766429901, -0.4651179313659668, -0.44090181589126587, -0.41668567061424255, -0.39246952533721924, -0.3682534098625183, -0.344037264585495, -0.3198211193084717, -0.29560500383377075, -0.27138885855674744, -0.2471727430820465, -0.2229565978050232, -0.19874046742916107, -0.17452433705329895, -0.15030819177627563, -0.1260920614004135, -0.10187593102455139, -0.07765980064868927, -0.05344366282224655, -0.029227524995803833, -0.005011394619941711, 0.01920473575592041, 0.043420881032943726, 0.06763701140880585, 0.09185314178466797, 0.11606927216053009, 0.1402854025363922, 0.16450154781341553, 0.18871767818927765, 0.21293380856513977, 0.23714995384216309, 0.261366069316864, 0.28558218479156494, 0.30979833006858826, 0.3340144455432892, 0.3582305908203125, 0.3824467062950134, 0.40666285157203674, 0.43087899684906006, 0.455095112323761, 0.4793112576007843, 0.5035274028778076, 0.5277435183525085, 0.5519596338272095, 0.5761758089065552, 0.6003919243812561, 0.624608039855957, 0.6488242149353027, 0.6730403304100037, 0.6972564458847046, 0.7214726209640503, 0.7456887364387512, 0.7699048519134521, 0.7941210269927979, 0.8183371424674988, 0.8425532579421997, 0.8667694330215454, 0.8909855484962463, 0.915201723575592, 0.939417839050293, 0.9636339545249939, 0.9878500699996948, 1.0120662450790405, 1.0362824201583862, 1.0604984760284424]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 8.0, 3.0, 5.0, 3.0, 11.0, 7.0, 9.0, 20.0, 11.0, 26.0, 23.0, 30.0, 25.0, 33.0, 39.0, 31.0, 51.0, 44.0, 64.0, 45.0, 59.0, 49.0, 42.0, 29.0, 39.0, 39.0, 43.0, 41.0, 32.0, 25.0, 19.0, 17.0, 20.0, 16.0, 13.0, 9.0, 7.0, 3.0, 2.0, 5.0, 3.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.31900107860565186, -0.3084261119365692, -0.2978511452674866, -0.2872762084007263, -0.2767012417316437, -0.26612627506256104, -0.2555513083934784, -0.24497634172439575, -0.2344013750553131, -0.22382640838623047, -0.21325145661830902, -0.20267648994922638, -0.19210152328014374, -0.1815265715122223, -0.17095160484313965, -0.160376638174057, -0.14980168640613556, -0.13922671973705292, -0.12865176796913147, -0.11807680130004883, -0.10750183463096619, -0.09692687541246414, -0.0863519161939621, -0.07577694952487946, -0.06520199030637741, -0.05462702736258507, -0.044052064418792725, -0.03347710520029068, -0.022902142256498337, -0.012327179312705994, -0.001752220094203949, 0.008822746574878693, 0.019397705793380737, 0.02997266873717308, 0.040547631680965424, 0.05112259089946747, 0.06169755384325981, 0.07227251678705215, 0.0828474760055542, 0.09342244267463684, 0.10399740189313889, 0.11457236111164093, 0.12514732778072357, 0.13572227954864502, 0.14629724621772766, 0.1568722128868103, 0.16744717955589294, 0.17802214622497559, 0.18859709799289703, 0.19917206466197968, 0.20974701642990112, 0.22032198309898376, 0.2308969497680664, 0.24147191643714905, 0.2520468831062317, 0.26262181997299194, 0.2731967866420746, 0.2837717533111572, 0.29434671998023987, 0.3049216866493225, 0.31549662351608276, 0.3260715901851654, 0.33664655685424805, 0.3472215235233307, 0.35779649019241333]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 9.0, 7.0, 11.0, 12.0, 14.0, 24.0, 36.0, 36.0, 56.0, 90.0, 127.0, 230.0, 349.0, 608.0, 1076.0, 2081.0, 4363.0, 11942.0, 78115.0, 886422.0, 45485.0, 9622.0, 3598.0, 1736.0, 943.0, 561.0, 337.0, 212.0, 147.0, 100.0, 66.0, 44.0, 28.0, 16.0, 12.0, 11.0, 6.0, 9.0, 4.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.33447265625, -0.3244590759277344, -0.31444549560546875, -0.3044319152832031, -0.2944183349609375, -0.2844047546386719, -0.27439117431640625, -0.2643775939941406, -0.254364013671875, -0.24435043334960938, -0.23433685302734375, -0.22432327270507812, -0.2143096923828125, -0.20429611206054688, -0.19428253173828125, -0.18426895141601562, -0.17425537109375, -0.16424179077148438, -0.15422821044921875, -0.14421463012695312, -0.1342010498046875, -0.12418746948242188, -0.11417388916015625, -0.10416030883789062, -0.094146728515625, -0.08413314819335938, -0.07411956787109375, -0.06410598754882812, -0.0540924072265625, -0.044078826904296875, -0.03406524658203125, -0.024051666259765625, -0.0140380859375, -0.004024505615234375, 0.00598907470703125, 0.016002655029296875, 0.0260162353515625, 0.036029815673828125, 0.04604339599609375, 0.056056976318359375, 0.066070556640625, 0.07608413696289062, 0.08609771728515625, 0.09611129760742188, 0.1061248779296875, 0.11613845825195312, 0.12615203857421875, 0.13616561889648438, 0.14617919921875, 0.15619277954101562, 0.16620635986328125, 0.17621994018554688, 0.1862335205078125, 0.19624710083007812, 0.20626068115234375, 0.21627426147460938, 0.226287841796875, 0.23630142211914062, 0.24631500244140625, 0.2563285827636719, 0.2663421630859375, 0.2763557434082031, 0.28636932373046875, 0.2963829040527344, 0.306396484375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 11.0, 6.0, 7.0, 12.0, 30.0, 85.0, 161.0, 248.0, 195.0, 118.0, 40.0, 29.0, 11.0, 6.0, 4.0, 2.0, 7.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.03973388671875, -0.038556575775146484, -0.03737926483154297, -0.03620195388793945, -0.03502464294433594, -0.03384733200073242, -0.032670021057128906, -0.03149271011352539, -0.030315399169921875, -0.02913808822631836, -0.027960777282714844, -0.026783466339111328, -0.025606155395507812, -0.024428844451904297, -0.02325153350830078, -0.022074222564697266, -0.02089691162109375, -0.019719600677490234, -0.01854228973388672, -0.017364978790283203, -0.016187667846679688, -0.015010356903076172, -0.013833045959472656, -0.01265573501586914, -0.011478424072265625, -0.01030111312866211, -0.009123802185058594, -0.007946491241455078, -0.0067691802978515625, -0.005591869354248047, -0.004414558410644531, -0.0032372474670410156, -0.0020599365234375, -0.0008826255798339844, 0.00029468536376953125, 0.0014719963073730469, 0.0026493072509765625, 0.003826618194580078, 0.005003929138183594, 0.006181240081787109, 0.007358551025390625, 0.00853586196899414, 0.009713172912597656, 0.010890483856201172, 0.012067794799804688, 0.013245105743408203, 0.014422416687011719, 0.015599727630615234, 0.01677703857421875, 0.017954349517822266, 0.01913166046142578, 0.020308971405029297, 0.021486282348632812, 0.022663593292236328, 0.023840904235839844, 0.02501821517944336, 0.026195526123046875, 0.02737283706665039, 0.028550148010253906, 0.029727458953857422, 0.030904769897460938, 0.03208208084106445, 0.03325939178466797, 0.034436702728271484, 0.035614013671875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 5.0, 1.0, 5.0, 6.0, 7.0, 7.0, 13.0, 22.0, 30.0, 42.0, 62.0, 118.0, 243.0, 576.0, 1697.0, 7804.0, 76880.0, 886664.0, 64739.0, 6912.0, 1586.0, 554.0, 237.0, 134.0, 73.0, 48.0, 26.0, 19.0, 12.0, 9.0, 7.0, 7.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.67236328125, -0.6516571044921875, -0.630950927734375, -0.6102447509765625, -0.58953857421875, -0.5688323974609375, -0.548126220703125, -0.5274200439453125, -0.5067138671875, -0.4860076904296875, -0.465301513671875, -0.4445953369140625, -0.42388916015625, -0.4031829833984375, -0.382476806640625, -0.3617706298828125, -0.341064453125, -0.3203582763671875, -0.299652099609375, -0.2789459228515625, -0.25823974609375, -0.2375335693359375, -0.216827392578125, -0.1961212158203125, -0.1754150390625, -0.1547088623046875, -0.134002685546875, -0.1132965087890625, -0.09259033203125, -0.0718841552734375, -0.051177978515625, -0.0304718017578125, -0.009765625, 0.0109405517578125, 0.031646728515625, 0.0523529052734375, 0.07305908203125, 0.0937652587890625, 0.114471435546875, 0.1351776123046875, 0.1558837890625, 0.1765899658203125, 0.197296142578125, 0.2180023193359375, 0.23870849609375, 0.2594146728515625, 0.280120849609375, 0.3008270263671875, 0.321533203125, 0.3422393798828125, 0.362945556640625, 0.3836517333984375, 0.40435791015625, 0.4250640869140625, 0.445770263671875, 0.4664764404296875, 0.4871826171875, 0.5078887939453125, 0.528594970703125, 0.5493011474609375, 0.57000732421875, 0.5907135009765625, 0.611419677734375, 0.6321258544921875, 0.65283203125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 2.0, 6.0, 4.0, 7.0, 13.0, 12.0, 10.0, 7.0, 12.0, 28.0, 18.0, 27.0, 16.0, 38.0, 30.0, 50.0, 42.0, 51.0, 55.0, 51.0, 36.0, 46.0, 48.0, 47.0, 40.0, 43.0, 33.0, 35.0, 39.0, 29.0, 17.0, 21.0, 17.0, 15.0, 9.0, 11.0, 9.0, 10.0, 9.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.2054443359375, -0.20029354095458984, -0.1951427459716797, -0.18999195098876953, -0.18484115600585938, -0.17969036102294922, -0.17453956604003906, -0.1693887710571289, -0.16423797607421875, -0.1590871810913086, -0.15393638610839844, -0.14878559112548828, -0.14363479614257812, -0.13848400115966797, -0.1333332061767578, -0.12818241119384766, -0.1230316162109375, -0.11788082122802734, -0.11273002624511719, -0.10757923126220703, -0.10242843627929688, -0.09727764129638672, -0.09212684631347656, -0.0869760513305664, -0.08182525634765625, -0.0766744613647461, -0.07152366638183594, -0.06637287139892578, -0.061222076416015625, -0.05607128143310547, -0.05092048645019531, -0.045769691467285156, -0.040618896484375, -0.035468101501464844, -0.030317306518554688, -0.02516651153564453, -0.020015716552734375, -0.014864921569824219, -0.009714126586914062, -0.004563331604003906, 0.00058746337890625, 0.005738258361816406, 0.010889053344726562, 0.01603984832763672, 0.021190643310546875, 0.02634143829345703, 0.03149223327636719, 0.036643028259277344, 0.0417938232421875, 0.046944618225097656, 0.05209541320800781, 0.05724620819091797, 0.062397003173828125, 0.06754779815673828, 0.07269859313964844, 0.0778493881225586, 0.08300018310546875, 0.0881509780883789, 0.09330177307128906, 0.09845256805419922, 0.10360336303710938, 0.10875415802001953, 0.11390495300292969, 0.11905574798583984, 0.12420654296875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 6.0, 8.0, 9.0, 13.0, 26.0, 23.0, 60.0, 128.0, 310.0, 1042.0, 11773.0, 1028123.0, 5763.0, 787.0, 257.0, 92.0, 48.0, 30.0, 24.0, 12.0, 4.0, 8.0, 5.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3623046875, -1.310699462890625, -1.25909423828125, -1.207489013671875, -1.1558837890625, -1.104278564453125, -1.05267333984375, -1.001068115234375, -0.949462890625, -0.897857666015625, -0.84625244140625, -0.794647216796875, -0.7430419921875, -0.691436767578125, -0.63983154296875, -0.588226318359375, -0.53662109375, -0.485015869140625, -0.43341064453125, -0.381805419921875, -0.3302001953125, -0.278594970703125, -0.22698974609375, -0.175384521484375, -0.123779296875, -0.072174072265625, -0.02056884765625, 0.031036376953125, 0.0826416015625, 0.134246826171875, 0.18585205078125, 0.237457275390625, 0.2890625, 0.340667724609375, 0.39227294921875, 0.443878173828125, 0.4954833984375, 0.547088623046875, 0.59869384765625, 0.650299072265625, 0.701904296875, 0.753509521484375, 0.80511474609375, 0.856719970703125, 0.9083251953125, 0.959930419921875, 1.01153564453125, 1.063140869140625, 1.11474609375, 1.166351318359375, 1.21795654296875, 1.269561767578125, 1.3211669921875, 1.372772216796875, 1.42437744140625, 1.475982666015625, 1.527587890625, 1.579193115234375, 1.63079833984375, 1.682403564453125, 1.7340087890625, 1.785614013671875, 1.83721923828125, 1.888824462890625, 1.9404296875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 6.0, 9.0, 7.0, 12.0, 18.0, 19.0, 15.0, 40.0, 43.0, 50.0, 76.0, 88.0, 101.0, 121.0, 79.0, 88.0, 53.0, 50.0, 43.0, 17.0, 18.0, 13.0, 5.0, 11.0, 5.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-2.390146255493164e-05, -2.3270025849342346e-05, -2.2638589143753052e-05, -2.2007152438163757e-05, -2.1375715732574463e-05, -2.074427902698517e-05, -2.0112842321395874e-05, -1.948140561580658e-05, -1.8849968910217285e-05, -1.821853220462799e-05, -1.7587095499038696e-05, -1.6955658793449402e-05, -1.6324222087860107e-05, -1.5692785382270813e-05, -1.5061348676681519e-05, -1.4429911971092224e-05, -1.379847526550293e-05, -1.3167038559913635e-05, -1.253560185432434e-05, -1.1904165148735046e-05, -1.1272728443145752e-05, -1.0641291737556458e-05, -1.0009855031967163e-05, -9.378418326377869e-06, -8.746981620788574e-06, -8.11554491519928e-06, -7.484108209609985e-06, -6.852671504020691e-06, -6.2212347984313965e-06, -5.589798092842102e-06, -4.958361387252808e-06, -4.326924681663513e-06, -3.6954879760742188e-06, -3.0640512704849243e-06, -2.43261456489563e-06, -1.8011778593063354e-06, -1.169741153717041e-06, -5.383044481277466e-07, 9.313225746154785e-08, 7.245689630508423e-07, 1.3560056686401367e-06, 1.987442374229431e-06, 2.6188790798187256e-06, 3.25031578540802e-06, 3.8817524909973145e-06, 4.513189196586609e-06, 5.144625902175903e-06, 5.776062607765198e-06, 6.407499313354492e-06, 7.038936018943787e-06, 7.670372724533081e-06, 8.301809430122375e-06, 8.93324613571167e-06, 9.564682841300964e-06, 1.0196119546890259e-05, 1.0827556252479553e-05, 1.1458992958068848e-05, 1.2090429663658142e-05, 1.2721866369247437e-05, 1.3353303074836731e-05, 1.3984739780426025e-05, 1.461617648601532e-05, 1.5247613191604614e-05, 1.587904989719391e-05, 1.6510486602783203e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 8.0, 6.0, 7.0, 12.0, 14.0, 26.0, 21.0, 34.0, 45.0, 69.0, 79.0, 129.0, 170.0, 274.0, 396.0, 635.0, 944.0, 1561.0, 2854.0, 5747.0, 14440.0, 66956.0, 748509.0, 165300.0, 23671.0, 7775.0, 3479.0, 1902.0, 1212.0, 723.0, 477.0, 331.0, 202.0, 164.0, 97.0, 87.0, 43.0, 38.0, 25.0, 25.0, 15.0, 14.0, 16.0, 9.0, 2.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.278564453125, -0.27075958251953125, -0.2629547119140625, -0.25514984130859375, -0.247344970703125, -0.23954010009765625, -0.2317352294921875, -0.22393035888671875, -0.21612548828125, -0.20832061767578125, -0.2005157470703125, -0.19271087646484375, -0.184906005859375, -0.17710113525390625, -0.1692962646484375, -0.16149139404296875, -0.1536865234375, -0.14588165283203125, -0.1380767822265625, -0.13027191162109375, -0.122467041015625, -0.11466217041015625, -0.1068572998046875, -0.09905242919921875, -0.09124755859375, -0.08344268798828125, -0.0756378173828125, -0.06783294677734375, -0.060028076171875, -0.05222320556640625, -0.0444183349609375, -0.03661346435546875, -0.02880859375, -0.02100372314453125, -0.0131988525390625, -0.00539398193359375, 0.002410888671875, 0.01021575927734375, 0.0180206298828125, 0.02582550048828125, 0.03363037109375, 0.04143524169921875, 0.0492401123046875, 0.05704498291015625, 0.064849853515625, 0.07265472412109375, 0.0804595947265625, 0.08826446533203125, 0.0960693359375, 0.10387420654296875, 0.1116790771484375, 0.11948394775390625, 0.127288818359375, 0.13509368896484375, 0.1428985595703125, 0.15070343017578125, 0.15850830078125, 0.16631317138671875, 0.1741180419921875, 0.18192291259765625, 0.189727783203125, 0.19753265380859375, 0.2053375244140625, 0.21314239501953125, 0.220947265625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 4.0, 4.0, 4.0, 6.0, 7.0, 11.0, 30.0, 43.0, 71.0, 122.0, 226.0, 165.0, 110.0, 73.0, 45.0, 20.0, 16.0, 6.0, 11.0, 6.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2047119140625, -0.19680213928222656, -0.18889236450195312, -0.1809825897216797, -0.17307281494140625, -0.1651630401611328, -0.15725326538085938, -0.14934349060058594, -0.1414337158203125, -0.13352394104003906, -0.12561416625976562, -0.11770439147949219, -0.10979461669921875, -0.10188484191894531, -0.09397506713867188, -0.08606529235839844, -0.078155517578125, -0.07024574279785156, -0.062335968017578125, -0.05442619323730469, -0.04651641845703125, -0.03860664367675781, -0.030696868896484375, -0.022787094116210938, -0.0148773193359375, -0.0069675445556640625, 0.000942230224609375, 0.008852005004882812, 0.01676177978515625, 0.024671554565429688, 0.032581329345703125, 0.04049110412597656, 0.04840087890625, 0.05631065368652344, 0.06422042846679688, 0.07213020324707031, 0.08003997802734375, 0.08794975280761719, 0.09585952758789062, 0.10376930236816406, 0.1116790771484375, 0.11958885192871094, 0.12749862670898438, 0.1354084014892578, 0.14331817626953125, 0.1512279510498047, 0.15913772583007812, 0.16704750061035156, 0.174957275390625, 0.18286705017089844, 0.19077682495117188, 0.1986865997314453, 0.20659637451171875, 0.2145061492919922, 0.22241592407226562, 0.23032569885253906, 0.2382354736328125, 0.24614524841308594, 0.2540550231933594, 0.2619647979736328, 0.26987457275390625, 0.2777843475341797, 0.2856941223144531, 0.29360389709472656, 0.301513671875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 11.0, 10.0, 15.0, 59.0, 251.0, 422.0, 131.0, 50.0, 23.0, 13.0, 11.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.01239538192749, -3.870124340057373, -3.727853298187256, -3.5855822563171387, -3.4433112144470215, -3.3010401725769043, -3.158769130706787, -3.01649808883667, -2.8742270469665527, -2.7319560050964355, -2.5896849632263184, -2.447413921356201, -2.305142879486084, -2.162871837615967, -2.0206007957458496, -1.8783297538757324, -1.7360587120056152, -1.593787670135498, -1.4515166282653809, -1.3092455863952637, -1.1669745445251465, -1.0247035026550293, -0.8824324607849121, -0.7401614189147949, -0.5978903770446777, -0.45561933517456055, -0.31334829330444336, -0.17107725143432617, -0.028806209564208984, 0.1134648323059082, 0.2557358741760254, 0.3980069160461426, 0.540278434753418, 0.6825494766235352, 0.8248205184936523, 0.9670915603637695, 1.1093626022338867, 1.251633644104004, 1.393904685974121, 1.5361757278442383, 1.6784467697143555, 1.8207178115844727, 1.9629888534545898, 2.105259895324707, 2.247530937194824, 2.3898019790649414, 2.5320730209350586, 2.674344062805176, 2.816615104675293, 2.95888614654541, 3.1011571884155273, 3.2434282302856445, 3.3856992721557617, 3.527970314025879, 3.670241355895996, 3.8125123977661133, 3.9547834396362305, 4.097054481506348, 4.239325523376465, 4.381596565246582, 4.523867607116699, 4.666138648986816, 4.808409690856934, 4.950680732727051, 5.092951774597168]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 1.0, 3.0, 13.0, 12.0, 20.0, 30.0, 57.0, 101.0, 184.0, 210.0, 140.0, 101.0, 47.0, 20.0, 18.0, 11.0, 6.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.699883460998535, -3.581669807434082, -3.463456153869629, -3.345242500305176, -3.2270288467407227, -3.1088151931762695, -2.9906015396118164, -2.8723878860473633, -2.75417423248291, -2.635960578918457, -2.517746925354004, -2.399533271789551, -2.2813196182250977, -2.1631059646606445, -2.0448923110961914, -1.9266787767410278, -1.8084652423858643, -1.6902515888214111, -1.572037935256958, -1.4538242816925049, -1.3356106281280518, -1.2173969745635986, -1.099183440208435, -0.9809697866439819, -0.8627561330795288, -0.7445424795150757, -0.6263288259506226, -0.5081152319908142, -0.3899015784263611, -0.27168792486190796, -0.1534743309020996, -0.035260677337646484, 0.08295297622680664, 0.20116661489009857, 0.3193802535533905, 0.43759387731552124, 0.5558075308799744, 0.6740211844444275, 0.7922347784042358, 0.910448431968689, 1.028662085533142, 1.1468757390975952, 1.2650893926620483, 1.383302927017212, 1.501516580581665, 1.6197302341461182, 1.7379438877105713, 1.8561575412750244, 1.9743711948394775, 2.0925848484039307, 2.210798501968384, 2.329012155532837, 2.44722580909729, 2.565439462661743, 2.683652877807617, 2.8018665313720703, 2.9200801849365234, 3.0382938385009766, 3.1565074920654297, 3.274721145629883, 3.392934799194336, 3.511148452758789, 3.629362106323242, 3.7475757598876953, 3.8657894134521484]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 6.0, 5.0, 7.0, 12.0, 16.0, 23.0, 64.0, 172.0, 1648.0, 4039815.0, 150873.0, 1316.0, 179.0, 51.0, 28.0, 19.0, 10.0, 11.0, 9.0, 4.0, 2.0, 2.0, 3.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8359375, -2.71221923828125, -2.5885009765625, -2.46478271484375, -2.341064453125, -2.21734619140625, -2.0936279296875, -1.96990966796875, -1.84619140625, -1.72247314453125, -1.5987548828125, -1.47503662109375, -1.351318359375, -1.22760009765625, -1.1038818359375, -0.98016357421875, -0.8564453125, -0.73272705078125, -0.6090087890625, -0.48529052734375, -0.361572265625, -0.23785400390625, -0.1141357421875, 0.00958251953125, 0.13330078125, 0.25701904296875, 0.3807373046875, 0.50445556640625, 0.628173828125, 0.75189208984375, 0.8756103515625, 0.99932861328125, 1.123046875, 1.24676513671875, 1.3704833984375, 1.49420166015625, 1.617919921875, 1.74163818359375, 1.8653564453125, 1.98907470703125, 2.11279296875, 2.23651123046875, 2.3602294921875, 2.48394775390625, 2.607666015625, 2.73138427734375, 2.8551025390625, 2.97882080078125, 3.1025390625, 3.22625732421875, 3.3499755859375, 3.47369384765625, 3.597412109375, 3.72113037109375, 3.8448486328125, 3.96856689453125, 4.09228515625, 4.21600341796875, 4.3397216796875, 4.46343994140625, 4.587158203125, 4.71087646484375, 4.8345947265625, 4.95831298828125, 5.08203125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 0.0, 6.0, 5.0, 8.0, 7.0, 13.0, 13.0, 19.0, 29.0, 60.0, 80.0, 98.0, 127.0, 147.0, 121.0, 86.0, 67.0, 31.0, 17.0, 14.0, 11.0, 6.0, 3.0, 6.0, 2.0, 5.0, 2.0, 1.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0295562744140625, -0.028656959533691406, -0.027757644653320312, -0.02685832977294922, -0.025959014892578125, -0.02505970001220703, -0.024160385131835938, -0.023261070251464844, -0.02236175537109375, -0.021462440490722656, -0.020563125610351562, -0.01966381072998047, -0.018764495849609375, -0.01786518096923828, -0.016965866088867188, -0.016066551208496094, -0.015167236328125, -0.014267921447753906, -0.013368606567382812, -0.012469291687011719, -0.011569976806640625, -0.010670661926269531, -0.009771347045898438, -0.008872032165527344, -0.00797271728515625, -0.007073402404785156, -0.0061740875244140625, -0.005274772644042969, -0.004375457763671875, -0.0034761428833007812, -0.0025768280029296875, -0.0016775131225585938, -0.0007781982421875, 0.00012111663818359375, 0.0010204315185546875, 0.0019197463989257812, 0.002819061279296875, 0.0037183761596679688, 0.0046176910400390625, 0.005517005920410156, 0.00641632080078125, 0.007315635681152344, 0.008214950561523438, 0.009114265441894531, 0.010013580322265625, 0.010912895202636719, 0.011812210083007812, 0.012711524963378906, 0.01361083984375, 0.014510154724121094, 0.015409469604492188, 0.01630878448486328, 0.017208099365234375, 0.01810741424560547, 0.019006729125976562, 0.019906044006347656, 0.02080535888671875, 0.021704673767089844, 0.022603988647460938, 0.02350330352783203, 0.024402618408203125, 0.02530193328857422, 0.026201248168945312, 0.027100563049316406, 0.0279998779296875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 6.0, 7.0, 8.0, 26.0, 19.0, 42.0, 54.0, 103.0, 174.0, 408.0, 964.0, 2701.0, 9447.0, 53191.0, 3809455.0, 289487.0, 20720.0, 4973.0, 1563.0, 535.0, 206.0, 82.0, 50.0, 24.0, 12.0, 8.0, 5.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.009765625, -0.9866905212402344, -0.9636154174804688, -0.9405403137207031, -0.9174652099609375, -0.8943901062011719, -0.8713150024414062, -0.8482398986816406, -0.825164794921875, -0.8020896911621094, -0.7790145874023438, -0.7559394836425781, -0.7328643798828125, -0.7097892761230469, -0.6867141723632812, -0.6636390686035156, -0.64056396484375, -0.6174888610839844, -0.5944137573242188, -0.5713386535644531, -0.5482635498046875, -0.5251884460449219, -0.5021133422851562, -0.4790382385253906, -0.455963134765625, -0.4328880310058594, -0.40981292724609375, -0.3867378234863281, -0.3636627197265625, -0.3405876159667969, -0.31751251220703125, -0.2944374084472656, -0.2713623046875, -0.24828720092773438, -0.22521209716796875, -0.20213699340820312, -0.1790618896484375, -0.15598678588867188, -0.13291168212890625, -0.10983657836914062, -0.086761474609375, -0.06368637084960938, -0.04061126708984375, -0.017536163330078125, 0.0055389404296875, 0.028614044189453125, 0.05168914794921875, 0.07476425170898438, 0.09783935546875, 0.12091445922851562, 0.14398956298828125, 0.16706466674804688, 0.1901397705078125, 0.21321487426757812, 0.23628997802734375, 0.2593650817871094, 0.282440185546875, 0.3055152893066406, 0.32859039306640625, 0.3516654968261719, 0.3747406005859375, 0.3978157043457031, 0.42089080810546875, 0.4439659118652344, 0.467041015625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 3.0, 5.0, 5.0, 4.0, 6.0, 0.0, 8.0, 10.0, 13.0, 17.0, 24.0, 32.0, 46.0, 77.0, 141.0, 392.0, 1618.0, 930.0, 280.0, 148.0, 80.0, 63.0, 33.0, 35.0, 23.0, 8.0, 10.0, 10.0, 7.0, 9.0, 8.0, 8.0, 5.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.056396484375, -0.054781436920166016, -0.05316638946533203, -0.05155134201049805, -0.04993629455566406, -0.04832124710083008, -0.046706199645996094, -0.04509115219116211, -0.043476104736328125, -0.04186105728149414, -0.040246009826660156, -0.03863096237182617, -0.03701591491699219, -0.0354008674621582, -0.03378582000732422, -0.032170772552490234, -0.03055572509765625, -0.028940677642822266, -0.02732563018798828, -0.025710582733154297, -0.024095535278320312, -0.022480487823486328, -0.020865440368652344, -0.01925039291381836, -0.017635345458984375, -0.01602029800415039, -0.014405250549316406, -0.012790203094482422, -0.011175155639648438, -0.009560108184814453, -0.007945060729980469, -0.006330013275146484, -0.0047149658203125, -0.0030999183654785156, -0.0014848709106445312, 0.00013017654418945312, 0.0017452239990234375, 0.003360271453857422, 0.004975318908691406, 0.006590366363525391, 0.008205413818359375, 0.00982046127319336, 0.011435508728027344, 0.013050556182861328, 0.014665603637695312, 0.016280651092529297, 0.01789569854736328, 0.019510746002197266, 0.02112579345703125, 0.022740840911865234, 0.02435588836669922, 0.025970935821533203, 0.027585983276367188, 0.029201030731201172, 0.030816078186035156, 0.03243112564086914, 0.034046173095703125, 0.03566122055053711, 0.037276268005371094, 0.03889131546020508, 0.04050636291503906, 0.04212141036987305, 0.04373645782470703, 0.045351505279541016, 0.046966552734375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 23.0, 582.0, 393.0, 12.0, 4.0], "bins": [-5.504264831542969, -5.414007186889648, -5.323750019073486, -5.233492374420166, -5.143235206604004, -5.052977561950684, -4.9627203941345215, -4.872462749481201, -4.782205581665039, -4.691947937011719, -4.601690769195557, -4.511433124542236, -4.421175956726074, -4.330918312072754, -4.240661144256592, -4.1504034996032715, -4.060146331787109, -3.969888925552368, -3.879631519317627, -3.7893741130828857, -3.6991167068481445, -3.6088593006134033, -3.518601894378662, -3.428344249725342, -3.3380866050720215, -3.2478291988372803, -3.157571792602539, -3.067314386367798, -2.9770569801330566, -2.8867995738983154, -2.796542167663574, -2.706284523010254, -2.6160271167755127, -2.5257697105407715, -2.4355123043060303, -2.345254898071289, -2.254997491836548, -2.1647400856018066, -2.0744824409484863, -1.9842251539230347, -1.893967866897583, -1.8037104606628418, -1.7134530544281006, -1.6231956481933594, -1.5329382419586182, -1.442680835723877, -1.3524233102798462, -1.262165904045105, -1.1719083786010742, -1.081650972366333, -0.9913935661315918, -0.9011361002922058, -0.8108786940574646, -0.7206212878227234, -0.6303638219833374, -0.5401064157485962, -0.44984906911849976, -0.35959166288375854, -0.26933422684669495, -0.17907679080963135, -0.08881938457489014, 0.0014380216598510742, 0.09169548749923706, 0.18195289373397827, 0.2722102999687195]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 7.0, 1.0, 6.0, 10.0, 12.0, 27.0, 45.0, 64.0, 105.0, 128.0, 143.0, 119.0, 104.0, 74.0, 57.0, 34.0, 19.0, 10.0, 8.0, 6.0, 3.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3847852945327759, -0.37370383739471436, -0.36262235045433044, -0.3515408933162689, -0.340459406375885, -0.3293779492378235, -0.31829649209976196, -0.30721500515937805, -0.29613354802131653, -0.285052090883255, -0.2739706039428711, -0.26288914680480957, -0.25180765986442566, -0.24072620272636414, -0.22964473068714142, -0.2185632586479187, -0.20748178660869598, -0.19640031456947327, -0.18531884253025055, -0.17423737049102783, -0.1631559133529663, -0.1520744413137436, -0.14099296927452087, -0.12991151213645935, -0.11883003264665604, -0.10774856060743332, -0.0966670960187912, -0.08558562397956848, -0.07450415194034576, -0.06342268735170364, -0.052341215312480927, -0.041259750723838806, -0.03017827868461609, -0.01909681037068367, -0.008015340194106102, 0.003066129982471466, 0.014147598296403885, 0.025229066610336304, 0.03631053864955902, 0.04739200323820114, 0.05847347527742386, 0.06955494731664658, 0.0806364119052887, 0.09171788394451141, 0.10279935598373413, 0.11388082057237625, 0.12496229261159897, 0.1360437572002411, 0.1471252292394638, 0.15820670127868652, 0.16928817331790924, 0.18036964535713196, 0.19145110249519348, 0.2025325745344162, 0.21361404657363892, 0.22469550371170044, 0.23577699065208435, 0.24685846269130707, 0.2579399347305298, 0.2690213918685913, 0.2801028788089752, 0.29118433594703674, 0.30226582288742065, 0.3133472800254822, 0.3244287371635437]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 7.0, 6.0, 10.0, 8.0, 23.0, 29.0, 44.0, 81.0, 96.0, 158.0, 237.0, 348.0, 539.0, 825.0, 1350.0, 2150.0, 3789.0, 6618.0, 12405.0, 27804.0, 76294.0, 292975.0, 445727.0, 106608.0, 35804.0, 15531.0, 7838.0, 4426.0, 2475.0, 1554.0, 952.0, 630.0, 417.0, 268.0, 185.0, 106.0, 71.0, 57.0, 47.0, 19.0, 19.0, 12.0, 9.0, 7.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1591796875, -0.15437698364257812, -0.14957427978515625, -0.14477157592773438, -0.1399688720703125, -0.13516616821289062, -0.13036346435546875, -0.12556076049804688, -0.120758056640625, -0.11595535278320312, -0.11115264892578125, -0.10634994506835938, -0.1015472412109375, -0.09674453735351562, -0.09194183349609375, -0.08713912963867188, -0.08233642578125, -0.07753372192382812, -0.07273101806640625, -0.06792831420898438, -0.0631256103515625, -0.058322906494140625, -0.05352020263671875, -0.048717498779296875, -0.043914794921875, -0.039112091064453125, -0.03430938720703125, -0.029506683349609375, -0.0247039794921875, -0.019901275634765625, -0.01509857177734375, -0.010295867919921875, -0.0054931640625, -0.000690460205078125, 0.00411224365234375, 0.008914947509765625, 0.0137176513671875, 0.018520355224609375, 0.02332305908203125, 0.028125762939453125, 0.032928466796875, 0.037731170654296875, 0.04253387451171875, 0.047336578369140625, 0.0521392822265625, 0.056941986083984375, 0.06174468994140625, 0.06654739379882812, 0.07135009765625, 0.07615280151367188, 0.08095550537109375, 0.08575820922851562, 0.0905609130859375, 0.09536361694335938, 0.10016632080078125, 0.10496902465820312, 0.109771728515625, 0.11457443237304688, 0.11937713623046875, 0.12417984008789062, 0.1289825439453125, 0.13378524780273438, 0.13858795166015625, 0.14339065551757812, 0.148193359375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 3.0, 3.0, 5.0, 4.0, 1.0, 6.0, 0.0, 9.0, 8.0, 13.0, 11.0, 13.0, 19.0, 32.0, 46.0, 43.0, 63.0, 74.0, 83.0, 78.0, 80.0, 84.0, 52.0, 48.0, 60.0, 41.0, 32.0, 19.0, 12.0, 10.0, 12.0, 8.0, 9.0, 2.0, 5.0, 5.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0170745849609375, -0.01655292510986328, -0.016031265258789062, -0.015509605407714844, -0.014987945556640625, -0.014466285705566406, -0.013944625854492188, -0.013422966003417969, -0.01290130615234375, -0.012379646301269531, -0.011857986450195312, -0.011336326599121094, -0.010814666748046875, -0.010293006896972656, -0.009771347045898438, -0.009249687194824219, -0.00872802734375, -0.008206367492675781, -0.0076847076416015625, -0.007163047790527344, -0.006641387939453125, -0.006119728088378906, -0.0055980682373046875, -0.005076408386230469, -0.00455474853515625, -0.004033088684082031, -0.0035114288330078125, -0.0029897689819335938, -0.002468109130859375, -0.0019464492797851562, -0.0014247894287109375, -0.0009031295776367188, -0.0003814697265625, 0.00014019012451171875, 0.0006618499755859375, 0.0011835098266601562, 0.001705169677734375, 0.0022268295288085938, 0.0027484893798828125, 0.0032701492309570312, 0.00379180908203125, 0.004313468933105469, 0.0048351287841796875, 0.005356788635253906, 0.005878448486328125, 0.006400108337402344, 0.0069217681884765625, 0.007443428039550781, 0.007965087890625, 0.008486747741699219, 0.009008407592773438, 0.009530067443847656, 0.010051727294921875, 0.010573387145996094, 0.011095046997070312, 0.011616706848144531, 0.01213836669921875, 0.012660026550292969, 0.013181686401367188, 0.013703346252441406, 0.014225006103515625, 0.014746665954589844, 0.015268325805664062, 0.01578998565673828, 0.0163116455078125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 1.0, 2.0, 6.0, 3.0, 2.0, 3.0, 2.0, 5.0, 7.0, 9.0, 24.0, 86.0, 831.0, 24777.0, 969591.0, 51712.0, 1303.0, 109.0, 34.0, 9.0, 7.0, 3.0, 7.0, 4.0, 3.0, 3.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.548828125, -0.523406982421875, -0.49798583984375, -0.472564697265625, -0.4471435546875, -0.421722412109375, -0.39630126953125, -0.370880126953125, -0.345458984375, -0.320037841796875, -0.29461669921875, -0.269195556640625, -0.2437744140625, -0.218353271484375, -0.19293212890625, -0.167510986328125, -0.14208984375, -0.116668701171875, -0.09124755859375, -0.065826416015625, -0.0404052734375, -0.014984130859375, 0.01043701171875, 0.035858154296875, 0.061279296875, 0.086700439453125, 0.11212158203125, 0.137542724609375, 0.1629638671875, 0.188385009765625, 0.21380615234375, 0.239227294921875, 0.2646484375, 0.290069580078125, 0.31549072265625, 0.340911865234375, 0.3663330078125, 0.391754150390625, 0.41717529296875, 0.442596435546875, 0.468017578125, 0.493438720703125, 0.51885986328125, 0.544281005859375, 0.5697021484375, 0.595123291015625, 0.62054443359375, 0.645965576171875, 0.67138671875, 0.696807861328125, 0.72222900390625, 0.747650146484375, 0.7730712890625, 0.798492431640625, 0.82391357421875, 0.849334716796875, 0.874755859375, 0.900177001953125, 0.92559814453125, 0.951019287109375, 0.9764404296875, 1.001861572265625, 1.02728271484375, 1.052703857421875, 1.078125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 6.0, 7.0, 6.0, 5.0, 11.0, 10.0, 18.0, 15.0, 19.0, 18.0, 29.0, 15.0, 25.0, 37.0, 33.0, 33.0, 42.0, 28.0, 36.0, 46.0, 44.0, 41.0, 45.0, 30.0, 41.0, 43.0, 46.0, 32.0, 40.0, 27.0, 25.0, 26.0, 26.0, 14.0, 13.0, 15.0, 8.0, 11.0, 11.0, 7.0, 7.0, 5.0, 6.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.079833984375, -0.07739734649658203, -0.07496070861816406, -0.0725240707397461, -0.07008743286132812, -0.06765079498291016, -0.06521415710449219, -0.06277751922607422, -0.06034088134765625, -0.05790424346923828, -0.05546760559082031, -0.053030967712402344, -0.050594329833984375, -0.048157691955566406, -0.04572105407714844, -0.04328441619873047, -0.0408477783203125, -0.03841114044189453, -0.03597450256347656, -0.033537864685058594, -0.031101226806640625, -0.028664588928222656, -0.026227951049804688, -0.02379131317138672, -0.02135467529296875, -0.01891803741455078, -0.016481399536132812, -0.014044761657714844, -0.011608123779296875, -0.009171485900878906, -0.0067348480224609375, -0.004298210144042969, -0.001861572265625, 0.0005750656127929688, 0.0030117034912109375, 0.005448341369628906, 0.007884979248046875, 0.010321617126464844, 0.012758255004882812, 0.015194892883300781, 0.01763153076171875, 0.02006816864013672, 0.022504806518554688, 0.024941444396972656, 0.027378082275390625, 0.029814720153808594, 0.03225135803222656, 0.03468799591064453, 0.0371246337890625, 0.03956127166748047, 0.04199790954589844, 0.044434547424316406, 0.046871185302734375, 0.049307823181152344, 0.05174446105957031, 0.05418109893798828, 0.05661773681640625, 0.05905437469482422, 0.06149101257324219, 0.06392765045166016, 0.06636428833007812, 0.0688009262084961, 0.07123756408691406, 0.07367420196533203, 0.07611083984375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 5.0, 4.0, 9.0, 12.0, 17.0, 43.0, 175.0, 1856.0, 1031695.0, 14203.0, 382.0, 81.0, 23.0, 17.0, 10.0, 8.0, 8.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.12890625, -2.075286865234375, -2.02166748046875, -1.968048095703125, -1.9144287109375, -1.860809326171875, -1.80718994140625, -1.753570556640625, -1.699951171875, -1.646331787109375, -1.59271240234375, -1.539093017578125, -1.4854736328125, -1.431854248046875, -1.37823486328125, -1.324615478515625, -1.27099609375, -1.217376708984375, -1.16375732421875, -1.110137939453125, -1.0565185546875, -1.002899169921875, -0.94927978515625, -0.895660400390625, -0.842041015625, -0.788421630859375, -0.73480224609375, -0.681182861328125, -0.6275634765625, -0.573944091796875, -0.52032470703125, -0.466705322265625, -0.4130859375, -0.359466552734375, -0.30584716796875, -0.252227783203125, -0.1986083984375, -0.144989013671875, -0.09136962890625, -0.037750244140625, 0.015869140625, 0.069488525390625, 0.12310791015625, 0.176727294921875, 0.2303466796875, 0.283966064453125, 0.33758544921875, 0.391204833984375, 0.44482421875, 0.498443603515625, 0.55206298828125, 0.605682373046875, 0.6593017578125, 0.712921142578125, 0.76654052734375, 0.820159912109375, 0.873779296875, 0.927398681640625, 0.98101806640625, 1.034637451171875, 1.0882568359375, 1.141876220703125, 1.19549560546875, 1.249114990234375, 1.302734375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 10.0, 14.0, 20.0, 21.0, 53.0, 142.0, 335.0, 211.0, 78.0, 35.0, 25.0, 10.0, 10.0, 4.0, 7.0, 0.0, 7.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.679794311523438e-05, -9.392388164997101e-05, -9.104982018470764e-05, -8.817575871944427e-05, -8.530169725418091e-05, -8.242763578891754e-05, -7.955357432365417e-05, -7.667951285839081e-05, -7.380545139312744e-05, -7.093138992786407e-05, -6.805732846260071e-05, -6.518326699733734e-05, -6.230920553207397e-05, -5.943514406681061e-05, -5.656108260154724e-05, -5.3687021136283875e-05, -5.081295967102051e-05, -4.793889820575714e-05, -4.5064836740493774e-05, -4.219077527523041e-05, -3.931671380996704e-05, -3.6442652344703674e-05, -3.356859087944031e-05, -3.069452941417694e-05, -2.7820467948913574e-05, -2.4946406483650208e-05, -2.207234501838684e-05, -1.9198283553123474e-05, -1.6324222087860107e-05, -1.345016062259674e-05, -1.0576099157333374e-05, -7.702037692070007e-06, -4.827976226806641e-06, -1.953914761543274e-06, 9.201467037200928e-07, 3.7942081689834595e-06, 6.668269634246826e-06, 9.542331099510193e-06, 1.241639256477356e-05, 1.5290454030036926e-05, 1.8164515495300293e-05, 2.103857696056366e-05, 2.3912638425827026e-05, 2.6786699891090393e-05, 2.966076135635376e-05, 3.2534822821617126e-05, 3.540888428688049e-05, 3.828294575214386e-05, 4.1157007217407227e-05, 4.403106868267059e-05, 4.690513014793396e-05, 4.977919161319733e-05, 5.265325307846069e-05, 5.552731454372406e-05, 5.840137600898743e-05, 6.12754374742508e-05, 6.414949893951416e-05, 6.702356040477753e-05, 6.98976218700409e-05, 7.277168333530426e-05, 7.564574480056763e-05, 7.8519806265831e-05, 8.139386773109436e-05, 8.426792919635773e-05, 8.71419906616211e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 12.0, 5.0, 14.0, 21.0, 28.0, 36.0, 64.0, 93.0, 166.0, 268.0, 473.0, 883.0, 2018.0, 5160.0, 16673.0, 73675.0, 505068.0, 368448.0, 54522.0, 13125.0, 4251.0, 1725.0, 768.0, 401.0, 255.0, 145.0, 90.0, 55.0, 35.0, 21.0, 15.0, 12.0, 12.0, 6.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2310791015625, -0.22446060180664062, -0.21784210205078125, -0.21122360229492188, -0.2046051025390625, -0.19798660278320312, -0.19136810302734375, -0.18474960327148438, -0.178131103515625, -0.17151260375976562, -0.16489410400390625, -0.15827560424804688, -0.1516571044921875, -0.14503860473632812, -0.13842010498046875, -0.13180160522460938, -0.12518310546875, -0.11856460571289062, -0.11194610595703125, -0.10532760620117188, -0.0987091064453125, -0.09209060668945312, -0.08547210693359375, -0.07885360717773438, -0.072235107421875, -0.06561660766601562, -0.05899810791015625, -0.052379608154296875, -0.0457611083984375, -0.039142608642578125, -0.03252410888671875, -0.025905609130859375, -0.019287109375, -0.012668609619140625, -0.00605010986328125, 0.000568389892578125, 0.0071868896484375, 0.013805389404296875, 0.02042388916015625, 0.027042388916015625, 0.033660888671875, 0.040279388427734375, 0.04689788818359375, 0.053516387939453125, 0.0601348876953125, 0.06675338745117188, 0.07337188720703125, 0.07999038696289062, 0.08660888671875, 0.09322738647460938, 0.09984588623046875, 0.10646438598632812, 0.1130828857421875, 0.11970138549804688, 0.12631988525390625, 0.13293838500976562, 0.139556884765625, 0.14617538452148438, 0.15279388427734375, 0.15941238403320312, 0.1660308837890625, 0.17264938354492188, 0.17926788330078125, 0.18588638305664062, 0.1925048828125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 5.0, 11.0, 10.0, 19.0, 37.0, 38.0, 42.0, 76.0, 116.0, 132.0, 140.0, 103.0, 78.0, 56.0, 37.0, 39.0, 22.0, 12.0, 7.0, 8.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1575927734375, -0.1531238555908203, -0.14865493774414062, -0.14418601989746094, -0.13971710205078125, -0.13524818420410156, -0.13077926635742188, -0.1263103485107422, -0.1218414306640625, -0.11737251281738281, -0.11290359497070312, -0.10843467712402344, -0.10396575927734375, -0.09949684143066406, -0.09502792358398438, -0.09055900573730469, -0.086090087890625, -0.08162117004394531, -0.07715225219726562, -0.07268333435058594, -0.06821441650390625, -0.06374549865722656, -0.059276580810546875, -0.05480766296386719, -0.0503387451171875, -0.04586982727050781, -0.041400909423828125, -0.03693199157714844, -0.03246307373046875, -0.027994155883789062, -0.023525238037109375, -0.019056320190429688, -0.01458740234375, -0.010118484497070312, -0.005649566650390625, -0.0011806488037109375, 0.00328826904296875, 0.0077571868896484375, 0.012226104736328125, 0.016695022583007812, 0.0211639404296875, 0.025632858276367188, 0.030101776123046875, 0.03457069396972656, 0.03903961181640625, 0.04350852966308594, 0.047977447509765625, 0.05244636535644531, 0.056915283203125, 0.06138420104980469, 0.06585311889648438, 0.07032203674316406, 0.07479095458984375, 0.07925987243652344, 0.08372879028320312, 0.08819770812988281, 0.0926666259765625, 0.09713554382324219, 0.10160446166992188, 0.10607337951660156, 0.11054229736328125, 0.11501121520996094, 0.11948013305664062, 0.12394905090332031, 0.12841796875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 6.0, 15.0, 35.0, 47.0, 158.0, 323.0, 230.0, 105.0, 41.0, 15.0, 8.0, 11.0, 3.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8318114280700684, -1.7755467891693115, -1.7192820310592651, -1.6630172729492188, -1.606752634048462, -1.550487995147705, -1.4942232370376587, -1.4379584789276123, -1.3816938400268555, -1.3254292011260986, -1.2691644430160522, -1.2128996849060059, -1.156635046005249, -1.1003704071044922, -1.0441056489944458, -0.9878409504890442, -0.9315762519836426, -0.875311553478241, -0.8190468549728394, -0.7627821564674377, -0.7065174579620361, -0.6502527594566345, -0.5939880609512329, -0.5377233624458313, -0.4814586639404297, -0.4251939654350281, -0.36892926692962646, -0.31266456842422485, -0.25639986991882324, -0.20013517141342163, -0.14387047290802002, -0.08760577440261841, -0.03134119510650635, 0.024923503398895264, 0.08118820190429688, 0.1374529004096985, 0.1937175989151001, 0.2499822974205017, 0.3062469959259033, 0.36251169443130493, 0.41877639293670654, 0.47504109144210815, 0.5313057899475098, 0.5875704884529114, 0.643835186958313, 0.7000998854637146, 0.7563645839691162, 0.8126292824745178, 0.8688939809799194, 0.925158679485321, 0.9814233779907227, 1.0376880168914795, 1.0939527750015259, 1.1502175331115723, 1.206482172012329, 1.262746810913086, 1.3190115690231323, 1.3752763271331787, 1.4315409660339355, 1.4878056049346924, 1.5440703630447388, 1.6003351211547852, 1.656599760055542, 1.7128643989562988, 1.7691291570663452]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 6.0, 5.0, 3.0, 5.0, 5.0, 16.0, 13.0, 18.0, 25.0, 38.0, 47.0, 55.0, 63.0, 75.0, 82.0, 75.0, 74.0, 75.0, 53.0, 56.0, 54.0, 28.0, 25.0, 22.0, 19.0, 11.0, 10.0, 10.0, 7.0, 3.0, 7.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9033595323562622, -0.8758248686790466, -0.848290205001831, -0.8207556009292603, -0.7932209372520447, -0.7656862735748291, -0.7381516098976135, -0.710616946220398, -0.6830823421478271, -0.6555476784706116, -0.628013014793396, -0.6004784107208252, -0.5729437470436096, -0.545409083366394, -0.5178744196891785, -0.4903397560119629, -0.4628050923347473, -0.43527042865753174, -0.40773579478263855, -0.380201131105423, -0.3526664972305298, -0.3251318335533142, -0.29759716987609863, -0.27006250619888306, -0.24252787232398987, -0.21499322354793549, -0.1874585747718811, -0.15992391109466553, -0.13238926231861115, -0.10485461354255676, -0.07731994986534119, -0.049785301089286804, -0.022250711917877197, 0.0052839405834674835, 0.032818593084812164, 0.060353249311447144, 0.08788789808750153, 0.11542254686355591, 0.14295721054077148, 0.17049185931682587, 0.19802650809288025, 0.22556115686893463, 0.253095805644989, 0.2806304693222046, 0.30816513299942017, 0.33569976687431335, 0.36323443055152893, 0.3907690644264221, 0.4183037281036377, 0.44583839178085327, 0.47337302565574646, 0.5009076595306396, 0.5284423232078552, 0.5559769868850708, 0.5835116505622864, 0.611046314239502, 0.6385809183120728, 0.6661155819892883, 0.6936502456665039, 0.7211848497390747, 0.7487195134162903, 0.7762541770935059, 0.8037888407707214, 0.831323504447937, 0.8588581681251526]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 4.0, 8.0, 16.0, 12.0, 33.0, 49.0, 159.0, 2122.0, 3693807.0, 496830.0, 1054.0, 45.0, 33.0, 14.0, 14.0, 24.0, 16.0, 8.0, 10.0, 4.0, 6.0, 4.0, 6.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.1328125, -2.050689697265625, -1.96856689453125, -1.886444091796875, -1.8043212890625, -1.722198486328125, -1.64007568359375, -1.557952880859375, -1.475830078125, -1.393707275390625, -1.31158447265625, -1.229461669921875, -1.1473388671875, -1.065216064453125, -0.98309326171875, -0.900970458984375, -0.81884765625, -0.736724853515625, -0.65460205078125, -0.572479248046875, -0.4903564453125, -0.408233642578125, -0.32611083984375, -0.243988037109375, -0.161865234375, -0.079742431640625, 0.00238037109375, 0.084503173828125, 0.1666259765625, 0.248748779296875, 0.33087158203125, 0.412994384765625, 0.4951171875, 0.577239990234375, 0.65936279296875, 0.741485595703125, 0.8236083984375, 0.905731201171875, 0.98785400390625, 1.069976806640625, 1.152099609375, 1.234222412109375, 1.31634521484375, 1.398468017578125, 1.4805908203125, 1.562713623046875, 1.64483642578125, 1.726959228515625, 1.80908203125, 1.891204833984375, 1.97332763671875, 2.055450439453125, 2.1375732421875, 2.219696044921875, 2.30181884765625, 2.383941650390625, 2.466064453125, 2.548187255859375, 2.63031005859375, 2.712432861328125, 2.7945556640625, 2.876678466796875, 2.95880126953125, 3.040924072265625, 3.123046875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 9.0, 1.0, 3.0, 8.0, 6.0, 10.0, 12.0, 19.0, 18.0, 31.0, 35.0, 43.0, 44.0, 68.0, 61.0, 60.0, 74.0, 77.0, 65.0, 57.0, 54.0, 52.0, 50.0, 38.0, 24.0, 10.0, 10.0, 14.0, 9.0, 8.0, 10.0, 7.0, 2.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0186614990234375, -0.01820194721221924, -0.017742395401000977, -0.017282843589782715, -0.016823291778564453, -0.01636373996734619, -0.01590418815612793, -0.015444636344909668, -0.014985084533691406, -0.014525532722473145, -0.014065980911254883, -0.013606429100036621, -0.01314687728881836, -0.012687325477600098, -0.012227773666381836, -0.011768221855163574, -0.011308670043945312, -0.01084911823272705, -0.010389566421508789, -0.009930014610290527, -0.009470462799072266, -0.009010910987854004, -0.008551359176635742, -0.00809180736541748, -0.007632255554199219, -0.007172703742980957, -0.006713151931762695, -0.006253600120544434, -0.005794048309326172, -0.00533449649810791, -0.0048749446868896484, -0.004415392875671387, -0.003955841064453125, -0.0034962892532348633, -0.0030367374420166016, -0.00257718563079834, -0.002117633819580078, -0.0016580820083618164, -0.0011985301971435547, -0.000738978385925293, -0.00027942657470703125, 0.00018012523651123047, 0.0006396770477294922, 0.001099228858947754, 0.0015587806701660156, 0.0020183324813842773, 0.002477884292602539, 0.0029374361038208008, 0.0033969879150390625, 0.0038565397262573242, 0.004316091537475586, 0.004775643348693848, 0.005235195159912109, 0.005694746971130371, 0.006154298782348633, 0.0066138505935668945, 0.007073402404785156, 0.007532954216003418, 0.00799250602722168, 0.008452057838439941, 0.008911609649658203, 0.009371161460876465, 0.009830713272094727, 0.010290265083312988, 0.01074981689453125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 4.0, 6.0, 14.0, 64.0, 125.0, 352.0, 2651.0, 990444.0, 3197039.0, 3020.0, 365.0, 129.0, 56.0, 16.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.445556640625, -0.3961753845214844, -0.34679412841796875, -0.2974128723144531, -0.2480316162109375, -0.19865036010742188, -0.14926910400390625, -0.09988784790039062, -0.050506591796875, -0.001125335693359375, 0.04825592041015625, 0.09763717651367188, 0.1470184326171875, 0.19639968872070312, 0.24578094482421875, 0.2951622009277344, 0.34454345703125, 0.3939247131347656, 0.44330596923828125, 0.4926872253417969, 0.5420684814453125, 0.5914497375488281, 0.6408309936523438, 0.6902122497558594, 0.739593505859375, 0.7889747619628906, 0.8383560180664062, 0.8877372741699219, 0.9371185302734375, 0.9864997863769531, 1.0358810424804688, 1.0852622985839844, 1.1346435546875, 1.1840248107910156, 1.2334060668945312, 1.2827873229980469, 1.3321685791015625, 1.3815498352050781, 1.4309310913085938, 1.4803123474121094, 1.529693603515625, 1.5790748596191406, 1.6284561157226562, 1.6778373718261719, 1.7272186279296875, 1.7765998840332031, 1.8259811401367188, 1.8753623962402344, 1.92474365234375, 1.9741249084472656, 2.0235061645507812, 2.072887420654297, 2.1222686767578125, 2.171649932861328, 2.2210311889648438, 2.2704124450683594, 2.319793701171875, 2.3691749572753906, 2.4185562133789062, 2.467937469482422, 2.5173187255859375, 2.566699981689453, 2.6160812377929688, 2.6654624938964844, 2.71484375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 2.0, 7.0, 10.0, 14.0, 13.0, 16.0, 17.0, 28.0, 34.0, 39.0, 68.0, 124.0, 201.0, 395.0, 1714.0, 633.0, 249.0, 143.0, 112.0, 65.0, 52.0, 27.0, 28.0, 14.0, 17.0, 11.0, 6.0, 3.0, 8.0, 3.0, 4.0, 1.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.04986572265625, -0.04857921600341797, -0.04729270935058594, -0.046006202697753906, -0.044719696044921875, -0.043433189392089844, -0.04214668273925781, -0.04086017608642578, -0.03957366943359375, -0.03828716278076172, -0.03700065612792969, -0.035714149475097656, -0.034427642822265625, -0.033141136169433594, -0.03185462951660156, -0.03056812286376953, -0.0292816162109375, -0.02799510955810547, -0.026708602905273438, -0.025422096252441406, -0.024135589599609375, -0.022849082946777344, -0.021562576293945312, -0.02027606964111328, -0.01898956298828125, -0.01770305633544922, -0.016416549682617188, -0.015130043029785156, -0.013843536376953125, -0.012557029724121094, -0.011270523071289062, -0.009984016418457031, -0.008697509765625, -0.007411003112792969, -0.0061244964599609375, -0.004837989807128906, -0.003551483154296875, -0.0022649765014648438, -0.0009784698486328125, 0.00030803680419921875, 0.00159454345703125, 0.0028810501098632812, 0.0041675567626953125, 0.005454063415527344, 0.006740570068359375, 0.008027076721191406, 0.009313583374023438, 0.010600090026855469, 0.0118865966796875, 0.013173103332519531, 0.014459609985351562, 0.015746116638183594, 0.017032623291015625, 0.018319129943847656, 0.019605636596679688, 0.02089214324951172, 0.02217864990234375, 0.02346515655517578, 0.024751663208007812, 0.026038169860839844, 0.027324676513671875, 0.028611183166503906, 0.029897689819335938, 0.03118419647216797, 0.032470703125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 4.0, 6.0, 185.0, 765.0, 51.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7070081233978271, -0.5940101146697998, -0.4810120463371277, -0.36801400780677795, -0.2550159692764282, -0.14201796054840088, -0.02901989221572876, 0.08397817611694336, 0.1969761848449707, 0.30997422337532043, 0.42297226190567017, 0.5359703302383423, 0.6489683389663696, 0.761966347694397, 0.8749644160270691, 0.9879624843597412, 1.1009604930877686, 1.213958501815796, 1.3269565105438232, 1.4399546384811401, 1.5529526472091675, 1.6659506559371948, 1.7789487838745117, 1.891946792602539, 2.0049448013305664, 2.1179428100585938, 2.230940818786621, 2.3439388275146484, 2.456936836242676, 2.569934844970703, 2.6829330921173096, 2.795931100845337, 2.908928871154785, 3.0219268798828125, 3.13492488861084, 3.247922897338867, 3.3609209060668945, 3.473918914794922, 3.5869171619415283, 3.6999151706695557, 3.812913179397583, 3.9259111881256104, 4.038909435272217, 4.151907444000244, 4.2649054527282715, 4.377903461456299, 4.490901470184326, 4.6038994789123535, 4.716897487640381, 4.829895496368408, 4.9428935050964355, 5.055891513824463, 5.16888952255249, 5.281887531280518, 5.394885540008545, 5.5078840255737305, 5.620882034301758, 5.733880043029785, 5.8468780517578125, 5.95987606048584, 6.072874069213867, 6.1858720779418945, 6.298870086669922, 6.411868095397949, 6.524866104125977]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 10.0, 14.0, 17.0, 36.0, 45.0, 81.0, 101.0, 120.0, 117.0, 104.0, 95.0, 86.0, 76.0, 51.0, 23.0, 11.0, 8.0, 5.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.555079460144043, -0.5425467491149902, -0.5300140380859375, -0.5174813270568848, -0.504948616027832, -0.4924158751964569, -0.4798831641674042, -0.46735045313835144, -0.4548177421092987, -0.44228503108024597, -0.42975232005119324, -0.4172195792198181, -0.4046868681907654, -0.39215415716171265, -0.3796214461326599, -0.3670887351036072, -0.35455602407455444, -0.3420233130455017, -0.329490602016449, -0.31695789098739624, -0.3044251501560211, -0.2918924391269684, -0.27935972809791565, -0.2668270170688629, -0.2542942762374878, -0.24176156520843506, -0.22922883927822113, -0.2166961282491684, -0.20416341722011566, -0.19163069128990173, -0.179097980260849, -0.16656526923179626, -0.15403255820274353, -0.1414998471736908, -0.12896712124347687, -0.11643441021442413, -0.1039016991853714, -0.09136898070573807, -0.07883626222610474, -0.066303551197052, -0.05377083271741867, -0.04123811796307564, -0.028705401346087456, -0.016172684729099274, -0.003639969974756241, 0.008892744779586792, 0.021425463259220123, 0.03395817428827286, 0.04649089276790619, 0.05902360752224922, 0.07155632227659225, 0.08408904075622559, 0.09662175178527832, 0.10915447026491165, 0.12168718874454498, 0.13421989977359772, 0.14675262570381165, 0.15928533673286438, 0.1718180626630783, 0.18435077369213104, 0.19688348472118378, 0.2094162106513977, 0.22194892168045044, 0.23448163270950317, 0.2470143437385559]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 6.0, 3.0, 11.0, 6.0, 8.0, 19.0, 18.0, 23.0, 30.0, 36.0, 29.0, 41.0, 35.0, 51.0, 44.0, 41.0, 34651.0, 1013004.0, 73.0, 62.0, 47.0, 49.0, 44.0, 38.0, 37.0, 39.0, 28.0, 18.0, 12.0, 10.0, 6.0, 9.0, 7.0, 7.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.986328125, -3.869537353515625, -3.75274658203125, -3.635955810546875, -3.5191650390625, -3.402374267578125, -3.28558349609375, -3.168792724609375, -3.052001953125, -2.935211181640625, -2.81842041015625, -2.701629638671875, -2.5848388671875, -2.468048095703125, -2.35125732421875, -2.234466552734375, -2.11767578125, -2.000885009765625, -1.88409423828125, -1.767303466796875, -1.6505126953125, -1.533721923828125, -1.41693115234375, -1.300140380859375, -1.183349609375, -1.066558837890625, -0.94976806640625, -0.832977294921875, -0.7161865234375, -0.599395751953125, -0.48260498046875, -0.365814208984375, -0.2490234375, -0.132232666015625, -0.01544189453125, 0.101348876953125, 0.2181396484375, 0.334930419921875, 0.45172119140625, 0.568511962890625, 0.685302734375, 0.802093505859375, 0.91888427734375, 1.035675048828125, 1.1524658203125, 1.269256591796875, 1.38604736328125, 1.502838134765625, 1.61962890625, 1.736419677734375, 1.85321044921875, 1.970001220703125, 2.0867919921875, 2.203582763671875, 2.32037353515625, 2.437164306640625, 2.553955078125, 2.670745849609375, 2.78753662109375, 2.904327392578125, 3.0211181640625, 3.137908935546875, 3.25469970703125, 3.371490478515625, 3.48828125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 28.0, 132.0, 331.0, 348.0, 140.0, 34.0], "bins": [-0.1541748046875, -0.151644766330719, -0.149114727973938, -0.14658468961715698, -0.14405465126037598, -0.14152461290359497, -0.13899457454681396, -0.13646453619003296, -0.13393449783325195, -0.13140445947647095, -0.12887442111968994, -0.12634438276290894, -0.12381434440612793, -0.12128430604934692, -0.11875426769256592, -0.11622422933578491, -0.1136941909790039, -0.1111641526222229, -0.1086341142654419, -0.10610407590866089, -0.10357403755187988, -0.10104399919509888, -0.09851396083831787, -0.09598392248153687, -0.09345388412475586, -0.09092384576797485, -0.08839380741119385, -0.08586376905441284, -0.08333373069763184, -0.08080369234085083, -0.07827365398406982, -0.07574361562728882, -0.07321357727050781, -0.0706835389137268, -0.0681535005569458, -0.0656234622001648, -0.06309342384338379, -0.06056338548660278, -0.05803334712982178, -0.05550330877304077, -0.052973270416259766, -0.05044323205947876, -0.047913193702697754, -0.04538315534591675, -0.04285311698913574, -0.040323078632354736, -0.03779304027557373, -0.035263001918792725, -0.03273296356201172, -0.030202925205230713, -0.027672886848449707, -0.0251428484916687, -0.022612810134887695, -0.02008277177810669, -0.017552733421325684, -0.015022695064544678, -0.012492656707763672, -0.009962618350982666, -0.00743257999420166, -0.004902541637420654, -0.0023725032806396484, 0.00015753507614135742, 0.0026875734329223633, 0.005217611789703369, 0.007747650146484375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 4.0, 3.0, 3.0, 3.0, 10.0, 7.0, 15.0, 19.0, 30.0, 49.0, 76.0, 108.0, 189.0, 334.0, 640.0, 1477.0, 3423.0, 9683.0, 36352.0, 227415.0, 652153.0, 87030.0, 19478.0, 5828.0, 2181.0, 922.0, 446.0, 256.0, 148.0, 90.0, 64.0, 26.0, 26.0, 22.0, 16.0, 9.0, 12.0, 3.0, 2.0, 3.0, 6.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8779296875, -0.8523101806640625, -0.826690673828125, -0.8010711669921875, -0.77545166015625, -0.7498321533203125, -0.724212646484375, -0.6985931396484375, -0.6729736328125, -0.6473541259765625, -0.621734619140625, -0.5961151123046875, -0.57049560546875, -0.5448760986328125, -0.519256591796875, -0.4936370849609375, -0.468017578125, -0.4423980712890625, -0.416778564453125, -0.3911590576171875, -0.36553955078125, -0.3399200439453125, -0.314300537109375, -0.2886810302734375, -0.2630615234375, -0.2374420166015625, -0.211822509765625, -0.1862030029296875, -0.16058349609375, -0.1349639892578125, -0.109344482421875, -0.0837249755859375, -0.05810546875, -0.0324859619140625, -0.006866455078125, 0.0187530517578125, 0.04437255859375, 0.0699920654296875, 0.095611572265625, 0.1212310791015625, 0.1468505859375, 0.1724700927734375, 0.198089599609375, 0.2237091064453125, 0.24932861328125, 0.2749481201171875, 0.300567626953125, 0.3261871337890625, 0.351806640625, 0.3774261474609375, 0.403045654296875, 0.4286651611328125, 0.45428466796875, 0.4799041748046875, 0.505523681640625, 0.5311431884765625, 0.5567626953125, 0.5823822021484375, 0.608001708984375, 0.6336212158203125, 0.65924072265625, 0.6848602294921875, 0.710479736328125, 0.7360992431640625, 0.76171875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 3.0, 6.0, 1.0, 5.0, 8.0, 10.0, 13.0, 19.0, 16.0, 28.0, 33.0, 33.0, 42.0, 39.0, 60.0, 62.0, 76.0, 65.0, 59.0, 46.0, 57.0, 50.0, 54.0, 41.0, 29.0, 28.0, 20.0, 23.0, 26.0, 11.0, 15.0, 8.0, 6.0, 5.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1160888671875, -0.11192703247070312, -0.10776519775390625, -0.10360336303710938, -0.0994415283203125, -0.09527969360351562, -0.09111785888671875, -0.08695602416992188, -0.082794189453125, -0.07863235473632812, -0.07447052001953125, -0.07030868530273438, -0.0661468505859375, -0.061985015869140625, -0.05782318115234375, -0.053661346435546875, -0.04949951171875, -0.045337677001953125, -0.04117584228515625, -0.037014007568359375, -0.0328521728515625, -0.028690338134765625, -0.02452850341796875, -0.020366668701171875, -0.016204833984375, -0.012042999267578125, -0.00788116455078125, -0.003719329833984375, 0.0004425048828125, 0.004604339599609375, 0.00876617431640625, 0.012928009033203125, 0.01708984375, 0.021251678466796875, 0.02541351318359375, 0.029575347900390625, 0.0337371826171875, 0.037899017333984375, 0.04206085205078125, 0.046222686767578125, 0.050384521484375, 0.054546356201171875, 0.05870819091796875, 0.06287002563476562, 0.0670318603515625, 0.07119369506835938, 0.07535552978515625, 0.07951736450195312, 0.08367919921875, 0.08784103393554688, 0.09200286865234375, 0.09616470336914062, 0.1003265380859375, 0.10448837280273438, 0.10865020751953125, 0.11281204223632812, 0.116973876953125, 0.12113571166992188, 0.12529754638671875, 0.12945938110351562, 0.1336212158203125, 0.13778305053710938, 0.14194488525390625, 0.14610671997070312, 0.1502685546875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 8.0, 14.0, 23.0, 39.0, 72.0, 128.0, 238.0, 546.0, 1646.0, 5240.0, 22004.0, 149174.0, 744350.0, 101350.0, 17058.0, 4225.0, 1392.0, 523.0, 229.0, 100.0, 71.0, 43.0, 28.0, 12.0, 10.0, 10.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.841796875, -0.81500244140625, -0.7882080078125, -0.76141357421875, -0.734619140625, -0.70782470703125, -0.6810302734375, -0.65423583984375, -0.62744140625, -0.60064697265625, -0.5738525390625, -0.54705810546875, -0.520263671875, -0.49346923828125, -0.4666748046875, -0.43988037109375, -0.4130859375, -0.38629150390625, -0.3594970703125, -0.33270263671875, -0.305908203125, -0.27911376953125, -0.2523193359375, -0.22552490234375, -0.19873046875, -0.17193603515625, -0.1451416015625, -0.11834716796875, -0.091552734375, -0.06475830078125, -0.0379638671875, -0.01116943359375, 0.015625, 0.04241943359375, 0.0692138671875, 0.09600830078125, 0.122802734375, 0.14959716796875, 0.1763916015625, 0.20318603515625, 0.22998046875, 0.25677490234375, 0.2835693359375, 0.31036376953125, 0.337158203125, 0.36395263671875, 0.3907470703125, 0.41754150390625, 0.4443359375, 0.47113037109375, 0.4979248046875, 0.52471923828125, 0.551513671875, 0.57830810546875, 0.6051025390625, 0.63189697265625, 0.65869140625, 0.68548583984375, 0.7122802734375, 0.73907470703125, 0.765869140625, 0.79266357421875, 0.8194580078125, 0.84625244140625, 0.873046875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 4.0, 7.0, 7.0, 8.0, 11.0, 18.0, 28.0, 50.0, 49.0, 62.0, 100.0, 100.0, 135.0, 126.0, 85.0, 51.0, 40.0, 33.0, 19.0, 14.0, 13.0, 11.0, 7.0, 5.0, 7.0, 5.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-9.97781753540039e-05, -9.717419743537903e-05, -9.457021951675415e-05, -9.196624159812927e-05, -8.93622636795044e-05, -8.675828576087952e-05, -8.415430784225464e-05, -8.155032992362976e-05, -7.894635200500488e-05, -7.634237408638e-05, -7.373839616775513e-05, -7.113441824913025e-05, -6.853044033050537e-05, -6.592646241188049e-05, -6.332248449325562e-05, -6.071850657463074e-05, -5.811452865600586e-05, -5.551055073738098e-05, -5.2906572818756104e-05, -5.0302594900131226e-05, -4.769861698150635e-05, -4.509463906288147e-05, -4.249066114425659e-05, -3.9886683225631714e-05, -3.7282705307006836e-05, -3.467872738838196e-05, -3.207474946975708e-05, -2.9470771551132202e-05, -2.6866793632507324e-05, -2.4262815713882446e-05, -2.165883779525757e-05, -1.905485987663269e-05, -1.6450881958007812e-05, -1.3846904039382935e-05, -1.1242926120758057e-05, -8.638948202133179e-06, -6.034970283508301e-06, -3.430992364883423e-06, -8.270144462585449e-07, 1.776963472366333e-06, 4.380941390991211e-06, 6.984919309616089e-06, 9.588897228240967e-06, 1.2192875146865845e-05, 1.4796853065490723e-05, 1.74008309841156e-05, 2.000480890274048e-05, 2.2608786821365356e-05, 2.5212764739990234e-05, 2.7816742658615112e-05, 3.042072057723999e-05, 3.302469849586487e-05, 3.5628676414489746e-05, 3.8232654333114624e-05, 4.08366322517395e-05, 4.344061017036438e-05, 4.604458808898926e-05, 4.8648566007614136e-05, 5.1252543926239014e-05, 5.385652184486389e-05, 5.646049976348877e-05, 5.906447768211365e-05, 6.166845560073853e-05, 6.42724335193634e-05, 6.687641143798828e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 4.0, 5.0, 11.0, 11.0, 30.0, 31.0, 49.0, 75.0, 120.0, 239.0, 480.0, 1254.0, 4431.0, 22258.0, 215788.0, 728916.0, 61454.0, 9680.0, 2296.0, 749.0, 315.0, 134.0, 99.0, 58.0, 26.0, 21.0, 11.0, 10.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58447265625, -0.5582046508789062, -0.5319366455078125, -0.5056686401367188, -0.479400634765625, -0.45313262939453125, -0.4268646240234375, -0.40059661865234375, -0.37432861328125, -0.34806060791015625, -0.3217926025390625, -0.29552459716796875, -0.269256591796875, -0.24298858642578125, -0.2167205810546875, -0.19045257568359375, -0.1641845703125, -0.13791656494140625, -0.1116485595703125, -0.08538055419921875, -0.059112548828125, -0.03284454345703125, -0.0065765380859375, 0.01969146728515625, 0.04595947265625, 0.07222747802734375, 0.0984954833984375, 0.12476348876953125, 0.151031494140625, 0.17729949951171875, 0.2035675048828125, 0.22983551025390625, 0.256103515625, 0.28237152099609375, 0.3086395263671875, 0.33490753173828125, 0.361175537109375, 0.38744354248046875, 0.4137115478515625, 0.43997955322265625, 0.46624755859375, 0.49251556396484375, 0.5187835693359375, 0.5450515747070312, 0.571319580078125, 0.5975875854492188, 0.6238555908203125, 0.6501235961914062, 0.6763916015625, 0.7026596069335938, 0.7289276123046875, 0.7551956176757812, 0.781463623046875, 0.8077316284179688, 0.8339996337890625, 0.8602676391601562, 0.88653564453125, 0.9128036499023438, 0.9390716552734375, 0.9653396606445312, 0.991607666015625, 1.0178756713867188, 1.0441436767578125, 1.0704116821289062, 1.0966796875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 2.0, 5.0, 5.0, 9.0, 13.0, 13.0, 14.0, 22.0, 27.0, 32.0, 43.0, 76.0, 94.0, 105.0, 112.0, 96.0, 73.0, 65.0, 36.0, 37.0, 26.0, 22.0, 17.0, 15.0, 15.0, 8.0, 15.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.34912109375, -0.34107208251953125, -0.3330230712890625, -0.32497406005859375, -0.316925048828125, -0.30887603759765625, -0.3008270263671875, -0.29277801513671875, -0.28472900390625, -0.27667999267578125, -0.2686309814453125, -0.26058197021484375, -0.252532958984375, -0.24448394775390625, -0.2364349365234375, -0.22838592529296875, -0.2203369140625, -0.21228790283203125, -0.2042388916015625, -0.19618988037109375, -0.188140869140625, -0.18009185791015625, -0.1720428466796875, -0.16399383544921875, -0.15594482421875, -0.14789581298828125, -0.1398468017578125, -0.13179779052734375, -0.123748779296875, -0.11569976806640625, -0.1076507568359375, -0.09960174560546875, -0.091552734375, -0.08350372314453125, -0.0754547119140625, -0.06740570068359375, -0.059356689453125, -0.05130767822265625, -0.0432586669921875, -0.03520965576171875, -0.02716064453125, -0.01911163330078125, -0.0110626220703125, -0.00301361083984375, 0.005035400390625, 0.01308441162109375, 0.0211334228515625, 0.02918243408203125, 0.0372314453125, 0.04528045654296875, 0.0533294677734375, 0.06137847900390625, 0.069427490234375, 0.07747650146484375, 0.0855255126953125, 0.09357452392578125, 0.10162353515625, 0.10967254638671875, 0.1177215576171875, 0.12577056884765625, 0.133819580078125, 0.14186859130859375, 0.1499176025390625, 0.15796661376953125, 0.166015625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 7.0, 21.0, 119.0, 625.0, 210.0, 20.0, 8.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.046420097351074, -6.597654342651367, -6.148888111114502, -5.700121879577637, -5.25135612487793, -4.802590370178223, -4.353824138641357, -3.9050581455230713, -3.456292152404785, -3.007526159286499, -2.558760166168213, -2.1099941730499268, -1.6612281799316406, -1.2124621868133545, -0.7636961936950684, -0.3149302005767822, 0.1338357925415039, 0.58260178565979, 1.0313677787780762, 1.4801337718963623, 1.9288997650146484, 2.3776657581329346, 2.8264317512512207, 3.275197744369507, 3.723963737487793, 4.1727294921875, 4.621495723724365, 5.0702619552612305, 5.5190277099609375, 5.9677934646606445, 6.41655969619751, 6.865325927734375, 7.314090728759766, 7.762856483459473, 8.21162223815918, 8.660388946533203, 9.10915470123291, 9.557920455932617, 10.00668716430664, 10.455452919006348, 10.904218673706055, 11.352984428405762, 11.801750183105469, 12.250516891479492, 12.6992826461792, 13.148048400878906, 13.59681510925293, 14.045580863952637, 14.494346618652344, 14.94311237335205, 15.391878128051758, 15.840644836425781, 16.289409637451172, 16.738176345825195, 17.18694305419922, 17.63570785522461, 18.084474563598633, 18.533241271972656, 18.982006072998047, 19.43077278137207, 19.879539489746094, 20.328304290771484, 20.777070999145508, 21.2258358001709, 21.674602508544922]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 9.0, 9.0, 14.0, 25.0, 26.0, 38.0, 54.0, 39.0, 62.0, 59.0, 74.0, 81.0, 68.0, 82.0, 60.0, 74.0, 43.0, 58.0, 30.0, 29.0, 22.0, 15.0, 9.0, 9.0, 8.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8026463985443115, -0.7644394040107727, -0.7262324094772339, -0.6880253553390503, -0.6498183608055115, -0.6116113662719727, -0.5734043121337891, -0.5351973176002502, -0.4969903230667114, -0.4587833285331726, -0.4205763041973114, -0.3823692798614502, -0.3441622853279114, -0.30595529079437256, -0.26774826645851135, -0.22954124212265015, -0.19133424758911133, -0.15312723815441132, -0.1149202287197113, -0.07671321928501129, -0.03850620985031128, -0.0002992004156112671, 0.037907809019088745, 0.07611483335494995, 0.11432182788848877, 0.15252883732318878, 0.1907358467578888, 0.2289428561925888, 0.2671498656272888, 0.30535686016082764, 0.34356388449668884, 0.38177090883255005, 0.41997790336608887, 0.4581848978996277, 0.4963919222354889, 0.5345989465713501, 0.5728059411048889, 0.6110129356384277, 0.6492199897766113, 0.6874269843101501, 0.725633978843689, 0.7638409733772278, 0.8020479679107666, 0.8402550220489502, 0.878462016582489, 0.9166690111160278, 0.9548760652542114, 0.9930830597877502, 1.031290054321289, 1.0694971084594727, 1.1077040433883667, 1.1459110975265503, 1.1841180324554443, 1.222325086593628, 1.2605321407318115, 1.2987391948699951, 1.3369461297988892, 1.3751531839370728, 1.4133601188659668, 1.4515671730041504, 1.489774227142334, 1.527981162071228, 1.5661882162094116, 1.6043951511383057, 1.6426022052764893]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 1.0, 5.0, 7.0, 7.0, 8.0, 9.0, 13.0, 10.0, 25.0, 20.0, 17.0, 23.0, 34.0, 43.0, 41.0, 61.0, 55.0, 61.0, 120.0, 330.0, 17099.0, 4170215.0, 5442.0, 293.0, 110.0, 55.0, 43.0, 30.0, 19.0, 19.0, 22.0, 11.0, 10.0, 6.0, 7.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.75, -5.59197998046875, -5.4339599609375, -5.27593994140625, -5.117919921875, -4.95989990234375, -4.8018798828125, -4.64385986328125, -4.48583984375, -4.32781982421875, -4.1697998046875, -4.01177978515625, -3.853759765625, -3.69573974609375, -3.5377197265625, -3.37969970703125, -3.2216796875, -3.06365966796875, -2.9056396484375, -2.74761962890625, -2.589599609375, -2.43157958984375, -2.2735595703125, -2.11553955078125, -1.95751953125, -1.79949951171875, -1.6414794921875, -1.48345947265625, -1.325439453125, -1.16741943359375, -1.0093994140625, -0.85137939453125, -0.693359375, -0.53533935546875, -0.3773193359375, -0.21929931640625, -0.061279296875, 0.09674072265625, 0.2547607421875, 0.41278076171875, 0.57080078125, 0.72882080078125, 0.8868408203125, 1.04486083984375, 1.202880859375, 1.36090087890625, 1.5189208984375, 1.67694091796875, 1.8349609375, 1.99298095703125, 2.1510009765625, 2.30902099609375, 2.467041015625, 2.62506103515625, 2.7830810546875, 2.94110107421875, 3.09912109375, 3.25714111328125, 3.4151611328125, 3.57318115234375, 3.731201171875, 3.88922119140625, 4.0472412109375, 4.20526123046875, 4.36328125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 6.0, 15.0, 41.0, 86.0, 136.0, 179.0, 190.0, 158.0, 103.0, 61.0, 21.0, 10.0, 5.0, 3.0, 1.0], "bins": [-0.125732421875, -0.12345290184020996, -0.12117338180541992, -0.11889386177062988, -0.11661434173583984, -0.1143348217010498, -0.11205530166625977, -0.10977578163146973, -0.10749626159667969, -0.10521674156188965, -0.10293722152709961, -0.10065770149230957, -0.09837818145751953, -0.09609866142272949, -0.09381914138793945, -0.09153962135314941, -0.08926010131835938, -0.08698058128356934, -0.0847010612487793, -0.08242154121398926, -0.08014202117919922, -0.07786250114440918, -0.07558298110961914, -0.0733034610748291, -0.07102394104003906, -0.06874442100524902, -0.06646490097045898, -0.06418538093566895, -0.061905860900878906, -0.05962634086608887, -0.05734682083129883, -0.05506730079650879, -0.05278778076171875, -0.05050826072692871, -0.04822874069213867, -0.04594922065734863, -0.043669700622558594, -0.041390180587768555, -0.039110660552978516, -0.03683114051818848, -0.03455162048339844, -0.0322721004486084, -0.02999258041381836, -0.02771306037902832, -0.02543354034423828, -0.023154020309448242, -0.020874500274658203, -0.018594980239868164, -0.016315460205078125, -0.014035940170288086, -0.011756420135498047, -0.009476900100708008, -0.007197380065917969, -0.00491786003112793, -0.0026383399963378906, -0.00035881996154785156, 0.0019207000732421875, 0.0042002201080322266, 0.006479740142822266, 0.008759260177612305, 0.011038780212402344, 0.013318300247192383, 0.015597820281982422, 0.01787734031677246, 0.0201568603515625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 4.0, 11.0, 13.0, 23.0, 44.0, 104.0, 179.0, 444.0, 2418.0, 3961656.0, 227002.0, 1658.0, 345.0, 189.0, 90.0, 64.0, 26.0, 10.0, 10.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2109375, -3.9287109375, -3.646484375, -3.3642578125, -3.08203125, -2.7998046875, -2.517578125, -2.2353515625, -1.953125, -1.6708984375, -1.388671875, -1.1064453125, -0.82421875, -0.5419921875, -0.259765625, 0.0224609375, 0.3046875, 0.5869140625, 0.869140625, 1.1513671875, 1.43359375, 1.7158203125, 1.998046875, 2.2802734375, 2.5625, 2.8447265625, 3.126953125, 3.4091796875, 3.69140625, 3.9736328125, 4.255859375, 4.5380859375, 4.8203125, 5.1025390625, 5.384765625, 5.6669921875, 5.94921875, 6.2314453125, 6.513671875, 6.7958984375, 7.078125, 7.3603515625, 7.642578125, 7.9248046875, 8.20703125, 8.4892578125, 8.771484375, 9.0537109375, 9.3359375, 9.6181640625, 9.900390625, 10.1826171875, 10.46484375, 10.7470703125, 11.029296875, 11.3115234375, 11.59375, 11.8759765625, 12.158203125, 12.4404296875, 12.72265625, 13.0048828125, 13.287109375, 13.5693359375, 13.8515625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 8.0, 14.0, 72.0, 435.0, 3217.0, 253.0, 59.0, 19.0, 7.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26904296875, -0.24524688720703125, -0.2214508056640625, -0.19765472412109375, -0.173858642578125, -0.15006256103515625, -0.1262664794921875, -0.10247039794921875, -0.07867431640625, -0.05487823486328125, -0.0310821533203125, -0.00728607177734375, 0.016510009765625, 0.04030609130859375, 0.0641021728515625, 0.08789825439453125, 0.1116943359375, 0.13549041748046875, 0.1592864990234375, 0.18308258056640625, 0.206878662109375, 0.23067474365234375, 0.2544708251953125, 0.27826690673828125, 0.30206298828125, 0.32585906982421875, 0.3496551513671875, 0.37345123291015625, 0.397247314453125, 0.42104339599609375, 0.4448394775390625, 0.46863555908203125, 0.492431640625, 0.5162277221679688, 0.5400238037109375, 0.5638198852539062, 0.587615966796875, 0.6114120483398438, 0.6352081298828125, 0.6590042114257812, 0.68280029296875, 0.7065963745117188, 0.7303924560546875, 0.7541885375976562, 0.777984619140625, 0.8017807006835938, 0.8255767822265625, 0.8493728637695312, 0.8731689453125, 0.8969650268554688, 0.9207611083984375, 0.9445571899414062, 0.968353271484375, 0.9921493530273438, 1.0159454345703125, 1.0397415161132812, 1.06353759765625, 1.0873336791992188, 1.1111297607421875, 1.1349258422851562, 1.158721923828125, 1.1825180053710938, 1.2063140869140625, 1.2301101684570312, 1.25390625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 10.0, 35.0, 164.0, 504.0, 222.0, 51.0, 15.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.556102752685547, -3.3115787506103516, -3.0670547485351562, -2.822530746459961, -2.5780067443847656, -2.3334827423095703, -2.088958740234375, -1.8444346189498901, -1.5999106168746948, -1.3553866147994995, -1.1108626127243042, -0.8663385510444641, -0.6218145489692688, -0.3772904872894287, -0.1327664852142334, 0.11175751686096191, 0.3562815189361572, 0.6008055210113525, 0.8453295230865479, 1.0898535251617432, 1.3343775272369385, 1.5789016485214233, 1.8234256505966187, 2.0679497718811035, 2.312473773956299, 2.556997776031494, 2.8015217781066895, 3.0460457801818848, 3.29056978225708, 3.5350937843322754, 3.7796177864074707, 4.024141788482666, 4.268665790557861, 4.513189792633057, 4.757713794708252, 5.002237796783447, 5.246761798858643, 5.491285800933838, 5.735809803009033, 5.9803338050842285, 6.224857807159424, 6.469381809234619, 6.7139058113098145, 6.95842981338501, 7.202953815460205, 7.4474778175354, 7.692001819610596, 7.936525821685791, 8.181050300598145, 8.42557430267334, 8.670098304748535, 8.91462230682373, 9.159146308898926, 9.403670310974121, 9.648194313049316, 9.892718315124512, 10.137242317199707, 10.381766319274902, 10.626290321350098, 10.870814323425293, 11.115338325500488, 11.359862327575684, 11.604386329650879, 11.848910331726074, 12.09343433380127]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 12.0, 14.0, 36.0, 46.0, 57.0, 80.0, 89.0, 115.0, 98.0, 120.0, 100.0, 82.0, 44.0, 46.0, 28.0, 19.0, 5.0, 7.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3043053150177, -2.23893404006958, -2.17356276512146, -2.108191728591919, -2.042820453643799, -1.9774491786956787, -1.9120779037475586, -1.846706748008728, -1.7813355922698975, -1.7159643173217773, -1.6505931615829468, -1.5852218866348267, -1.519850730895996, -1.454479455947876, -1.3891081809997559, -1.3237370252609253, -1.2583657503128052, -1.192994475364685, -1.1276233196258545, -1.0622520446777344, -0.9968808889389038, -0.9315096139907837, -0.8661383986473083, -0.800767183303833, -0.7353959679603577, -0.6700247526168823, -0.604653537273407, -0.5392823219299316, -0.4739110767841339, -0.40853986144065857, -0.34316861629486084, -0.2777974009513855, -0.2124263048171997, -0.14705508947372437, -0.08168385922908783, -0.016312628984451294, 0.04905858635902405, 0.11442980170249939, 0.17980104684829712, 0.24517226219177246, 0.3105434775352478, 0.37591469287872314, 0.4412859082221985, 0.5066571235656738, 0.572028398513794, 0.6373995542526245, 0.7027708292007446, 0.76814204454422, 0.8335132598876953, 0.8988844752311707, 0.964255690574646, 1.0296269655227661, 1.0949981212615967, 1.1603693962097168, 1.225740671157837, 1.2911118268966675, 1.356482982635498, 1.4218542575836182, 1.4872254133224487, 1.5525966882705688, 1.6179678440093994, 1.6833391189575195, 1.7487103939056396, 1.8140815496444702, 1.8794528245925903]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 5.0, 2.0, 9.0, 6.0, 8.0, 6.0, 13.0, 9.0, 15.0, 12.0, 20.0, 25.0, 27.0, 32.0, 41.0, 50.0, 75.0, 193.0, 644.0, 4761.0, 197226.0, 827408.0, 15974.0, 1278.0, 291.0, 102.0, 64.0, 58.0, 36.0, 32.0, 24.0, 21.0, 20.0, 14.0, 9.0, 13.0, 7.0, 7.0, 4.0, 4.0, 1.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0], "bins": [-3.556640625, -3.455596923828125, -3.35455322265625, -3.253509521484375, -3.1524658203125, -3.051422119140625, -2.95037841796875, -2.849334716796875, -2.748291015625, -2.647247314453125, -2.54620361328125, -2.445159912109375, -2.3441162109375, -2.243072509765625, -2.14202880859375, -2.040985107421875, -1.93994140625, -1.838897705078125, -1.73785400390625, -1.636810302734375, -1.5357666015625, -1.434722900390625, -1.33367919921875, -1.232635498046875, -1.131591796875, -1.030548095703125, -0.92950439453125, -0.828460693359375, -0.7274169921875, -0.626373291015625, -0.52532958984375, -0.424285888671875, -0.3232421875, -0.222198486328125, -0.12115478515625, -0.020111083984375, 0.0809326171875, 0.181976318359375, 0.28302001953125, 0.384063720703125, 0.485107421875, 0.586151123046875, 0.68719482421875, 0.788238525390625, 0.8892822265625, 0.990325927734375, 1.09136962890625, 1.192413330078125, 1.29345703125, 1.394500732421875, 1.49554443359375, 1.596588134765625, 1.6976318359375, 1.798675537109375, 1.89971923828125, 2.000762939453125, 2.101806640625, 2.202850341796875, 2.30389404296875, 2.404937744140625, 2.5059814453125, 2.607025146484375, 2.70806884765625, 2.809112548828125, 2.91015625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 4.0, 4.0, 8.0, 5.0, 20.0, 25.0, 29.0, 33.0, 47.0, 52.0, 44.0, 63.0, 67.0, 79.0, 94.0, 74.0, 58.0, 55.0, 51.0, 39.0, 41.0, 30.0, 21.0, 17.0, 11.0, 9.0, 10.0, 3.0, 6.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07733154296875, -0.07493400573730469, -0.07253646850585938, -0.07013893127441406, -0.06774139404296875, -0.06534385681152344, -0.06294631958007812, -0.06054878234863281, -0.0581512451171875, -0.05575370788574219, -0.053356170654296875, -0.05095863342285156, -0.04856109619140625, -0.04616355895996094, -0.043766021728515625, -0.04136848449707031, -0.038970947265625, -0.03657341003417969, -0.034175872802734375, -0.03177833557128906, -0.02938079833984375, -0.026983261108398438, -0.024585723876953125, -0.022188186645507812, -0.0197906494140625, -0.017393112182617188, -0.014995574951171875, -0.012598037719726562, -0.01020050048828125, -0.0078029632568359375, -0.005405426025390625, -0.0030078887939453125, -0.0006103515625, 0.0017871856689453125, 0.004184722900390625, 0.0065822601318359375, 0.00897979736328125, 0.011377334594726562, 0.013774871826171875, 0.016172409057617188, 0.0185699462890625, 0.020967483520507812, 0.023365020751953125, 0.025762557983398438, 0.02816009521484375, 0.030557632446289062, 0.032955169677734375, 0.03535270690917969, 0.037750244140625, 0.04014778137207031, 0.042545318603515625, 0.04494285583496094, 0.04734039306640625, 0.04973793029785156, 0.052135467529296875, 0.05453300476074219, 0.0569305419921875, 0.05932807922363281, 0.061725616455078125, 0.06412315368652344, 0.06652069091796875, 0.06891822814941406, 0.07131576538085938, 0.07371330261230469, 0.07611083984375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 5.0, 2.0, 9.0, 8.0, 12.0, 16.0, 15.0, 31.0, 42.0, 73.0, 102.0, 157.0, 238.0, 467.0, 891.0, 2072.0, 5699.0, 22023.0, 120938.0, 567262.0, 269340.0, 43576.0, 9747.0, 3070.0, 1243.0, 612.0, 320.0, 193.0, 119.0, 69.0, 62.0, 51.0, 21.0, 21.0, 12.0, 4.0, 7.0, 7.0, 9.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8369140625, -0.808746337890625, -0.78057861328125, -0.752410888671875, -0.7242431640625, -0.696075439453125, -0.66790771484375, -0.639739990234375, -0.611572265625, -0.583404541015625, -0.55523681640625, -0.527069091796875, -0.4989013671875, -0.470733642578125, -0.44256591796875, -0.414398193359375, -0.38623046875, -0.358062744140625, -0.32989501953125, -0.301727294921875, -0.2735595703125, -0.245391845703125, -0.21722412109375, -0.189056396484375, -0.160888671875, -0.132720947265625, -0.10455322265625, -0.076385498046875, -0.0482177734375, -0.020050048828125, 0.00811767578125, 0.036285400390625, 0.064453125, 0.092620849609375, 0.12078857421875, 0.148956298828125, 0.1771240234375, 0.205291748046875, 0.23345947265625, 0.261627197265625, 0.289794921875, 0.317962646484375, 0.34613037109375, 0.374298095703125, 0.4024658203125, 0.430633544921875, 0.45880126953125, 0.486968994140625, 0.51513671875, 0.543304443359375, 0.57147216796875, 0.599639892578125, 0.6278076171875, 0.655975341796875, 0.68414306640625, 0.712310791015625, 0.740478515625, 0.768646240234375, 0.79681396484375, 0.824981689453125, 0.8531494140625, 0.881317138671875, 0.90948486328125, 0.937652587890625, 0.9658203125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 7.0, 5.0, 3.0, 6.0, 12.0, 14.0, 17.0, 20.0, 27.0, 20.0, 27.0, 39.0, 57.0, 54.0, 61.0, 46.0, 58.0, 52.0, 62.0, 68.0, 57.0, 50.0, 40.0, 35.0, 36.0, 36.0, 24.0, 21.0, 12.0, 14.0, 11.0, 2.0, 5.0, 3.0, 3.0, 6.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.35791015625, -0.34685516357421875, -0.3358001708984375, -0.32474517822265625, -0.313690185546875, -0.30263519287109375, -0.2915802001953125, -0.28052520751953125, -0.26947021484375, -0.25841522216796875, -0.2473602294921875, -0.23630523681640625, -0.225250244140625, -0.21419525146484375, -0.2031402587890625, -0.19208526611328125, -0.1810302734375, -0.16997528076171875, -0.1589202880859375, -0.14786529541015625, -0.136810302734375, -0.12575531005859375, -0.1147003173828125, -0.10364532470703125, -0.09259033203125, -0.08153533935546875, -0.0704803466796875, -0.05942535400390625, -0.048370361328125, -0.03731536865234375, -0.0262603759765625, -0.01520538330078125, -0.004150390625, 0.00690460205078125, 0.0179595947265625, 0.02901458740234375, 0.040069580078125, 0.05112457275390625, 0.0621795654296875, 0.07323455810546875, 0.08428955078125, 0.09534454345703125, 0.1063995361328125, 0.11745452880859375, 0.128509521484375, 0.13956451416015625, 0.1506195068359375, 0.16167449951171875, 0.1727294921875, 0.18378448486328125, 0.1948394775390625, 0.20589447021484375, 0.216949462890625, 0.22800445556640625, 0.2390594482421875, 0.25011444091796875, 0.26116943359375, 0.27222442626953125, 0.2832794189453125, 0.29433441162109375, 0.305389404296875, 0.31644439697265625, 0.3274993896484375, 0.33855438232421875, 0.349609375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 3.0, 11.0, 8.0, 18.0, 20.0, 29.0, 57.0, 92.0, 113.0, 177.0, 380.0, 897.0, 2652.0, 12056.0, 159283.0, 819719.0, 43818.0, 6189.0, 1719.0, 591.0, 289.0, 147.0, 96.0, 55.0, 37.0, 28.0, 19.0, 16.0, 14.0, 5.0, 2.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.189453125, -1.1501922607421875, -1.110931396484375, -1.0716705322265625, -1.03240966796875, -0.9931488037109375, -0.953887939453125, -0.9146270751953125, -0.8753662109375, -0.8361053466796875, -0.796844482421875, -0.7575836181640625, -0.71832275390625, -0.6790618896484375, -0.639801025390625, -0.6005401611328125, -0.561279296875, -0.5220184326171875, -0.482757568359375, -0.4434967041015625, -0.40423583984375, -0.3649749755859375, -0.325714111328125, -0.2864532470703125, -0.2471923828125, -0.2079315185546875, -0.168670654296875, -0.1294097900390625, -0.09014892578125, -0.0508880615234375, -0.011627197265625, 0.0276336669921875, 0.06689453125, 0.1061553955078125, 0.145416259765625, 0.1846771240234375, 0.22393798828125, 0.2631988525390625, 0.302459716796875, 0.3417205810546875, 0.3809814453125, 0.4202423095703125, 0.459503173828125, 0.4987640380859375, 0.53802490234375, 0.5772857666015625, 0.616546630859375, 0.6558074951171875, 0.695068359375, 0.7343292236328125, 0.773590087890625, 0.8128509521484375, 0.85211181640625, 0.8913726806640625, 0.930633544921875, 0.9698944091796875, 1.0091552734375, 1.0484161376953125, 1.087677001953125, 1.1269378662109375, 1.16619873046875, 1.2054595947265625, 1.244720458984375, 1.2839813232421875, 1.3232421875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 9.0, 13.0, 16.0, 18.0, 26.0, 29.0, 44.0, 82.0, 124.0, 142.0, 132.0, 117.0, 72.0, 61.0, 39.0, 26.0, 10.0, 15.0, 12.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.08970832824707e-05, -8.710380643606186e-05, -8.331052958965302e-05, -7.951725274324417e-05, -7.572397589683533e-05, -7.193069905042648e-05, -6.813742220401764e-05, -6.43441453576088e-05, -6.055086851119995e-05, -5.675759166479111e-05, -5.296431481838226e-05, -4.917103797197342e-05, -4.5377761125564575e-05, -4.158448427915573e-05, -3.779120743274689e-05, -3.399793058633804e-05, -3.02046537399292e-05, -2.6411376893520355e-05, -2.261810004711151e-05, -1.8824823200702667e-05, -1.5031546354293823e-05, -1.123826950788498e-05, -7.444992661476135e-06, -3.6517158150672913e-06, 1.4156103134155273e-07, 3.934837877750397e-06, 7.72811472415924e-06, 1.1521391570568085e-05, 1.531466841697693e-05, 1.9107945263385773e-05, 2.2901222109794617e-05, 2.669449895620346e-05, 3.0487775802612305e-05, 3.428105264902115e-05, 3.807432949542999e-05, 4.186760634183884e-05, 4.566088318824768e-05, 4.9454160034656525e-05, 5.324743688106537e-05, 5.704071372747421e-05, 6.083399057388306e-05, 6.46272674202919e-05, 6.842054426670074e-05, 7.221382111310959e-05, 7.600709795951843e-05, 7.980037480592728e-05, 8.359365165233612e-05, 8.738692849874496e-05, 9.118020534515381e-05, 9.497348219156265e-05, 9.87667590379715e-05, 0.00010256003588438034, 0.00010635331273078918, 0.00011014658957719803, 0.00011393986642360687, 0.00011773314327001572, 0.00012152642011642456, 0.0001253196969628334, 0.00012911297380924225, 0.0001329062506556511, 0.00013669952750205994, 0.00014049280434846878, 0.00014428608119487762, 0.00014807935804128647, 0.0001518726348876953]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 6.0, 5.0, 6.0, 11.0, 12.0, 11.0, 19.0, 23.0, 58.0, 75.0, 150.0, 246.0, 343.0, 713.0, 1486.0, 3869.0, 13118.0, 85473.0, 744060.0, 170582.0, 19627.0, 4909.0, 1887.0, 846.0, 404.0, 222.0, 133.0, 73.0, 56.0, 29.0, 26.0, 24.0, 10.0, 13.0, 9.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69140625, -0.6672592163085938, -0.6431121826171875, -0.6189651489257812, -0.594818115234375, -0.5706710815429688, -0.5465240478515625, -0.5223770141601562, -0.49822998046875, -0.47408294677734375, -0.4499359130859375, -0.42578887939453125, -0.401641845703125, -0.37749481201171875, -0.3533477783203125, -0.32920074462890625, -0.3050537109375, -0.28090667724609375, -0.2567596435546875, -0.23261260986328125, -0.208465576171875, -0.18431854248046875, -0.1601715087890625, -0.13602447509765625, -0.11187744140625, -0.08773040771484375, -0.0635833740234375, -0.03943634033203125, -0.015289306640625, 0.00885772705078125, 0.0330047607421875, 0.05715179443359375, 0.081298828125, 0.10544586181640625, 0.1295928955078125, 0.15373992919921875, 0.177886962890625, 0.20203399658203125, 0.2261810302734375, 0.25032806396484375, 0.27447509765625, 0.29862213134765625, 0.3227691650390625, 0.34691619873046875, 0.371063232421875, 0.39521026611328125, 0.4193572998046875, 0.44350433349609375, 0.4676513671875, 0.49179840087890625, 0.5159454345703125, 0.5400924682617188, 0.564239501953125, 0.5883865356445312, 0.6125335693359375, 0.6366806030273438, 0.66082763671875, 0.6849746704101562, 0.7091217041015625, 0.7332687377929688, 0.757415771484375, 0.7815628051757812, 0.8057098388671875, 0.8298568725585938, 0.85400390625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 4.0, 7.0, 14.0, 14.0, 14.0, 18.0, 26.0, 33.0, 40.0, 41.0, 59.0, 64.0, 79.0, 91.0, 119.0, 70.0, 62.0, 60.0, 47.0, 22.0, 25.0, 22.0, 9.0, 11.0, 7.0, 8.0, 5.0, 6.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.302490234375, -0.29425048828125, -0.2860107421875, -0.27777099609375, -0.26953125, -0.26129150390625, -0.2530517578125, -0.24481201171875, -0.236572265625, -0.22833251953125, -0.2200927734375, -0.21185302734375, -0.20361328125, -0.19537353515625, -0.1871337890625, -0.17889404296875, -0.170654296875, -0.16241455078125, -0.1541748046875, -0.14593505859375, -0.1376953125, -0.12945556640625, -0.1212158203125, -0.11297607421875, -0.104736328125, -0.09649658203125, -0.0882568359375, -0.08001708984375, -0.07177734375, -0.06353759765625, -0.0552978515625, -0.04705810546875, -0.038818359375, -0.03057861328125, -0.0223388671875, -0.01409912109375, -0.005859375, 0.00238037109375, 0.0106201171875, 0.01885986328125, 0.027099609375, 0.03533935546875, 0.0435791015625, 0.05181884765625, 0.06005859375, 0.06829833984375, 0.0765380859375, 0.08477783203125, 0.093017578125, 0.10125732421875, 0.1094970703125, 0.11773681640625, 0.1259765625, 0.13421630859375, 0.1424560546875, 0.15069580078125, 0.158935546875, 0.16717529296875, 0.1754150390625, 0.18365478515625, 0.19189453125, 0.20013427734375, 0.2083740234375, 0.21661376953125, 0.224853515625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 19.0, 83.0, 335.0, 433.0, 110.0, 21.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.385377883911133, -10.91618537902832, -10.446993827819824, -9.977801322937012, -9.5086088180542, -9.039417266845703, -8.57022476196289, -8.101032257080078, -7.631840229034424, -7.1626482009887695, -6.693455696105957, -6.224263668060303, -5.755071640014648, -5.285879135131836, -4.816687107086182, -4.347495079040527, -3.878302574157715, -3.4091103076934814, -2.939918041229248, -2.4707260131835938, -2.0015337467193604, -1.532341480255127, -1.0631494522094727, -0.5939571857452393, -0.12476491928100586, 0.34442728757858276, 0.8136194944381714, 1.2828116416931152, 1.7520039081573486, 2.221196174621582, 2.6903882026672363, 3.1595804691314697, 3.628772735595703, 4.097964763641357, 4.56715726852417, 5.036349296569824, 5.505541801452637, 5.974733829498291, 6.443925857543945, 6.913118362426758, 7.382310390472412, 7.851502418518066, 8.320694923400879, 8.789886474609375, 9.259078979492188, 9.728271484375, 10.197463989257812, 10.666655540466309, 11.135848045349121, 11.605040550231934, 12.07423210144043, 12.543424606323242, 13.012617111206055, 13.481809616088867, 13.951001167297363, 14.420193672180176, 14.889385223388672, 15.358577728271484, 15.82776927947998, 16.29696273803711, 16.76615333557129, 17.2353458404541, 17.704538345336914, 18.173730850219727, 18.64292335510254]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 5.0, 8.0, 5.0, 7.0, 6.0, 7.0, 10.0, 24.0, 17.0, 16.0, 22.0, 20.0, 27.0, 32.0, 31.0, 38.0, 43.0, 45.0, 36.0, 52.0, 39.0, 50.0, 63.0, 41.0, 37.0, 38.0, 35.0, 38.0, 35.0, 35.0, 21.0, 23.0, 14.0, 15.0, 8.0, 14.0, 14.0, 8.0, 7.0, 3.0, 7.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.9695837497711182, -1.9022765159606934, -1.8349692821502686, -1.7676621675491333, -1.7003549337387085, -1.6330476999282837, -1.5657405853271484, -1.4984333515167236, -1.4311261177062988, -1.363818883895874, -1.2965116500854492, -1.229204535484314, -1.1618973016738892, -1.0945900678634644, -1.027282953262329, -0.9599757194519043, -0.8926684856414795, -0.8253612518310547, -0.7580540776252747, -0.6907469034194946, -0.6234396696090698, -0.556132435798645, -0.488825261592865, -0.4215180575847626, -0.35421085357666016, -0.28690364956855774, -0.21959644556045532, -0.1522892415523529, -0.08498203754425049, -0.01767483353614807, 0.049632370471954346, 0.11693957448005676, 0.18424701690673828, 0.2515542209148407, 0.3188614249229431, 0.38616862893104553, 0.45347583293914795, 0.5207830667495728, 0.5880902409553528, 0.6553974151611328, 0.7227046489715576, 0.7900118827819824, 0.8573190569877625, 0.9246262311935425, 0.9919334650039673, 1.059240698814392, 1.1265478134155273, 1.1938550472259521, 1.261162281036377, 1.3284695148468018, 1.3957767486572266, 1.4630838632583618, 1.5303910970687866, 1.5976983308792114, 1.6650054454803467, 1.7323126792907715, 1.7996199131011963, 1.866927146911621, 1.934234380722046, 2.0015416145324707, 2.0688486099243164, 2.136155843734741, 2.203463077545166, 2.270770311355591, 2.3380775451660156]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 7.0, 4.0, 9.0, 10.0, 15.0, 9.0, 11.0, 15.0, 20.0, 13.0, 26.0, 19.0, 40.0, 31.0, 53.0, 91.0, 230.0, 1240.0, 21317.0, 4007391.0, 158001.0, 4634.0, 638.0, 185.0, 76.0, 56.0, 40.0, 36.0, 11.0, 16.0, 10.0, 10.0, 4.0, 8.0, 1.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.28125, -4.164703369140625, -4.04815673828125, -3.931610107421875, -3.8150634765625, -3.698516845703125, -3.58197021484375, -3.465423583984375, -3.348876953125, -3.232330322265625, -3.11578369140625, -2.999237060546875, -2.8826904296875, -2.766143798828125, -2.64959716796875, -2.533050537109375, -2.41650390625, -2.299957275390625, -2.18341064453125, -2.066864013671875, -1.9503173828125, -1.833770751953125, -1.71722412109375, -1.600677490234375, -1.484130859375, -1.367584228515625, -1.25103759765625, -1.134490966796875, -1.0179443359375, -0.901397705078125, -0.78485107421875, -0.668304443359375, -0.5517578125, -0.435211181640625, -0.31866455078125, -0.202117919921875, -0.0855712890625, 0.030975341796875, 0.14752197265625, 0.264068603515625, 0.380615234375, 0.497161865234375, 0.61370849609375, 0.730255126953125, 0.8468017578125, 0.963348388671875, 1.07989501953125, 1.196441650390625, 1.31298828125, 1.429534912109375, 1.54608154296875, 1.662628173828125, 1.7791748046875, 1.895721435546875, 2.01226806640625, 2.128814697265625, 2.245361328125, 2.361907958984375, 2.47845458984375, 2.595001220703125, 2.7115478515625, 2.828094482421875, 2.94464111328125, 3.061187744140625, 3.177734375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 7.0, 5.0, 3.0, 4.0, 7.0, 7.0, 10.0, 24.0, 24.0, 32.0, 36.0, 44.0, 37.0, 53.0, 44.0, 62.0, 65.0, 58.0, 72.0, 68.0, 45.0, 53.0, 44.0, 40.0, 37.0, 26.0, 15.0, 17.0, 17.0, 9.0, 9.0, 9.0, 6.0, 3.0, 1.0, 4.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.058685302734375, -0.05639028549194336, -0.05409526824951172, -0.05180025100708008, -0.04950523376464844, -0.0472102165222168, -0.044915199279785156, -0.042620182037353516, -0.040325164794921875, -0.038030147552490234, -0.035735130310058594, -0.03344011306762695, -0.031145095825195312, -0.028850078582763672, -0.02655506134033203, -0.02426004409790039, -0.02196502685546875, -0.01967000961303711, -0.01737499237060547, -0.015079975128173828, -0.012784957885742188, -0.010489940643310547, -0.008194923400878906, -0.005899906158447266, -0.003604888916015625, -0.0013098716735839844, 0.0009851455688476562, 0.003280162811279297, 0.0055751800537109375, 0.007870197296142578, 0.010165214538574219, 0.01246023178100586, 0.0147552490234375, 0.01705026626586914, 0.01934528350830078, 0.021640300750732422, 0.023935317993164062, 0.026230335235595703, 0.028525352478027344, 0.030820369720458984, 0.033115386962890625, 0.035410404205322266, 0.037705421447753906, 0.04000043869018555, 0.04229545593261719, 0.04459047317504883, 0.04688549041748047, 0.04918050765991211, 0.05147552490234375, 0.05377054214477539, 0.05606555938720703, 0.05836057662963867, 0.06065559387207031, 0.06295061111450195, 0.0652456283569336, 0.06754064559936523, 0.06983566284179688, 0.07213068008422852, 0.07442569732666016, 0.0767207145690918, 0.07901573181152344, 0.08131074905395508, 0.08360576629638672, 0.08590078353881836, 0.08819580078125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 7.0, 20.0, 111.0, 351.0, 1445.0, 132671.0, 4056925.0, 2124.0, 460.0, 117.0, 25.0, 16.0, 7.0, 5.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.53515625, -7.16009521484375, -6.7850341796875, -6.40997314453125, -6.034912109375, -5.65985107421875, -5.2847900390625, -4.90972900390625, -4.53466796875, -4.15960693359375, -3.7845458984375, -3.40948486328125, -3.034423828125, -2.65936279296875, -2.2843017578125, -1.90924072265625, -1.5341796875, -1.15911865234375, -0.7840576171875, -0.40899658203125, -0.033935546875, 0.34112548828125, 0.7161865234375, 1.09124755859375, 1.46630859375, 1.84136962890625, 2.2164306640625, 2.59149169921875, 2.966552734375, 3.34161376953125, 3.7166748046875, 4.09173583984375, 4.466796875, 4.84185791015625, 5.2169189453125, 5.59197998046875, 5.967041015625, 6.34210205078125, 6.7171630859375, 7.09222412109375, 7.46728515625, 7.84234619140625, 8.2174072265625, 8.59246826171875, 8.967529296875, 9.34259033203125, 9.7176513671875, 10.09271240234375, 10.4677734375, 10.84283447265625, 11.2178955078125, 11.59295654296875, 11.968017578125, 12.34307861328125, 12.7181396484375, 13.09320068359375, 13.46826171875, 13.84332275390625, 14.2183837890625, 14.59344482421875, 14.968505859375, 15.34356689453125, 15.7186279296875, 16.09368896484375, 16.46875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 23.0, 57.0, 445.0, 3196.0, 286.0, 54.0, 16.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81884765625, -0.7852554321289062, -0.7516632080078125, -0.7180709838867188, -0.684478759765625, -0.6508865356445312, -0.6172943115234375, -0.5837020874023438, -0.55010986328125, -0.5165176391601562, -0.4829254150390625, -0.44933319091796875, -0.415740966796875, -0.38214874267578125, -0.3485565185546875, -0.31496429443359375, -0.2813720703125, -0.24777984619140625, -0.2141876220703125, -0.18059539794921875, -0.147003173828125, -0.11341094970703125, -0.0798187255859375, -0.04622650146484375, -0.01263427734375, 0.02095794677734375, 0.0545501708984375, 0.08814239501953125, 0.121734619140625, 0.15532684326171875, 0.1889190673828125, 0.22251129150390625, 0.256103515625, 0.28969573974609375, 0.3232879638671875, 0.35688018798828125, 0.390472412109375, 0.42406463623046875, 0.4576568603515625, 0.49124908447265625, 0.52484130859375, 0.5584335327148438, 0.5920257568359375, 0.6256179809570312, 0.659210205078125, 0.6928024291992188, 0.7263946533203125, 0.7599868774414062, 0.7935791015625, 0.8271713256835938, 0.8607635498046875, 0.8943557739257812, 0.927947998046875, 0.9615402221679688, 0.9951324462890625, 1.0287246704101562, 1.06231689453125, 1.0959091186523438, 1.1295013427734375, 1.1630935668945312, 1.196685791015625, 1.2302780151367188, 1.2638702392578125, 1.2974624633789062, 1.3310546875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 8.0, 19.0, 92.0, 423.0, 367.0, 66.0, 21.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-13.477032661437988, -13.195364952087402, -12.913697242736816, -12.632030487060547, -12.350362777709961, -12.068695068359375, -11.787027359008789, -11.505359649658203, -11.223692893981934, -10.942025184631348, -10.660357475280762, -10.378690719604492, -10.097023010253906, -9.81535530090332, -9.533687591552734, -9.252019882202148, -8.970352172851562, -8.688684463500977, -8.40701675415039, -8.125349998474121, -7.843682289123535, -7.562014579772949, -7.280346870422363, -6.9986796379089355, -6.717012405395508, -6.435344696044922, -6.153677463531494, -5.872009754180908, -5.5903425216674805, -5.3086748123168945, -5.027007102966309, -4.745339870452881, -4.463673114776611, -4.182005405426025, -3.9003381729125977, -3.6186704635620117, -3.337003231048584, -3.055335521697998, -2.773668050765991, -2.4920005798339844, -2.2103331089019775, -1.9286656379699707, -1.6469981670379639, -1.3653305768966675, -1.0836631059646606, -0.8019956350326538, -0.5203280448913574, -0.23866057395935059, 0.04300689697265625, 0.3246743977069855, 0.6063418984413147, 0.8880094289779663, 1.1696768999099731, 1.45134437084198, 1.7330119609832764, 2.014679431915283, 2.29634690284729, 2.578014373779297, 2.8596818447113037, 3.1413493156433105, 3.4230170249938965, 3.704684257507324, 3.98635196685791, 4.268019676208496, 4.549686908721924]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 7.0, 11.0, 11.0, 35.0, 37.0, 38.0, 47.0, 62.0, 62.0, 69.0, 92.0, 81.0, 88.0, 59.0, 72.0, 56.0, 40.0, 39.0, 23.0, 26.0, 13.0, 10.0, 10.0, 7.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4030470848083496, -1.3432602882385254, -1.2834734916687012, -1.2236865758895874, -1.1638997793197632, -1.104112982749939, -1.0443260669708252, -0.984539270401001, -0.9247524738311768, -0.8649656772613525, -0.8051788210868835, -0.7453919649124146, -0.6856051683425903, -0.6258183717727661, -0.5660315155982971, -0.5062446594238281, -0.4464578628540039, -0.3866710364818573, -0.3268842101097107, -0.2670973837375641, -0.20731055736541748, -0.14752373099327087, -0.08773690462112427, -0.02795007824897766, 0.031836748123168945, 0.09162357449531555, 0.15141040086746216, 0.21119722723960876, 0.27098405361175537, 0.330770879983902, 0.3905577063560486, 0.4503445327281952, 0.5101313591003418, 0.569918155670166, 0.629705011844635, 0.689491868019104, 0.7492786645889282, 0.8090654611587524, 0.8688523173332214, 0.9286391735076904, 0.9884259700775146, 1.0482127666473389, 1.107999563217163, 1.1677864789962769, 1.227573275566101, 1.2873600721359253, 1.347146987915039, 1.4069337844848633, 1.4667205810546875, 1.5265073776245117, 1.586294174194336, 1.6460810899734497, 1.705867886543274, 1.7656546831130981, 1.825441598892212, 1.8852283954620361, 1.9450151920318604, 2.0048019886016846, 2.064588785171509, 2.124375581741333, 2.1841626167297363, 2.2439494132995605, 2.3037362098693848, 2.363523006439209, 2.423309803009033]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 5.0, 3.0, 8.0, 10.0, 9.0, 7.0, 15.0, 19.0, 23.0, 38.0, 56.0, 76.0, 107.0, 182.0, 340.0, 732.0, 1954.0, 9527.0, 121676.0, 813378.0, 89147.0, 7955.0, 1810.0, 594.0, 304.0, 197.0, 122.0, 60.0, 51.0, 38.0, 23.0, 23.0, 10.0, 11.0, 10.0, 8.0, 8.0, 5.0, 4.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.04296875, -1.971160888671875, -1.89935302734375, -1.827545166015625, -1.7557373046875, -1.683929443359375, -1.61212158203125, -1.540313720703125, -1.468505859375, -1.396697998046875, -1.32489013671875, -1.253082275390625, -1.1812744140625, -1.109466552734375, -1.03765869140625, -0.965850830078125, -0.89404296875, -0.822235107421875, -0.75042724609375, -0.678619384765625, -0.6068115234375, -0.535003662109375, -0.46319580078125, -0.391387939453125, -0.319580078125, -0.247772216796875, -0.17596435546875, -0.104156494140625, -0.0323486328125, 0.039459228515625, 0.11126708984375, 0.183074951171875, 0.2548828125, 0.326690673828125, 0.39849853515625, 0.470306396484375, 0.5421142578125, 0.613922119140625, 0.68572998046875, 0.757537841796875, 0.829345703125, 0.901153564453125, 0.97296142578125, 1.044769287109375, 1.1165771484375, 1.188385009765625, 1.26019287109375, 1.332000732421875, 1.40380859375, 1.475616455078125, 1.54742431640625, 1.619232177734375, 1.6910400390625, 1.762847900390625, 1.83465576171875, 1.906463623046875, 1.978271484375, 2.050079345703125, 2.12188720703125, 2.193695068359375, 2.2655029296875, 2.337310791015625, 2.40911865234375, 2.480926513671875, 2.552734375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 5.0, 3.0, 2.0, 6.0, 8.0, 19.0, 19.0, 37.0, 33.0, 49.0, 48.0, 57.0, 74.0, 78.0, 83.0, 87.0, 66.0, 82.0, 60.0, 48.0, 35.0, 34.0, 22.0, 15.0, 15.0, 10.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10760498046875, -0.10328388214111328, -0.09896278381347656, -0.09464168548583984, -0.09032058715820312, -0.0859994888305664, -0.08167839050292969, -0.07735729217529297, -0.07303619384765625, -0.06871509552001953, -0.06439399719238281, -0.060072898864746094, -0.055751800537109375, -0.051430702209472656, -0.04710960388183594, -0.04278850555419922, -0.0384674072265625, -0.03414630889892578, -0.029825210571289062, -0.025504112243652344, -0.021183013916015625, -0.016861915588378906, -0.012540817260742188, -0.008219718933105469, -0.00389862060546875, 0.00042247772216796875, 0.0047435760498046875, 0.009064674377441406, 0.013385772705078125, 0.017706871032714844, 0.022027969360351562, 0.02634906768798828, 0.030670166015625, 0.03499126434326172, 0.03931236267089844, 0.043633460998535156, 0.047954559326171875, 0.052275657653808594, 0.05659675598144531, 0.06091785430908203, 0.06523895263671875, 0.06956005096435547, 0.07388114929199219, 0.0782022476196289, 0.08252334594726562, 0.08684444427490234, 0.09116554260253906, 0.09548664093017578, 0.0998077392578125, 0.10412883758544922, 0.10844993591308594, 0.11277103424072266, 0.11709213256835938, 0.1214132308959961, 0.1257343292236328, 0.13005542755126953, 0.13437652587890625, 0.13869762420654297, 0.1430187225341797, 0.1473398208618164, 0.15166091918945312, 0.15598201751708984, 0.16030311584472656, 0.16462421417236328, 0.1689453125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 7.0, 6.0, 7.0, 7.0, 5.0, 10.0, 8.0, 25.0, 18.0, 33.0, 43.0, 68.0, 103.0, 134.0, 243.0, 394.0, 681.0, 1370.0, 2874.0, 6649.0, 18708.0, 67751.0, 299323.0, 473365.0, 127284.0, 31236.0, 10022.0, 3999.0, 1810.0, 950.0, 544.0, 327.0, 180.0, 130.0, 72.0, 49.0, 36.0, 25.0, 22.0, 13.0, 10.0, 2.0, 5.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.92578125, -0.8994903564453125, -0.873199462890625, -0.8469085693359375, -0.82061767578125, -0.7943267822265625, -0.768035888671875, -0.7417449951171875, -0.7154541015625, -0.6891632080078125, -0.662872314453125, -0.6365814208984375, -0.61029052734375, -0.5839996337890625, -0.557708740234375, -0.5314178466796875, -0.505126953125, -0.4788360595703125, -0.452545166015625, -0.4262542724609375, -0.39996337890625, -0.3736724853515625, -0.347381591796875, -0.3210906982421875, -0.2947998046875, -0.2685089111328125, -0.242218017578125, -0.2159271240234375, -0.18963623046875, -0.1633453369140625, -0.137054443359375, -0.1107635498046875, -0.08447265625, -0.0581817626953125, -0.031890869140625, -0.0055999755859375, 0.02069091796875, 0.0469818115234375, 0.073272705078125, 0.0995635986328125, 0.1258544921875, 0.1521453857421875, 0.178436279296875, 0.2047271728515625, 0.23101806640625, 0.2573089599609375, 0.283599853515625, 0.3098907470703125, 0.336181640625, 0.3624725341796875, 0.388763427734375, 0.4150543212890625, 0.44134521484375, 0.4676361083984375, 0.493927001953125, 0.5202178955078125, 0.5465087890625, 0.5727996826171875, 0.599090576171875, 0.6253814697265625, 0.65167236328125, 0.6779632568359375, 0.704254150390625, 0.7305450439453125, 0.7568359375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 2.0, 6.0, 3.0, 11.0, 12.0, 7.0, 15.0, 13.0, 17.0, 21.0, 26.0, 27.0, 35.0, 42.0, 47.0, 47.0, 53.0, 56.0, 56.0, 57.0, 58.0, 51.0, 33.0, 45.0, 42.0, 38.0, 31.0, 26.0, 20.0, 25.0, 15.0, 8.0, 14.0, 16.0, 5.0, 2.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.5205078125, -0.5063667297363281, -0.49222564697265625, -0.4780845642089844, -0.4639434814453125, -0.4498023986816406, -0.43566131591796875, -0.4215202331542969, -0.407379150390625, -0.3932380676269531, -0.37909698486328125, -0.3649559020996094, -0.3508148193359375, -0.3366737365722656, -0.32253265380859375, -0.3083915710449219, -0.29425048828125, -0.2801094055175781, -0.26596832275390625, -0.2518272399902344, -0.2376861572265625, -0.22354507446289062, -0.20940399169921875, -0.19526290893554688, -0.181121826171875, -0.16698074340820312, -0.15283966064453125, -0.13869857788085938, -0.1245574951171875, -0.11041641235351562, -0.09627532958984375, -0.08213424682617188, -0.0679931640625, -0.053852081298828125, -0.03971099853515625, -0.025569915771484375, -0.0114288330078125, 0.002712249755859375, 0.01685333251953125, 0.030994415283203125, 0.045135498046875, 0.059276580810546875, 0.07341766357421875, 0.08755874633789062, 0.1016998291015625, 0.11584091186523438, 0.12998199462890625, 0.14412307739257812, 0.15826416015625, 0.17240524291992188, 0.18654632568359375, 0.20068740844726562, 0.2148284912109375, 0.22896957397460938, 0.24311065673828125, 0.2572517395019531, 0.271392822265625, 0.2855339050292969, 0.29967498779296875, 0.3138160705566406, 0.3279571533203125, 0.3420982360839844, 0.35623931884765625, 0.3703804016113281, 0.384521484375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 2.0, 6.0, 3.0, 7.0, 4.0, 13.0, 17.0, 28.0, 40.0, 61.0, 114.0, 174.0, 485.0, 1438.0, 5390.0, 33847.0, 847142.0, 144494.0, 11270.0, 2563.0, 791.0, 300.0, 142.0, 73.0, 43.0, 24.0, 18.0, 20.0, 16.0, 3.0, 5.0, 4.0, 5.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-1.333984375, -1.2966461181640625, -1.259307861328125, -1.2219696044921875, -1.18463134765625, -1.1472930908203125, -1.109954833984375, -1.0726165771484375, -1.0352783203125, -0.9979400634765625, -0.960601806640625, -0.9232635498046875, -0.88592529296875, -0.8485870361328125, -0.811248779296875, -0.7739105224609375, -0.736572265625, -0.6992340087890625, -0.661895751953125, -0.6245574951171875, -0.58721923828125, -0.5498809814453125, -0.512542724609375, -0.4752044677734375, -0.4378662109375, -0.4005279541015625, -0.363189697265625, -0.3258514404296875, -0.28851318359375, -0.2511749267578125, -0.213836669921875, -0.1764984130859375, -0.13916015625, -0.1018218994140625, -0.064483642578125, -0.0271453857421875, 0.01019287109375, 0.0475311279296875, 0.084869384765625, 0.1222076416015625, 0.1595458984375, 0.1968841552734375, 0.234222412109375, 0.2715606689453125, 0.30889892578125, 0.3462371826171875, 0.383575439453125, 0.4209136962890625, 0.458251953125, 0.4955902099609375, 0.532928466796875, 0.5702667236328125, 0.60760498046875, 0.6449432373046875, 0.682281494140625, 0.7196197509765625, 0.7569580078125, 0.7942962646484375, 0.831634521484375, 0.8689727783203125, 0.90631103515625, 0.9436492919921875, 0.980987548828125, 1.0183258056640625, 1.0556640625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 2.0, 1.0, 10.0, 6.0, 8.0, 9.0, 9.0, 23.0, 25.0, 34.0, 46.0, 69.0, 118.0, 110.0, 127.0, 121.0, 98.0, 62.0, 34.0, 21.0, 24.0, 11.0, 6.0, 8.0, 2.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.207559585571289e-05, -7.894355803728104e-05, -7.581152021884918e-05, -7.267948240041733e-05, -6.954744458198547e-05, -6.641540676355362e-05, -6.328336894512177e-05, -6.015133112668991e-05, -5.701929330825806e-05, -5.38872554898262e-05, -5.075521767139435e-05, -4.7623179852962494e-05, -4.449114203453064e-05, -4.1359104216098785e-05, -3.822706639766693e-05, -3.509502857923508e-05, -3.196299076080322e-05, -2.883095294237137e-05, -2.5698915123939514e-05, -2.256687730550766e-05, -1.9434839487075806e-05, -1.630280166864395e-05, -1.3170763850212097e-05, -1.0038726031780243e-05, -6.906688213348389e-06, -3.7746503949165344e-06, -6.426125764846802e-07, 2.489425241947174e-06, 5.621463060379028e-06, 8.753500878810883e-06, 1.1885538697242737e-05, 1.5017576515674591e-05, 1.8149614334106445e-05, 2.12816521525383e-05, 2.4413689970970154e-05, 2.7545727789402008e-05, 3.067776560783386e-05, 3.3809803426265717e-05, 3.694184124469757e-05, 4.0073879063129425e-05, 4.320591688156128e-05, 4.6337954699993134e-05, 4.946999251842499e-05, 5.260203033685684e-05, 5.5734068155288696e-05, 5.886610597372055e-05, 6.19981437921524e-05, 6.513018161058426e-05, 6.826221942901611e-05, 7.139425724744797e-05, 7.452629506587982e-05, 7.765833288431168e-05, 8.079037070274353e-05, 8.392240852117538e-05, 8.705444633960724e-05, 9.018648415803909e-05, 9.331852197647095e-05, 9.64505597949028e-05, 9.958259761333466e-05, 0.00010271463543176651, 0.00010584667325019836, 0.00010897871106863022, 0.00011211074888706207, 0.00011524278670549393, 0.00011837482452392578]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 8.0, 9.0, 10.0, 11.0, 23.0, 28.0, 43.0, 73.0, 81.0, 142.0, 211.0, 443.0, 820.0, 1789.0, 4205.0, 11410.0, 47320.0, 555671.0, 374097.0, 35713.0, 9474.0, 3605.0, 1651.0, 734.0, 399.0, 232.0, 118.0, 75.0, 49.0, 22.0, 21.0, 16.0, 15.0, 10.0, 9.0, 6.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.65185546875, -0.6326370239257812, -0.6134185791015625, -0.5942001342773438, -0.574981689453125, -0.5557632446289062, -0.5365447998046875, -0.5173263549804688, -0.49810791015625, -0.47888946533203125, -0.4596710205078125, -0.44045257568359375, -0.421234130859375, -0.40201568603515625, -0.3827972412109375, -0.36357879638671875, -0.3443603515625, -0.32514190673828125, -0.3059234619140625, -0.28670501708984375, -0.267486572265625, -0.24826812744140625, -0.2290496826171875, -0.20983123779296875, -0.19061279296875, -0.17139434814453125, -0.1521759033203125, -0.13295745849609375, -0.113739013671875, -0.09452056884765625, -0.0753021240234375, -0.05608367919921875, -0.036865234375, -0.01764678955078125, 0.0015716552734375, 0.02079010009765625, 0.040008544921875, 0.05922698974609375, 0.0784454345703125, 0.09766387939453125, 0.11688232421875, 0.13610076904296875, 0.1553192138671875, 0.17453765869140625, 0.193756103515625, 0.21297454833984375, 0.2321929931640625, 0.25141143798828125, 0.2706298828125, 0.28984832763671875, 0.3090667724609375, 0.32828521728515625, 0.347503662109375, 0.36672210693359375, 0.3859405517578125, 0.40515899658203125, 0.42437744140625, 0.44359588623046875, 0.4628143310546875, 0.48203277587890625, 0.501251220703125, 0.5204696655273438, 0.5396881103515625, 0.5589065551757812, 0.578125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 3.0, 6.0, 2.0, 5.0, 6.0, 6.0, 9.0, 14.0, 29.0, 42.0, 74.0, 134.0, 177.0, 178.0, 107.0, 80.0, 47.0, 26.0, 16.0, 9.0, 6.0, 3.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.486328125, -0.4715843200683594, -0.45684051513671875, -0.4420967102050781, -0.4273529052734375, -0.4126091003417969, -0.39786529541015625, -0.3831214904785156, -0.368377685546875, -0.3536338806152344, -0.33889007568359375, -0.3241462707519531, -0.3094024658203125, -0.2946586608886719, -0.27991485595703125, -0.2651710510253906, -0.25042724609375, -0.23568344116210938, -0.22093963623046875, -0.20619583129882812, -0.1914520263671875, -0.17670822143554688, -0.16196441650390625, -0.14722061157226562, -0.132476806640625, -0.11773300170898438, -0.10298919677734375, -0.08824539184570312, -0.0735015869140625, -0.058757781982421875, -0.04401397705078125, -0.029270172119140625, -0.0145263671875, 0.000217437744140625, 0.01496124267578125, 0.029705047607421875, 0.0444488525390625, 0.059192657470703125, 0.07393646240234375, 0.08868026733398438, 0.103424072265625, 0.11816787719726562, 0.13291168212890625, 0.14765548706054688, 0.1623992919921875, 0.17714309692382812, 0.19188690185546875, 0.20663070678710938, 0.22137451171875, 0.23611831665039062, 0.25086212158203125, 0.2656059265136719, 0.2803497314453125, 0.2950935363769531, 0.30983734130859375, 0.3245811462402344, 0.339324951171875, 0.3540687561035156, 0.36881256103515625, 0.3835563659667969, 0.3983001708984375, 0.4130439758300781, 0.42778778076171875, 0.4425315856933594, 0.457275390625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 4.0, 7.0, 5.0, 32.0, 113.0, 239.0, 334.0, 171.0, 69.0, 20.0, 12.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.548263549804688, -9.185465812683105, -8.822668075561523, -8.459871292114258, -8.097073554992676, -7.734275817871094, -7.371478080749512, -7.008680820465088, -6.645883560180664, -6.283085823059082, -5.920288562774658, -5.557490825653076, -5.194693565368652, -4.83189582824707, -4.469098091125488, -4.1063008308410645, -3.7435030937194824, -3.3807055950164795, -3.0179080963134766, -2.6551103591918945, -2.2923130989074707, -1.9295154809951782, -1.5667178630828857, -1.2039203643798828, -0.8411228656768799, -0.47832533717155457, -0.11552780866622925, 0.24726974964141846, 0.6100672483444214, 0.9728647470474243, 1.3356623649597168, 1.6984598636627197, 2.0612573623657227, 2.4240548610687256, 2.7868523597717285, 3.1496500968933105, 3.5124473571777344, 3.8752450942993164, 4.238042831420898, 4.600840091705322, 4.963637351989746, 5.326435089111328, 5.689232349395752, 6.052030086517334, 6.414827346801758, 6.77762508392334, 7.140422821044922, 7.503220081329346, 7.866017818450928, 8.228815078735352, 8.591612815856934, 8.954410552978516, 9.317208290100098, 9.680005073547363, 10.042802810668945, 10.405600547790527, 10.76839828491211, 11.131196022033691, 11.493993759155273, 11.856790542602539, 12.219588279724121, 12.582386016845703, 12.945183753967285, 13.307981491088867, 13.670778274536133]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 7.0, 4.0, 7.0, 7.0, 12.0, 17.0, 16.0, 16.0, 25.0, 25.0, 34.0, 30.0, 39.0, 40.0, 39.0, 54.0, 46.0, 47.0, 61.0, 59.0, 43.0, 56.0, 52.0, 37.0, 44.0, 32.0, 31.0, 26.0, 23.0, 13.0, 14.0, 5.0, 14.0, 4.0, 11.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0359015464782715, -2.949129104614258, -2.862356424331665, -2.7755839824676514, -2.6888115406036377, -2.602038860321045, -2.5152664184570312, -2.4284939765930176, -2.341721296310425, -2.254948854446411, -2.1681761741638184, -2.0814037322998047, -1.9946311712265015, -1.9078586101531982, -1.8210861682891846, -1.7343136072158813, -1.6475411653518677, -1.5607686042785645, -1.4739961624145508, -1.3872236013412476, -1.3004510402679443, -1.2136785984039307, -1.1269060373306274, -1.0401334762573242, -0.9533609747886658, -0.8665884733200073, -0.7798159122467041, -0.6930434107780457, -0.6062709093093872, -0.519498348236084, -0.43272584676742554, -0.3459532856941223, -0.25918078422546387, -0.17240825295448303, -0.08563573658466339, 0.00113677978515625, 0.08790931105613708, 0.17468184232711792, 0.26145434379577637, 0.3482269048690796, 0.43499940633773804, 0.5217719078063965, 0.6085444688796997, 0.6953169703483582, 0.7820894718170166, 0.8688620328903198, 0.9556345343589783, 1.0424070358276367, 1.12917959690094, 1.2159521579742432, 1.3027245998382568, 1.38949716091156, 1.4762697219848633, 1.563042163848877, 1.6498147249221802, 1.7365872859954834, 1.823359727859497, 1.9101322889328003, 1.996904730796814, 2.083677291870117, 2.170449733734131, 2.2572224140167236, 2.3439948558807373, 2.43076753616333, 2.5175399780273438]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 3.0, 2.0, 6.0, 6.0, 6.0, 5.0, 8.0, 13.0, 7.0, 11.0, 16.0, 22.0, 17.0, 26.0, 38.0, 70.0, 71.0, 128.0, 242.0, 496.0, 1420.0, 6761.0, 71579.0, 3989565.0, 110789.0, 9486.0, 2028.0, 674.0, 309.0, 170.0, 88.0, 78.0, 42.0, 28.0, 19.0, 20.0, 10.0, 5.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0], "bins": [-3.2578125, -3.17547607421875, -3.0931396484375, -3.01080322265625, -2.928466796875, -2.84613037109375, -2.7637939453125, -2.68145751953125, -2.59912109375, -2.51678466796875, -2.4344482421875, -2.35211181640625, -2.269775390625, -2.18743896484375, -2.1051025390625, -2.02276611328125, -1.9404296875, -1.85809326171875, -1.7757568359375, -1.69342041015625, -1.611083984375, -1.52874755859375, -1.4464111328125, -1.36407470703125, -1.28173828125, -1.19940185546875, -1.1170654296875, -1.03472900390625, -0.952392578125, -0.87005615234375, -0.7877197265625, -0.70538330078125, -0.623046875, -0.54071044921875, -0.4583740234375, -0.37603759765625, -0.293701171875, -0.21136474609375, -0.1290283203125, -0.04669189453125, 0.03564453125, 0.11798095703125, 0.2003173828125, 0.28265380859375, 0.364990234375, 0.44732666015625, 0.5296630859375, 0.61199951171875, 0.6943359375, 0.77667236328125, 0.8590087890625, 0.94134521484375, 1.023681640625, 1.10601806640625, 1.1883544921875, 1.27069091796875, 1.35302734375, 1.43536376953125, 1.5177001953125, 1.60003662109375, 1.682373046875, 1.76470947265625, 1.8470458984375, 1.92938232421875, 2.01171875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 3.0, 10.0, 12.0, 16.0, 18.0, 26.0, 34.0, 41.0, 41.0, 43.0, 45.0, 50.0, 55.0, 80.0, 60.0, 54.0, 69.0, 46.0, 47.0, 47.0, 31.0, 33.0, 27.0, 23.0, 22.0, 19.0, 19.0, 12.0, 1.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08978271484375, -0.08627033233642578, -0.08275794982910156, -0.07924556732177734, -0.07573318481445312, -0.0722208023071289, -0.06870841979980469, -0.06519603729248047, -0.06168365478515625, -0.05817127227783203, -0.05465888977050781, -0.051146507263183594, -0.047634124755859375, -0.044121742248535156, -0.04060935974121094, -0.03709697723388672, -0.0335845947265625, -0.03007221221923828, -0.026559829711914062, -0.023047447204589844, -0.019535064697265625, -0.016022682189941406, -0.012510299682617188, -0.008997917175292969, -0.00548553466796875, -0.0019731521606445312, 0.0015392303466796875, 0.005051612854003906, 0.008563995361328125, 0.012076377868652344, 0.015588760375976562, 0.01910114288330078, 0.022613525390625, 0.02612590789794922, 0.029638290405273438, 0.033150672912597656, 0.036663055419921875, 0.040175437927246094, 0.04368782043457031, 0.04720020294189453, 0.05071258544921875, 0.05422496795654297, 0.05773735046386719, 0.061249732971191406, 0.06476211547851562, 0.06827449798583984, 0.07178688049316406, 0.07529926300048828, 0.0788116455078125, 0.08232402801513672, 0.08583641052246094, 0.08934879302978516, 0.09286117553710938, 0.0963735580444336, 0.09988594055175781, 0.10339832305908203, 0.10691070556640625, 0.11042308807373047, 0.11393547058105469, 0.1174478530883789, 0.12096023559570312, 0.12447261810302734, 0.12798500061035156, 0.13149738311767578, 0.135009765625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 8.0, 14.0, 22.0, 42.0, 101.0, 177.0, 442.0, 1090.0, 4229.0, 258600.0, 3920113.0, 7162.0, 1283.0, 514.0, 244.0, 106.0, 49.0, 38.0, 23.0, 13.0, 7.0, 4.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.69921875, -2.55810546875, -2.4169921875, -2.27587890625, -2.134765625, -1.99365234375, -1.8525390625, -1.71142578125, -1.5703125, -1.42919921875, -1.2880859375, -1.14697265625, -1.005859375, -0.86474609375, -0.7236328125, -0.58251953125, -0.44140625, -0.30029296875, -0.1591796875, -0.01806640625, 0.123046875, 0.26416015625, 0.4052734375, 0.54638671875, 0.6875, 0.82861328125, 0.9697265625, 1.11083984375, 1.251953125, 1.39306640625, 1.5341796875, 1.67529296875, 1.81640625, 1.95751953125, 2.0986328125, 2.23974609375, 2.380859375, 2.52197265625, 2.6630859375, 2.80419921875, 2.9453125, 3.08642578125, 3.2275390625, 3.36865234375, 3.509765625, 3.65087890625, 3.7919921875, 3.93310546875, 4.07421875, 4.21533203125, 4.3564453125, 4.49755859375, 4.638671875, 4.77978515625, 4.9208984375, 5.06201171875, 5.203125, 5.34423828125, 5.4853515625, 5.62646484375, 5.767578125, 5.90869140625, 6.0498046875, 6.19091796875, 6.33203125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 13.0, 34.0, 81.0, 366.0, 2830.0, 558.0, 132.0, 36.0, 12.0, 10.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52294921875, -0.49877166748046875, -0.4745941162109375, -0.45041656494140625, -0.426239013671875, -0.40206146240234375, -0.3778839111328125, -0.35370635986328125, -0.32952880859375, -0.30535125732421875, -0.2811737060546875, -0.25699615478515625, -0.232818603515625, -0.20864105224609375, -0.1844635009765625, -0.16028594970703125, -0.1361083984375, -0.11193084716796875, -0.0877532958984375, -0.06357574462890625, -0.039398193359375, -0.01522064208984375, 0.0089569091796875, 0.03313446044921875, 0.05731201171875, 0.08148956298828125, 0.1056671142578125, 0.12984466552734375, 0.154022216796875, 0.17819976806640625, 0.2023773193359375, 0.22655487060546875, 0.250732421875, 0.27490997314453125, 0.2990875244140625, 0.32326507568359375, 0.347442626953125, 0.37162017822265625, 0.3957977294921875, 0.41997528076171875, 0.44415283203125, 0.46833038330078125, 0.4925079345703125, 0.5166854858398438, 0.540863037109375, 0.5650405883789062, 0.5892181396484375, 0.6133956909179688, 0.6375732421875, 0.6617507934570312, 0.6859283447265625, 0.7101058959960938, 0.734283447265625, 0.7584609985351562, 0.7826385498046875, 0.8068161010742188, 0.83099365234375, 0.8551712036132812, 0.8793487548828125, 0.9035263061523438, 0.927703857421875, 0.9518814086914062, 0.9760589599609375, 1.0002365112304688, 1.0244140625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 11.0, 54.0, 303.0, 467.0, 119.0, 33.0, 7.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.450301647186279, -5.225833892822266, -5.00136661529541, -4.776899337768555, -4.552431583404541, -4.327963829040527, -4.103496551513672, -3.8790290355682373, -3.6545615196228027, -3.430094003677368, -3.2056264877319336, -2.981158971786499, -2.7566914558410645, -2.53222393989563, -2.3077564239501953, -2.0832889080047607, -1.8588213920593262, -1.6343538761138916, -1.409886360168457, -1.1854188442230225, -0.9609513282775879, -0.7364838123321533, -0.5120162963867188, -0.2875487804412842, -0.06308126449584961, 0.16138625144958496, 0.38585376739501953, 0.6103212833404541, 0.8347887992858887, 1.0592563152313232, 1.2837238311767578, 1.5081913471221924, 1.7326583862304688, 1.9571259021759033, 2.181593418121338, 2.4060609340667725, 2.630528450012207, 2.8549959659576416, 3.079463481903076, 3.3039309978485107, 3.5283985137939453, 3.75286602973938, 3.9773335456848145, 4.201801300048828, 4.426268577575684, 4.650735855102539, 4.875203609466553, 5.099671363830566, 5.324138641357422, 5.548605918884277, 5.773073673248291, 5.997541427612305, 6.22200870513916, 6.446475982666016, 6.670943737030029, 6.895411491394043, 7.119878768920898, 7.344346046447754, 7.568813800811768, 7.793281555175781, 8.017748832702637, 8.242216110229492, 8.466684341430664, 8.69115161895752, 8.915618896484375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 7.0, 4.0, 6.0, 15.0, 18.0, 13.0, 37.0, 40.0, 43.0, 49.0, 65.0, 74.0, 85.0, 69.0, 73.0, 64.0, 59.0, 60.0, 47.0, 39.0, 45.0, 35.0, 25.0, 11.0, 9.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.6858141422271729, -1.6417864561080933, -1.5977587699890137, -1.5537312030792236, -1.509703516960144, -1.4656758308410645, -1.4216482639312744, -1.3776205778121948, -1.3335928916931152, -1.2895652055740356, -1.245537519454956, -1.201509952545166, -1.1574822664260864, -1.1134545803070068, -1.0694270133972168, -1.0253993272781372, -0.9813716411590576, -0.937343955039978, -0.8933163285255432, -0.8492887020111084, -0.8052610158920288, -0.7612333297729492, -0.7172057032585144, -0.6731780767440796, -0.629150390625, -0.5851227045059204, -0.5410950779914856, -0.4970674216747284, -0.4530397653579712, -0.409012109041214, -0.3649844527244568, -0.3209567964076996, -0.27692925930023193, -0.23290160298347473, -0.18887394666671753, -0.14484629034996033, -0.10081863403320312, -0.05679097771644592, -0.01276332139968872, 0.03126433491706848, 0.07529199123382568, 0.11931964755058289, 0.1633473038673401, 0.2073749601840973, 0.2514026165008545, 0.2954302728176117, 0.3394579291343689, 0.3834855854511261, 0.4275132417678833, 0.4715408980846405, 0.5155685544013977, 0.5595961809158325, 0.6036238670349121, 0.6476515531539917, 0.6916791796684265, 0.7357068061828613, 0.7797344923019409, 0.8237621784210205, 0.8677898049354553, 0.9118174314498901, 0.9558451175689697, 0.9998728036880493, 1.043900489807129, 1.087928056716919, 1.1319557428359985]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 8.0, 2.0, 3.0, 7.0, 10.0, 8.0, 15.0, 13.0, 18.0, 30.0, 27.0, 37.0, 47.0, 83.0, 129.0, 205.0, 312.0, 642.0, 1413.0, 4215.0, 21046.0, 220978.0, 703656.0, 80267.0, 10441.0, 2671.0, 990.0, 481.0, 298.0, 165.0, 88.0, 64.0, 42.0, 34.0, 23.0, 27.0, 15.0, 12.0, 9.0, 3.0, 8.0, 1.0, 4.0, 3.0, 5.0, 4.0, 2.0, 1.0, 4.0], "bins": [-2.46875, -2.4025726318359375, -2.336395263671875, -2.2702178955078125, -2.20404052734375, -2.1378631591796875, -2.071685791015625, -2.0055084228515625, -1.9393310546875, -1.8731536865234375, -1.806976318359375, -1.7407989501953125, -1.67462158203125, -1.6084442138671875, -1.542266845703125, -1.4760894775390625, -1.409912109375, -1.3437347412109375, -1.277557373046875, -1.2113800048828125, -1.14520263671875, -1.0790252685546875, -1.012847900390625, -0.9466705322265625, -0.8804931640625, -0.8143157958984375, -0.748138427734375, -0.6819610595703125, -0.61578369140625, -0.5496063232421875, -0.483428955078125, -0.4172515869140625, -0.35107421875, -0.2848968505859375, -0.218719482421875, -0.1525421142578125, -0.08636474609375, -0.0201873779296875, 0.045989990234375, 0.1121673583984375, 0.1783447265625, 0.2445220947265625, 0.310699462890625, 0.3768768310546875, 0.44305419921875, 0.5092315673828125, 0.575408935546875, 0.6415863037109375, 0.707763671875, 0.7739410400390625, 0.840118408203125, 0.9062957763671875, 0.97247314453125, 1.0386505126953125, 1.104827880859375, 1.1710052490234375, 1.2371826171875, 1.3033599853515625, 1.369537353515625, 1.4357147216796875, 1.50189208984375, 1.5680694580078125, 1.634246826171875, 1.7004241943359375, 1.7666015625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 6.0, 4.0, 7.0, 19.0, 10.0, 22.0, 24.0, 38.0, 37.0, 54.0, 51.0, 62.0, 59.0, 65.0, 80.0, 66.0, 66.0, 49.0, 58.0, 56.0, 44.0, 32.0, 27.0, 20.0, 12.0, 8.0, 11.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.12237548828125, -0.1180868148803711, -0.11379814147949219, -0.10950946807861328, -0.10522079467773438, -0.10093212127685547, -0.09664344787597656, -0.09235477447509766, -0.08806610107421875, -0.08377742767333984, -0.07948875427246094, -0.07520008087158203, -0.07091140747070312, -0.06662273406982422, -0.06233406066894531, -0.058045387268066406, -0.0537567138671875, -0.049468040466308594, -0.04517936706542969, -0.04089069366455078, -0.036602020263671875, -0.03231334686279297, -0.028024673461914062, -0.023736000061035156, -0.01944732666015625, -0.015158653259277344, -0.010869979858398438, -0.006581306457519531, -0.002292633056640625, 0.0019960403442382812, 0.0062847137451171875, 0.010573387145996094, 0.014862060546875, 0.019150733947753906, 0.023439407348632812, 0.02772808074951172, 0.032016754150390625, 0.03630542755126953, 0.04059410095214844, 0.044882774353027344, 0.04917144775390625, 0.053460121154785156, 0.05774879455566406, 0.06203746795654297, 0.06632614135742188, 0.07061481475830078, 0.07490348815917969, 0.0791921615600586, 0.0834808349609375, 0.0877695083618164, 0.09205818176269531, 0.09634685516357422, 0.10063552856445312, 0.10492420196533203, 0.10921287536621094, 0.11350154876708984, 0.11779022216796875, 0.12207889556884766, 0.12636756896972656, 0.13065624237060547, 0.13494491577148438, 0.13923358917236328, 0.1435222625732422, 0.1478109359741211, 0.152099609375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 9.0, 5.0, 7.0, 4.0, 15.0, 19.0, 29.0, 47.0, 91.0, 152.0, 235.0, 432.0, 955.0, 2315.0, 6706.0, 28079.0, 237433.0, 653549.0, 95982.0, 14980.0, 4244.0, 1643.0, 727.0, 379.0, 197.0, 117.0, 58.0, 44.0, 35.0, 18.0, 10.0, 8.0, 11.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.337890625, -1.2888946533203125, -1.239898681640625, -1.1909027099609375, -1.14190673828125, -1.0929107666015625, -1.043914794921875, -0.9949188232421875, -0.9459228515625, -0.8969268798828125, -0.847930908203125, -0.7989349365234375, -0.74993896484375, -0.7009429931640625, -0.651947021484375, -0.6029510498046875, -0.553955078125, -0.5049591064453125, -0.455963134765625, -0.4069671630859375, -0.35797119140625, -0.3089752197265625, -0.259979248046875, -0.2109832763671875, -0.1619873046875, -0.1129913330078125, -0.063995361328125, -0.0149993896484375, 0.03399658203125, 0.0829925537109375, 0.131988525390625, 0.1809844970703125, 0.22998046875, 0.2789764404296875, 0.327972412109375, 0.3769683837890625, 0.42596435546875, 0.4749603271484375, 0.523956298828125, 0.5729522705078125, 0.6219482421875, 0.6709442138671875, 0.719940185546875, 0.7689361572265625, 0.81793212890625, 0.8669281005859375, 0.915924072265625, 0.9649200439453125, 1.013916015625, 1.0629119873046875, 1.111907958984375, 1.1609039306640625, 1.20989990234375, 1.2588958740234375, 1.307891845703125, 1.3568878173828125, 1.4058837890625, 1.4548797607421875, 1.503875732421875, 1.5528717041015625, 1.60186767578125, 1.6508636474609375, 1.699859619140625, 1.7488555908203125, 1.7978515625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 5.0, 6.0, 2.0, 7.0, 5.0, 7.0, 5.0, 7.0, 15.0, 19.0, 14.0, 24.0, 30.0, 36.0, 44.0, 36.0, 49.0, 46.0, 54.0, 44.0, 55.0, 64.0, 49.0, 38.0, 56.0, 34.0, 46.0, 39.0, 29.0, 27.0, 20.0, 22.0, 15.0, 16.0, 9.0, 7.0, 7.0, 6.0, 1.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.418212890625, -0.4025154113769531, -0.38681793212890625, -0.3711204528808594, -0.3554229736328125, -0.3397254943847656, -0.32402801513671875, -0.3083305358886719, -0.292633056640625, -0.2769355773925781, -0.26123809814453125, -0.24554061889648438, -0.2298431396484375, -0.21414566040039062, -0.19844818115234375, -0.18275070190429688, -0.16705322265625, -0.15135574340820312, -0.13565826416015625, -0.11996078491210938, -0.1042633056640625, -0.08856582641601562, -0.07286834716796875, -0.057170867919921875, -0.041473388671875, -0.025775909423828125, -0.01007843017578125, 0.005619049072265625, 0.0213165283203125, 0.037014007568359375, 0.05271148681640625, 0.06840896606445312, 0.0841064453125, 0.09980392456054688, 0.11550140380859375, 0.13119888305664062, 0.1468963623046875, 0.16259384155273438, 0.17829132080078125, 0.19398880004882812, 0.209686279296875, 0.22538375854492188, 0.24108123779296875, 0.2567787170410156, 0.2724761962890625, 0.2881736755371094, 0.30387115478515625, 0.3195686340332031, 0.33526611328125, 0.3509635925292969, 0.36666107177734375, 0.3823585510253906, 0.3980560302734375, 0.4137535095214844, 0.42945098876953125, 0.4451484680175781, 0.460845947265625, 0.4765434265136719, 0.49224090576171875, 0.5079383850097656, 0.5236358642578125, 0.5393333435058594, 0.5550308227539062, 0.5707283020019531, 0.58642578125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 2.0, 4.0, 3.0, 11.0, 11.0, 22.0, 32.0, 50.0, 78.0, 136.0, 250.0, 390.0, 862.0, 2150.0, 7145.0, 38538.0, 397778.0, 535842.0, 51817.0, 8930.0, 2481.0, 932.0, 453.0, 226.0, 138.0, 85.0, 53.0, 27.0, 22.0, 26.0, 15.0, 11.0, 8.0, 3.0, 3.0, 5.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.68212890625, -0.662109375, -0.64208984375, -0.6220703125, -0.60205078125, -0.58203125, -0.56201171875, -0.5419921875, -0.52197265625, -0.501953125, -0.48193359375, -0.4619140625, -0.44189453125, -0.421875, -0.40185546875, -0.3818359375, -0.36181640625, -0.341796875, -0.32177734375, -0.3017578125, -0.28173828125, -0.26171875, -0.24169921875, -0.2216796875, -0.20166015625, -0.181640625, -0.16162109375, -0.1416015625, -0.12158203125, -0.1015625, -0.08154296875, -0.0615234375, -0.04150390625, -0.021484375, -0.00146484375, 0.0185546875, 0.03857421875, 0.05859375, 0.07861328125, 0.0986328125, 0.11865234375, 0.138671875, 0.15869140625, 0.1787109375, 0.19873046875, 0.21875, 0.23876953125, 0.2587890625, 0.27880859375, 0.298828125, 0.31884765625, 0.3388671875, 0.35888671875, 0.37890625, 0.39892578125, 0.4189453125, 0.43896484375, 0.458984375, 0.47900390625, 0.4990234375, 0.51904296875, 0.5390625, 0.55908203125, 0.5791015625, 0.59912109375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 10.0, 7.0, 15.0, 11.0, 19.0, 18.0, 54.0, 49.0, 82.0, 110.0, 126.0, 112.0, 106.0, 87.0, 50.0, 34.0, 25.0, 24.0, 17.0, 11.0, 8.0, 4.0, 1.0, 5.0, 3.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.970499038696289e-05, -8.610356599092484e-05, -8.250214159488678e-05, -7.890071719884872e-05, -7.529929280281067e-05, -7.169786840677261e-05, -6.809644401073456e-05, -6.44950196146965e-05, -6.089359521865845e-05, -5.729217082262039e-05, -5.3690746426582336e-05, -5.008932203054428e-05, -4.6487897634506226e-05, -4.288647323846817e-05, -3.9285048842430115e-05, -3.568362444639206e-05, -3.2082200050354004e-05, -2.848077565431595e-05, -2.4879351258277893e-05, -2.1277926862239838e-05, -1.7676502466201782e-05, -1.4075078070163727e-05, -1.0473653674125671e-05, -6.872229278087616e-06, -3.2708048820495605e-06, 3.3061951398849487e-07, 3.93204391002655e-06, 7.533468306064606e-06, 1.1134892702102661e-05, 1.4736317098140717e-05, 1.8337741494178772e-05, 2.1939165890216827e-05, 2.5540590286254883e-05, 2.9142014682292938e-05, 3.2743439078330994e-05, 3.634486347436905e-05, 3.9946287870407104e-05, 4.354771226644516e-05, 4.7149136662483215e-05, 5.075056105852127e-05, 5.4351985454559326e-05, 5.795340985059738e-05, 6.155483424663544e-05, 6.515625864267349e-05, 6.875768303871155e-05, 7.23591074347496e-05, 7.596053183078766e-05, 7.956195622682571e-05, 8.316338062286377e-05, 8.676480501890182e-05, 9.036622941493988e-05, 9.396765381097794e-05, 9.756907820701599e-05, 0.00010117050260305405, 0.0001047719269990921, 0.00010837335139513016, 0.00011197477579116821, 0.00011557620018720627, 0.00011917762458324432, 0.00012277904897928238, 0.00012638047337532043, 0.0001299818977713585, 0.00013358332216739655, 0.0001371847465634346, 0.00014078617095947266]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 6.0, 11.0, 17.0, 25.0, 25.0, 33.0, 64.0, 112.0, 168.0, 322.0, 567.0, 1201.0, 2762.0, 7178.0, 23697.0, 115303.0, 580359.0, 255268.0, 42346.0, 11530.0, 4090.0, 1732.0, 805.0, 366.0, 213.0, 122.0, 75.0, 50.0, 37.0, 19.0, 12.0, 10.0, 9.0, 6.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36376953125, -0.35109710693359375, -0.3384246826171875, -0.32575225830078125, -0.313079833984375, -0.30040740966796875, -0.2877349853515625, -0.27506256103515625, -0.26239013671875, -0.24971771240234375, -0.2370452880859375, -0.22437286376953125, -0.211700439453125, -0.19902801513671875, -0.1863555908203125, -0.17368316650390625, -0.1610107421875, -0.14833831787109375, -0.1356658935546875, -0.12299346923828125, -0.110321044921875, -0.09764862060546875, -0.0849761962890625, -0.07230377197265625, -0.05963134765625, -0.04695892333984375, -0.0342864990234375, -0.02161407470703125, -0.008941650390625, 0.00373077392578125, 0.0164031982421875, 0.02907562255859375, 0.041748046875, 0.05442047119140625, 0.0670928955078125, 0.07976531982421875, 0.092437744140625, 0.10511016845703125, 0.1177825927734375, 0.13045501708984375, 0.14312744140625, 0.15579986572265625, 0.1684722900390625, 0.18114471435546875, 0.193817138671875, 0.20648956298828125, 0.2191619873046875, 0.23183441162109375, 0.2445068359375, 0.25717926025390625, 0.2698516845703125, 0.28252410888671875, 0.295196533203125, 0.30786895751953125, 0.3205413818359375, 0.33321380615234375, 0.34588623046875, 0.35855865478515625, 0.3712310791015625, 0.38390350341796875, 0.396575927734375, 0.40924835205078125, 0.4219207763671875, 0.43459320068359375, 0.447265625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 9.0, 8.0, 9.0, 14.0, 20.0, 25.0, 37.0, 27.0, 28.0, 62.0, 52.0, 73.0, 78.0, 80.0, 80.0, 61.0, 49.0, 52.0, 46.0, 20.0, 30.0, 33.0, 20.0, 19.0, 18.0, 10.0, 5.0, 3.0, 4.0, 5.0, 6.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.2218017578125, -0.2152538299560547, -0.20870590209960938, -0.20215797424316406, -0.19561004638671875, -0.18906211853027344, -0.18251419067382812, -0.1759662628173828, -0.1694183349609375, -0.1628704071044922, -0.15632247924804688, -0.14977455139160156, -0.14322662353515625, -0.13667869567871094, -0.13013076782226562, -0.12358283996582031, -0.117034912109375, -0.11048698425292969, -0.10393905639648438, -0.09739112854003906, -0.09084320068359375, -0.08429527282714844, -0.07774734497070312, -0.07119941711425781, -0.0646514892578125, -0.05810356140136719, -0.051555633544921875, -0.04500770568847656, -0.03845977783203125, -0.03191184997558594, -0.025363922119140625, -0.018815994262695312, -0.01226806640625, -0.0057201385498046875, 0.000827789306640625, 0.0073757171630859375, 0.01392364501953125, 0.020471572875976562, 0.027019500732421875, 0.03356742858886719, 0.0401153564453125, 0.04666328430175781, 0.053211212158203125, 0.05975914001464844, 0.06630706787109375, 0.07285499572753906, 0.07940292358398438, 0.08595085144042969, 0.092498779296875, 0.09904670715332031, 0.10559463500976562, 0.11214256286621094, 0.11869049072265625, 0.12523841857910156, 0.13178634643554688, 0.1383342742919922, 0.1448822021484375, 0.1514301300048828, 0.15797805786132812, 0.16452598571777344, 0.17107391357421875, 0.17762184143066406, 0.18416976928710938, 0.1907176971435547, 0.197265625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 7.0, 7.0, 42.0, 71.0, 222.0, 307.0, 208.0, 88.0, 34.0, 12.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.069975852966309, -8.64826774597168, -8.226558685302734, -7.8048505783081055, -7.38314151763916, -6.961433410644531, -6.539724826812744, -6.118016242980957, -5.69630765914917, -5.274599075317383, -4.852890491485596, -4.431181907653809, -4.00947380065918, -3.5877649784088135, -3.1660566329956055, -2.7443480491638184, -2.3226394653320312, -1.9009308815002441, -1.4792224168777466, -1.057513952255249, -0.6358053684234619, -0.2140967845916748, 0.2076115608215332, 0.6293201446533203, 1.0510287284851074, 1.4727373123168945, 1.894445776939392, 2.3161542415618896, 2.7378628253936768, 3.159571409225464, 3.581279754638672, 4.002988338470459, 4.42469596862793, 4.846404552459717, 5.268113136291504, 5.689821243286133, 6.111530303955078, 6.533238410949707, 6.954946994781494, 7.376655578613281, 7.798364162445068, 8.220072746276855, 8.641780853271484, 9.06348991394043, 9.485198020935059, 9.906907081604004, 10.328615188598633, 10.750324249267578, 11.172032356262207, 11.593740463256836, 12.015449523925781, 12.43715763092041, 12.858866691589355, 13.280574798583984, 13.70228385925293, 14.123991966247559, 14.545700073242188, 14.967408180236816, 15.389117240905762, 15.81082534790039, 16.232534408569336, 16.65424346923828, 17.075950622558594, 17.49765968322754, 17.919368743896484]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 9.0, 6.0, 12.0, 11.0, 15.0, 26.0, 36.0, 46.0, 45.0, 32.0, 50.0, 58.0, 62.0, 67.0, 57.0, 70.0, 53.0, 69.0, 46.0, 40.0, 40.0, 27.0, 27.0, 26.0, 26.0, 11.0, 13.0, 12.0, 1.0, 2.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.658356666564941, -4.537021160125732, -4.415685176849365, -4.294349670410156, -4.173013687133789, -4.05167818069458, -3.930342435836792, -3.809006690979004, -3.687670946121216, -3.5663352012634277, -3.4449994564056396, -3.3236637115478516, -3.2023282051086426, -3.0809924602508545, -2.9596567153930664, -2.8383209705352783, -2.7169852256774902, -2.595649480819702, -2.474313735961914, -2.352978229522705, -2.231642484664917, -2.110306739807129, -1.9889709949493408, -1.8676352500915527, -1.7462997436523438, -1.6249639987945557, -1.5036283731460571, -1.382292628288269, -1.260956883430481, -1.1396212577819824, -1.0182855129241943, -0.8969497680664062, -0.7756140232086182, -0.6542783379554749, -0.5329425930976868, -0.41160690784454346, -0.29027119278907776, -0.16893547773361206, -0.04759979248046875, 0.07373595237731934, 0.19507163763046265, 0.31640735268592834, 0.43774306774139404, 0.5590787529945374, 0.6804144382476807, 0.8017501831054688, 0.9230858683586121, 1.044421672821045, 1.1657572984695435, 1.2870930433273315, 1.40842866897583, 1.5297644138336182, 1.6511001586914062, 1.7724359035491943, 1.8937715291976929, 2.0151071548461914, 2.1364428997039795, 2.2577786445617676, 2.3791143894195557, 2.5004501342773438, 2.6217856407165527, 2.743121385574341, 2.864457130432129, 2.985792875289917, 3.107128620147705]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 3.0, 3.0, 2.0, 4.0, 7.0, 9.0, 2.0, 10.0, 10.0, 15.0, 17.0, 28.0, 34.0, 32.0, 40.0, 54.0, 83.0, 147.0, 244.0, 624.0, 1643.0, 7369.0, 67802.0, 3816608.0, 275915.0, 18254.0, 3367.0, 1021.0, 419.0, 212.0, 124.0, 68.0, 37.0, 25.0, 18.0, 13.0, 7.0, 8.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.27734375, -3.19482421875, -3.1123046875, -3.02978515625, -2.947265625, -2.86474609375, -2.7822265625, -2.69970703125, -2.6171875, -2.53466796875, -2.4521484375, -2.36962890625, -2.287109375, -2.20458984375, -2.1220703125, -2.03955078125, -1.95703125, -1.87451171875, -1.7919921875, -1.70947265625, -1.626953125, -1.54443359375, -1.4619140625, -1.37939453125, -1.296875, -1.21435546875, -1.1318359375, -1.04931640625, -0.966796875, -0.88427734375, -0.8017578125, -0.71923828125, -0.63671875, -0.55419921875, -0.4716796875, -0.38916015625, -0.306640625, -0.22412109375, -0.1416015625, -0.05908203125, 0.0234375, 0.10595703125, 0.1884765625, 0.27099609375, 0.353515625, 0.43603515625, 0.5185546875, 0.60107421875, 0.68359375, 0.76611328125, 0.8486328125, 0.93115234375, 1.013671875, 1.09619140625, 1.1787109375, 1.26123046875, 1.34375, 1.42626953125, 1.5087890625, 1.59130859375, 1.673828125, 1.75634765625, 1.8388671875, 1.92138671875, 2.00390625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 8.0, 13.0, 7.0, 16.0, 16.0, 24.0, 19.0, 29.0, 40.0, 41.0, 49.0, 61.0, 61.0, 51.0, 58.0, 72.0, 62.0, 48.0, 56.0, 39.0, 46.0, 41.0, 34.0, 21.0, 19.0, 20.0, 12.0, 9.0, 7.0, 8.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1290283203125, -0.12499237060546875, -0.1209564208984375, -0.11692047119140625, -0.112884521484375, -0.10884857177734375, -0.1048126220703125, -0.10077667236328125, -0.09674072265625, -0.09270477294921875, -0.0886688232421875, -0.08463287353515625, -0.080596923828125, -0.07656097412109375, -0.0725250244140625, -0.06848907470703125, -0.064453125, -0.06041717529296875, -0.0563812255859375, -0.05234527587890625, -0.048309326171875, -0.04427337646484375, -0.0402374267578125, -0.03620147705078125, -0.03216552734375, -0.02812957763671875, -0.0240936279296875, -0.02005767822265625, -0.016021728515625, -0.01198577880859375, -0.0079498291015625, -0.00391387939453125, 0.0001220703125, 0.00415802001953125, 0.0081939697265625, 0.01222991943359375, 0.016265869140625, 0.02030181884765625, 0.0243377685546875, 0.02837371826171875, 0.03240966796875, 0.03644561767578125, 0.0404815673828125, 0.04451751708984375, 0.048553466796875, 0.05258941650390625, 0.0566253662109375, 0.06066131591796875, 0.064697265625, 0.06873321533203125, 0.0727691650390625, 0.07680511474609375, 0.080841064453125, 0.08487701416015625, 0.0889129638671875, 0.09294891357421875, 0.09698486328125, 0.10102081298828125, 0.1050567626953125, 0.10909271240234375, 0.113128662109375, 0.11716461181640625, 0.1212005615234375, 0.12523651123046875, 0.1292724609375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 7.0, 9.0, 18.0, 24.0, 32.0, 77.0, 158.0, 411.0, 1338.0, 6758.0, 300493.0, 3872501.0, 9677.0, 1783.0, 551.0, 184.0, 97.0, 48.0, 38.0, 26.0, 21.0, 11.0, 16.0, 6.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.72265625, -4.52679443359375, -4.3309326171875, -4.13507080078125, -3.939208984375, -3.74334716796875, -3.5474853515625, -3.35162353515625, -3.15576171875, -2.95989990234375, -2.7640380859375, -2.56817626953125, -2.372314453125, -2.17645263671875, -1.9805908203125, -1.78472900390625, -1.5888671875, -1.39300537109375, -1.1971435546875, -1.00128173828125, -0.805419921875, -0.60955810546875, -0.4136962890625, -0.21783447265625, -0.02197265625, 0.17388916015625, 0.3697509765625, 0.56561279296875, 0.761474609375, 0.95733642578125, 1.1531982421875, 1.34906005859375, 1.544921875, 1.74078369140625, 1.9366455078125, 2.13250732421875, 2.328369140625, 2.52423095703125, 2.7200927734375, 2.91595458984375, 3.11181640625, 3.30767822265625, 3.5035400390625, 3.69940185546875, 3.895263671875, 4.09112548828125, 4.2869873046875, 4.48284912109375, 4.6787109375, 4.87457275390625, 5.0704345703125, 5.26629638671875, 5.462158203125, 5.65802001953125, 5.8538818359375, 6.04974365234375, 6.24560546875, 6.44146728515625, 6.6373291015625, 6.83319091796875, 7.029052734375, 7.22491455078125, 7.4207763671875, 7.61663818359375, 7.8125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 7.0, 6.0, 5.0, 8.0, 6.0, 14.0, 21.0, 20.0, 41.0, 62.0, 112.0, 226.0, 504.0, 1623.0, 791.0, 313.0, 122.0, 85.0, 42.0, 19.0, 17.0, 10.0, 7.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.49951171875, -0.48211669921875, -0.4647216796875, -0.44732666015625, -0.429931640625, -0.41253662109375, -0.3951416015625, -0.37774658203125, -0.3603515625, -0.34295654296875, -0.3255615234375, -0.30816650390625, -0.290771484375, -0.27337646484375, -0.2559814453125, -0.23858642578125, -0.22119140625, -0.20379638671875, -0.1864013671875, -0.16900634765625, -0.151611328125, -0.13421630859375, -0.1168212890625, -0.09942626953125, -0.08203125, -0.06463623046875, -0.0472412109375, -0.02984619140625, -0.012451171875, 0.00494384765625, 0.0223388671875, 0.03973388671875, 0.05712890625, 0.07452392578125, 0.0919189453125, 0.10931396484375, 0.126708984375, 0.14410400390625, 0.1614990234375, 0.17889404296875, 0.1962890625, 0.21368408203125, 0.2310791015625, 0.24847412109375, 0.265869140625, 0.28326416015625, 0.3006591796875, 0.31805419921875, 0.33544921875, 0.35284423828125, 0.3702392578125, 0.38763427734375, 0.405029296875, 0.42242431640625, 0.4398193359375, 0.45721435546875, 0.474609375, 0.49200439453125, 0.5093994140625, 0.52679443359375, 0.544189453125, 0.56158447265625, 0.5789794921875, 0.59637451171875, 0.61376953125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 9.0, 5.0, 20.0, 44.0, 137.0, 304.0, 322.0, 97.0, 33.0, 18.0, 8.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.602534294128418, -14.303973197937012, -14.005412101745605, -13.706851959228516, -13.40829086303711, -13.109729766845703, -12.811168670654297, -12.51260757446289, -12.214046478271484, -11.915485382080078, -11.616924285888672, -11.318364143371582, -11.019803047180176, -10.72124195098877, -10.422680854797363, -10.124119758605957, -9.825559616088867, -9.526998519897461, -9.228437423706055, -8.929877281188965, -8.631316184997559, -8.332755088806152, -8.034193992614746, -7.73563289642334, -7.437072277069092, -7.1385111808776855, -6.8399505615234375, -6.541389465332031, -6.242828369140625, -5.944267749786377, -5.645706653594971, -5.347146034240723, -5.048583984375, -4.750022888183594, -4.451462268829346, -4.1529011726379395, -3.8543403148651123, -3.555779457092285, -3.257218360900879, -2.9586575031280518, -2.6600966453552246, -2.3615357875823975, -2.0629749298095703, -1.764413833618164, -1.465852975845337, -1.1672921180725098, -0.8687311410903931, -0.5701701641082764, -0.2716093063354492, 0.026951611042022705, 0.32551252841949463, 0.6240734457969666, 0.9226343631744385, 1.2211952209472656, 1.5197561979293823, 1.818317174911499, 2.116878032684326, 2.4154388904571533, 2.7139997482299805, 3.0125608444213867, 3.311121702194214, 3.609682559967041, 3.9082436561584473, 4.206804275512695, 4.505365371704102]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 6.0, 11.0, 21.0, 11.0, 24.0, 44.0, 49.0, 42.0, 65.0, 50.0, 77.0, 65.0, 62.0, 73.0, 64.0, 63.0, 54.0, 51.0, 50.0, 39.0, 26.0, 15.0, 10.0, 7.0, 9.0, 2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.830462694168091, -2.7550129890441895, -2.679563522338867, -2.604114055633545, -2.5286643505096436, -2.453214645385742, -2.37776517868042, -2.3023157119750977, -2.2268660068511963, -2.151416301727295, -2.0759668350219727, -2.0005173683166504, -1.925067663192749, -1.8496180772781372, -1.7741684913635254, -1.6987189054489136, -1.6232693195343018, -1.54781973361969, -1.4723701477050781, -1.3969205617904663, -1.3214709758758545, -1.2460213899612427, -1.1705718040466309, -1.095122218132019, -1.0196726322174072, -0.9442230463027954, -0.8687734603881836, -0.7933238744735718, -0.71787428855896, -0.6424247026443481, -0.5669751167297363, -0.4915255308151245, -0.4160761833190918, -0.34062659740448, -0.26517701148986816, -0.18972742557525635, -0.11427783966064453, -0.038828253746032715, 0.0366213321685791, 0.11207091808319092, 0.18752050399780273, 0.26297008991241455, 0.33841967582702637, 0.4138692617416382, 0.48931884765625, 0.5647684335708618, 0.6402180194854736, 0.7156676054000854, 0.7911171913146973, 0.8665667772293091, 0.9420163631439209, 1.0174659490585327, 1.0929155349731445, 1.1683651208877563, 1.2438147068023682, 1.31926429271698, 1.3947138786315918, 1.4701634645462036, 1.5456130504608154, 1.6210626363754272, 1.696512222290039, 1.7719618082046509, 1.8474113941192627, 1.9228609800338745, 1.9983105659484863]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 3.0, 7.0, 10.0, 10.0, 20.0, 17.0, 23.0, 34.0, 40.0, 64.0, 84.0, 137.0, 156.0, 254.0, 390.0, 759.0, 1761.0, 7435.0, 65520.0, 681039.0, 264118.0, 20496.0, 3435.0, 1140.0, 553.0, 324.0, 200.0, 138.0, 91.0, 86.0, 53.0, 46.0, 25.0, 18.0, 18.0, 14.0, 12.0, 9.0, 6.0, 4.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.3203125, -2.249481201171875, -2.17864990234375, -2.107818603515625, -2.0369873046875, -1.966156005859375, -1.89532470703125, -1.824493408203125, -1.753662109375, -1.682830810546875, -1.61199951171875, -1.541168212890625, -1.4703369140625, -1.399505615234375, -1.32867431640625, -1.257843017578125, -1.18701171875, -1.116180419921875, -1.04534912109375, -0.974517822265625, -0.9036865234375, -0.832855224609375, -0.76202392578125, -0.691192626953125, -0.620361328125, -0.549530029296875, -0.47869873046875, -0.407867431640625, -0.3370361328125, -0.266204833984375, -0.19537353515625, -0.124542236328125, -0.0537109375, 0.017120361328125, 0.08795166015625, 0.158782958984375, 0.2296142578125, 0.300445556640625, 0.37127685546875, 0.442108154296875, 0.512939453125, 0.583770751953125, 0.65460205078125, 0.725433349609375, 0.7962646484375, 0.867095947265625, 0.93792724609375, 1.008758544921875, 1.07958984375, 1.150421142578125, 1.22125244140625, 1.292083740234375, 1.3629150390625, 1.433746337890625, 1.50457763671875, 1.575408935546875, 1.646240234375, 1.717071533203125, 1.78790283203125, 1.858734130859375, 1.9295654296875, 2.000396728515625, 2.07122802734375, 2.142059326171875, 2.212890625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 5.0, 6.0, 6.0, 11.0, 21.0, 14.0, 27.0, 40.0, 65.0, 67.0, 95.0, 95.0, 88.0, 88.0, 97.0, 69.0, 57.0, 38.0, 32.0, 32.0, 20.0, 15.0, 10.0, 8.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.263671875, -0.257354736328125, -0.25103759765625, -0.244720458984375, -0.2384033203125, -0.232086181640625, -0.22576904296875, -0.219451904296875, -0.213134765625, -0.206817626953125, -0.20050048828125, -0.194183349609375, -0.1878662109375, -0.181549072265625, -0.17523193359375, -0.168914794921875, -0.16259765625, -0.156280517578125, -0.14996337890625, -0.143646240234375, -0.1373291015625, -0.131011962890625, -0.12469482421875, -0.118377685546875, -0.112060546875, -0.105743408203125, -0.09942626953125, -0.093109130859375, -0.0867919921875, -0.080474853515625, -0.07415771484375, -0.067840576171875, -0.0615234375, -0.055206298828125, -0.04888916015625, -0.042572021484375, -0.0362548828125, -0.029937744140625, -0.02362060546875, -0.017303466796875, -0.010986328125, -0.004669189453125, 0.00164794921875, 0.007965087890625, 0.0142822265625, 0.020599365234375, 0.02691650390625, 0.033233642578125, 0.03955078125, 0.045867919921875, 0.05218505859375, 0.058502197265625, 0.0648193359375, 0.071136474609375, 0.07745361328125, 0.083770751953125, 0.090087890625, 0.096405029296875, 0.10272216796875, 0.109039306640625, 0.1153564453125, 0.121673583984375, 0.12799072265625, 0.134307861328125, 0.140625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 6.0, 10.0, 13.0, 22.0, 30.0, 48.0, 46.0, 66.0, 87.0, 127.0, 211.0, 338.0, 479.0, 847.0, 1450.0, 2730.0, 5642.0, 12416.0, 29143.0, 73498.0, 180339.0, 318532.0, 242172.0, 105528.0, 41886.0, 17153.0, 7565.0, 3535.0, 1914.0, 1012.0, 618.0, 367.0, 203.0, 152.0, 108.0, 71.0, 56.0, 38.0, 23.0, 23.0, 18.0, 7.0, 9.0, 4.0, 2.0, 5.0, 7.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5341796875, -0.5167770385742188, -0.4993743896484375, -0.48197174072265625, -0.464569091796875, -0.44716644287109375, -0.4297637939453125, -0.41236114501953125, -0.39495849609375, -0.37755584716796875, -0.3601531982421875, -0.34275054931640625, -0.325347900390625, -0.30794525146484375, -0.2905426025390625, -0.27313995361328125, -0.2557373046875, -0.23833465576171875, -0.2209320068359375, -0.20352935791015625, -0.186126708984375, -0.16872406005859375, -0.1513214111328125, -0.13391876220703125, -0.11651611328125, -0.09911346435546875, -0.0817108154296875, -0.06430816650390625, -0.046905517578125, -0.02950286865234375, -0.0121002197265625, 0.00530242919921875, 0.022705078125, 0.04010772705078125, 0.0575103759765625, 0.07491302490234375, 0.092315673828125, 0.10971832275390625, 0.1271209716796875, 0.14452362060546875, 0.16192626953125, 0.17932891845703125, 0.1967315673828125, 0.21413421630859375, 0.231536865234375, 0.24893951416015625, 0.2663421630859375, 0.28374481201171875, 0.3011474609375, 0.31855010986328125, 0.3359527587890625, 0.35335540771484375, 0.370758056640625, 0.38816070556640625, 0.4055633544921875, 0.42296600341796875, 0.44036865234375, 0.45777130126953125, 0.4751739501953125, 0.49257659912109375, 0.509979248046875, 0.5273818969726562, 0.5447845458984375, 0.5621871948242188, 0.57958984375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 6.0, 3.0, 4.0, 4.0, 14.0, 7.0, 7.0, 11.0, 17.0, 13.0, 16.0, 15.0, 10.0, 18.0, 30.0, 15.0, 32.0, 31.0, 31.0, 26.0, 31.0, 47.0, 33.0, 30.0, 41.0, 35.0, 47.0, 43.0, 40.0, 45.0, 30.0, 28.0, 30.0, 24.0, 28.0, 26.0, 17.0, 21.0, 14.0, 14.0, 12.0, 15.0, 9.0, 6.0, 9.0, 1.0, 3.0, 7.0, 5.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.3818359375, -0.3686256408691406, -0.35541534423828125, -0.3422050476074219, -0.3289947509765625, -0.3157844543457031, -0.30257415771484375, -0.2893638610839844, -0.276153564453125, -0.2629432678222656, -0.24973297119140625, -0.23652267456054688, -0.2233123779296875, -0.21010208129882812, -0.19689178466796875, -0.18368148803710938, -0.17047119140625, -0.15726089477539062, -0.14405059814453125, -0.13084030151367188, -0.1176300048828125, -0.10441970825195312, -0.09120941162109375, -0.07799911499023438, -0.064788818359375, -0.051578521728515625, -0.03836822509765625, -0.025157928466796875, -0.0119476318359375, 0.001262664794921875, 0.01447296142578125, 0.027683258056640625, 0.0408935546875, 0.054103851318359375, 0.06731414794921875, 0.08052444458007812, 0.0937347412109375, 0.10694503784179688, 0.12015533447265625, 0.13336563110351562, 0.146575927734375, 0.15978622436523438, 0.17299652099609375, 0.18620681762695312, 0.1994171142578125, 0.21262741088867188, 0.22583770751953125, 0.23904800415039062, 0.25225830078125, 0.2654685974121094, 0.27867889404296875, 0.2918891906738281, 0.3050994873046875, 0.3183097839355469, 0.33152008056640625, 0.3447303771972656, 0.357940673828125, 0.3711509704589844, 0.38436126708984375, 0.3975715637207031, 0.4107818603515625, 0.4239921569824219, 0.43720245361328125, 0.4504127502441406, 0.463623046875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 7.0, 15.0, 16.0, 23.0, 34.0, 42.0, 71.0, 138.0, 295.0, 566.0, 1337.0, 3501.0, 12289.0, 67805.0, 414828.0, 450923.0, 76472.0, 13627.0, 3870.0, 1367.0, 654.0, 301.0, 168.0, 83.0, 42.0, 19.0, 21.0, 13.0, 3.0, 6.0, 5.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.447998046875, -0.4325675964355469, -0.41713714599609375, -0.4017066955566406, -0.3862762451171875, -0.3708457946777344, -0.35541534423828125, -0.3399848937988281, -0.324554443359375, -0.3091239929199219, -0.29369354248046875, -0.2782630920410156, -0.2628326416015625, -0.24740219116210938, -0.23197174072265625, -0.21654129028320312, -0.20111083984375, -0.18568038940429688, -0.17024993896484375, -0.15481948852539062, -0.1393890380859375, -0.12395858764648438, -0.10852813720703125, -0.09309768676757812, -0.077667236328125, -0.062236785888671875, -0.04680633544921875, -0.031375885009765625, -0.0159454345703125, -0.000514984130859375, 0.01491546630859375, 0.030345916748046875, 0.0457763671875, 0.061206817626953125, 0.07663726806640625, 0.09206771850585938, 0.1074981689453125, 0.12292861938476562, 0.13835906982421875, 0.15378952026367188, 0.169219970703125, 0.18465042114257812, 0.20008087158203125, 0.21551132202148438, 0.2309417724609375, 0.24637222290039062, 0.26180267333984375, 0.2772331237792969, 0.29266357421875, 0.3080940246582031, 0.32352447509765625, 0.3389549255371094, 0.3543853759765625, 0.3698158264160156, 0.38524627685546875, 0.4006767272949219, 0.416107177734375, 0.4315376281738281, 0.44696807861328125, 0.4623985290527344, 0.4778289794921875, 0.4932594299316406, 0.5086898803710938, 0.5241203308105469, 0.53955078125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 3.0, 4.0, 6.0, 5.0, 5.0, 6.0, 10.0, 11.0, 23.0, 32.0, 35.0, 59.0, 74.0, 83.0, 102.0, 91.0, 105.0, 84.0, 70.0, 56.0, 35.0, 27.0, 19.0, 11.0, 12.0, 14.0, 4.0, 2.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.876489639282227e-05, -9.57949087023735e-05, -9.282492101192474e-05, -8.985493332147598e-05, -8.688494563102722e-05, -8.391495794057846e-05, -8.09449702501297e-05, -7.797498255968094e-05, -7.500499486923218e-05, -7.203500717878342e-05, -6.906501948833466e-05, -6.60950317978859e-05, -6.312504410743713e-05, -6.015505641698837e-05, -5.718506872653961e-05, -5.421508103609085e-05, -5.124509334564209e-05, -4.827510565519333e-05, -4.530511796474457e-05, -4.233513027429581e-05, -3.9365142583847046e-05, -3.6395154893398285e-05, -3.3425167202949524e-05, -3.0455179512500763e-05, -2.7485191822052002e-05, -2.451520413160324e-05, -2.154521644115448e-05, -1.857522875070572e-05, -1.5605241060256958e-05, -1.2635253369808197e-05, -9.665265679359436e-06, -6.695277988910675e-06, -3.725290298461914e-06, -7.553026080131531e-07, 2.214685082435608e-06, 5.184672772884369e-06, 8.15466046333313e-06, 1.1124648153781891e-05, 1.4094635844230652e-05, 1.7064623534679413e-05, 2.0034611225128174e-05, 2.3004598915576935e-05, 2.5974586606025696e-05, 2.8944574296474457e-05, 3.191456198692322e-05, 3.488454967737198e-05, 3.785453736782074e-05, 4.08245250582695e-05, 4.379451274871826e-05, 4.676450043916702e-05, 4.9734488129615784e-05, 5.2704475820064545e-05, 5.5674463510513306e-05, 5.864445120096207e-05, 6.161443889141083e-05, 6.458442658185959e-05, 6.755441427230835e-05, 7.052440196275711e-05, 7.349438965320587e-05, 7.646437734365463e-05, 7.94343650341034e-05, 8.240435272455215e-05, 8.537434041500092e-05, 8.834432810544968e-05, 9.131431579589844e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 6.0, 9.0, 11.0, 14.0, 10.0, 26.0, 35.0, 48.0, 67.0, 125.0, 171.0, 327.0, 503.0, 898.0, 1600.0, 3587.0, 8780.0, 25332.0, 88457.0, 295079.0, 401113.0, 155607.0, 42930.0, 13548.0, 5245.0, 2243.0, 1176.0, 626.0, 359.0, 190.0, 144.0, 94.0, 63.0, 43.0, 32.0, 15.0, 13.0, 10.0, 5.0, 7.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.323486328125, -0.31479454040527344, -0.3061027526855469, -0.2974109649658203, -0.28871917724609375, -0.2800273895263672, -0.2713356018066406, -0.26264381408691406, -0.2539520263671875, -0.24526023864746094, -0.23656845092773438, -0.2278766632080078, -0.21918487548828125, -0.2104930877685547, -0.20180130004882812, -0.19310951232910156, -0.184417724609375, -0.17572593688964844, -0.16703414916992188, -0.1583423614501953, -0.14965057373046875, -0.1409587860107422, -0.13226699829101562, -0.12357521057128906, -0.1148834228515625, -0.10619163513183594, -0.09749984741210938, -0.08880805969238281, -0.08011627197265625, -0.07142448425292969, -0.06273269653320312, -0.05404090881347656, -0.04534912109375, -0.03665733337402344, -0.027965545654296875, -0.019273757934570312, -0.01058197021484375, -0.0018901824951171875, 0.006801605224609375, 0.015493392944335938, 0.0241851806640625, 0.03287696838378906, 0.041568756103515625, 0.05026054382324219, 0.05895233154296875, 0.06764411926269531, 0.07633590698242188, 0.08502769470214844, 0.093719482421875, 0.10241127014160156, 0.11110305786132812, 0.11979484558105469, 0.12848663330078125, 0.1371784210205078, 0.14587020874023438, 0.15456199645996094, 0.1632537841796875, 0.17194557189941406, 0.18063735961914062, 0.1893291473388672, 0.19802093505859375, 0.2067127227783203, 0.21540451049804688, 0.22409629821777344, 0.2327880859375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 1.0, 3.0, 5.0, 7.0, 9.0, 11.0, 12.0, 11.0, 14.0, 29.0, 34.0, 39.0, 55.0, 55.0, 80.0, 66.0, 46.0, 62.0, 76.0, 55.0, 57.0, 58.0, 48.0, 34.0, 32.0, 22.0, 14.0, 14.0, 10.0, 9.0, 9.0, 8.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.219482421875, -0.2124652862548828, -0.20544815063476562, -0.19843101501464844, -0.19141387939453125, -0.18439674377441406, -0.17737960815429688, -0.1703624725341797, -0.1633453369140625, -0.1563282012939453, -0.14931106567382812, -0.14229393005371094, -0.13527679443359375, -0.12825965881347656, -0.12124252319335938, -0.11422538757324219, -0.107208251953125, -0.10019111633300781, -0.09317398071289062, -0.08615684509277344, -0.07913970947265625, -0.07212257385253906, -0.06510543823242188, -0.05808830261230469, -0.0510711669921875, -0.04405403137207031, -0.037036895751953125, -0.030019760131835938, -0.02300262451171875, -0.015985488891601562, -0.008968353271484375, -0.0019512176513671875, 0.00506591796875, 0.012083053588867188, 0.019100189208984375, 0.026117324829101562, 0.03313446044921875, 0.04015159606933594, 0.047168731689453125, 0.05418586730957031, 0.0612030029296875, 0.06822013854980469, 0.07523727416992188, 0.08225440979003906, 0.08927154541015625, 0.09628868103027344, 0.10330581665039062, 0.11032295227050781, 0.117340087890625, 0.12435722351074219, 0.13137435913085938, 0.13839149475097656, 0.14540863037109375, 0.15242576599121094, 0.15944290161132812, 0.1664600372314453, 0.1734771728515625, 0.1804943084716797, 0.18751144409179688, 0.19452857971191406, 0.20154571533203125, 0.20856285095214844, 0.21557998657226562, 0.2225971221923828, 0.2296142578125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 11.0, 40.0, 150.0, 298.0, 309.0, 134.0, 41.0, 12.0, 6.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.177391052246094, -9.752223014831543, -9.327054023742676, -8.901885986328125, -8.476716995239258, -8.051548957824707, -7.626380920410156, -7.201212406158447, -6.776043891906738, -6.350875377655029, -5.92570686340332, -5.5005388259887695, -5.0753703117370605, -4.650201797485352, -4.225033760070801, -3.799865245819092, -3.374696731567383, -2.949528217315674, -2.524359941482544, -2.099191665649414, -1.674023151397705, -1.248854637145996, -0.8236863613128662, -0.39851808547973633, 0.026650428771972656, 0.4518188238143921, 0.8769872188568115, 1.302155613899231, 1.7273240089416504, 2.1524925231933594, 2.5776607990264893, 3.002829074859619, 3.427997589111328, 3.853166103363037, 4.278334617614746, 4.703502655029297, 5.128671169281006, 5.553839683532715, 5.979007720947266, 6.404176235198975, 6.829344749450684, 7.254513263702393, 7.679681777954102, 8.104849815368652, 8.530017852783203, 8.95518684387207, 9.380354881286621, 9.805522918701172, 10.230691909790039, 10.65585994720459, 11.081028938293457, 11.506196975708008, 11.931365966796875, 12.356534004211426, 12.781702041625977, 13.206871032714844, 13.632039070129395, 14.057207107543945, 14.482376098632812, 14.907544136047363, 15.332712173461914, 15.757881164550781, 16.18305015563965, 16.608217239379883, 17.03338623046875]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 1.0, 3.0, 0.0, 6.0, 6.0, 4.0, 7.0, 10.0, 14.0, 16.0, 25.0, 17.0, 28.0, 31.0, 31.0, 37.0, 33.0, 36.0, 36.0, 47.0, 57.0, 48.0, 49.0, 54.0, 43.0, 42.0, 36.0, 27.0, 27.0, 36.0, 30.0, 34.0, 17.0, 31.0, 13.0, 18.0, 13.0, 12.0, 6.0, 3.0, 3.0, 2.0, 4.0, 4.0, 3.0, 4.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-3.4539852142333984, -3.3572051525115967, -3.260425090789795, -3.1636452674865723, -3.0668652057647705, -2.9700851440429688, -2.873305082321167, -2.7765250205993652, -2.6797451972961426, -2.582965135574341, -2.486185073852539, -2.3894052505493164, -2.2926251888275146, -2.195845127105713, -2.099065065383911, -2.0022850036621094, -1.9055050611495972, -1.8087249994277954, -1.7119450569152832, -1.6151649951934814, -1.5183850526809692, -1.4216049909591675, -1.3248250484466553, -1.2280449867248535, -1.1312649250030518, -1.03448486328125, -0.9377049207687378, -0.840924859046936, -0.7441449165344238, -0.6473648548126221, -0.5505848526954651, -0.4538048505783081, -0.3570249080657959, -0.2602449059486389, -0.16346488893032074, -0.06668487191200256, 0.03009513020515442, 0.1268751323223114, 0.22365516424179077, 0.32043516635894775, 0.41721516847610474, 0.5139951705932617, 0.6107751727104187, 0.7075551748275757, 0.8043352365493774, 0.9011151790618896, 0.9978952407836914, 1.0946753025054932, 1.1914552450180054, 1.2882353067398071, 1.3850152492523193, 1.481795310974121, 1.5785752534866333, 1.675355315208435, 1.7721352577209473, 1.868915319442749, 1.9656953811645508, 2.0624754428863525, 2.1592555046081543, 2.256035327911377, 2.3528153896331787, 2.4495954513549805, 2.5463755130767822, 2.643155574798584, 2.7399353981018066]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 3.0, 3.0, 3.0, 7.0, 8.0, 16.0, 11.0, 17.0, 13.0, 37.0, 27.0, 46.0, 55.0, 100.0, 141.0, 244.0, 517.0, 1334.0, 5396.0, 48937.0, 3988995.0, 134443.0, 10142.0, 2020.0, 762.0, 371.0, 204.0, 136.0, 88.0, 57.0, 44.0, 35.0, 19.0, 12.0, 7.0, 12.0, 7.0, 8.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.181640625, -3.099334716796875, -3.01702880859375, -2.934722900390625, -2.8524169921875, -2.770111083984375, -2.68780517578125, -2.605499267578125, -2.523193359375, -2.440887451171875, -2.35858154296875, -2.276275634765625, -2.1939697265625, -2.111663818359375, -2.02935791015625, -1.947052001953125, -1.86474609375, -1.782440185546875, -1.70013427734375, -1.617828369140625, -1.5355224609375, -1.453216552734375, -1.37091064453125, -1.288604736328125, -1.206298828125, -1.123992919921875, -1.04168701171875, -0.959381103515625, -0.8770751953125, -0.794769287109375, -0.71246337890625, -0.630157470703125, -0.5478515625, -0.465545654296875, -0.38323974609375, -0.300933837890625, -0.2186279296875, -0.136322021484375, -0.05401611328125, 0.028289794921875, 0.110595703125, 0.192901611328125, 0.27520751953125, 0.357513427734375, 0.4398193359375, 0.522125244140625, 0.60443115234375, 0.686737060546875, 0.76904296875, 0.851348876953125, 0.93365478515625, 1.015960693359375, 1.0982666015625, 1.180572509765625, 1.26287841796875, 1.345184326171875, 1.427490234375, 1.509796142578125, 1.59210205078125, 1.674407958984375, 1.7567138671875, 1.839019775390625, 1.92132568359375, 2.003631591796875, 2.0859375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 9.0, 13.0, 17.0, 25.0, 21.0, 49.0, 40.0, 64.0, 72.0, 80.0, 76.0, 84.0, 83.0, 64.0, 59.0, 56.0, 44.0, 35.0, 29.0, 30.0, 14.0, 11.0, 10.0, 3.0, 7.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2418212890625, -0.23584556579589844, -0.22986984252929688, -0.2238941192626953, -0.21791839599609375, -0.2119426727294922, -0.20596694946289062, -0.19999122619628906, -0.1940155029296875, -0.18803977966308594, -0.18206405639648438, -0.1760883331298828, -0.17011260986328125, -0.1641368865966797, -0.15816116333007812, -0.15218544006347656, -0.146209716796875, -0.14023399353027344, -0.13425827026367188, -0.1282825469970703, -0.12230682373046875, -0.11633110046386719, -0.11035537719726562, -0.10437965393066406, -0.0984039306640625, -0.09242820739746094, -0.08645248413085938, -0.08047676086425781, -0.07450103759765625, -0.06852531433105469, -0.06254959106445312, -0.05657386779785156, -0.05059814453125, -0.04462242126464844, -0.038646697998046875, -0.03267097473144531, -0.02669525146484375, -0.020719528198242188, -0.014743804931640625, -0.008768081665039062, -0.0027923583984375, 0.0031833648681640625, 0.009159088134765625, 0.015134811401367188, 0.02111053466796875, 0.027086257934570312, 0.033061981201171875, 0.03903770446777344, 0.045013427734375, 0.05098915100097656, 0.056964874267578125, 0.06294059753417969, 0.06891632080078125, 0.07489204406738281, 0.08086776733398438, 0.08684349060058594, 0.0928192138671875, 0.09879493713378906, 0.10477066040039062, 0.11074638366699219, 0.11672210693359375, 0.12269783020019531, 0.12867355346679688, 0.13464927673339844, 0.140625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 6.0, 11.0, 7.0, 8.0, 16.0, 18.0, 20.0, 26.0, 39.0, 61.0, 53.0, 78.0, 190.0, 8687.0, 4182926.0, 1606.0, 135.0, 77.0, 68.0, 50.0, 42.0, 38.0, 27.0, 22.0, 12.0, 15.0, 16.0, 11.0, 6.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.359375, -11.07080078125, -10.7822265625, -10.49365234375, -10.205078125, -9.91650390625, -9.6279296875, -9.33935546875, -9.05078125, -8.76220703125, -8.4736328125, -8.18505859375, -7.896484375, -7.60791015625, -7.3193359375, -7.03076171875, -6.7421875, -6.45361328125, -6.1650390625, -5.87646484375, -5.587890625, -5.29931640625, -5.0107421875, -4.72216796875, -4.43359375, -4.14501953125, -3.8564453125, -3.56787109375, -3.279296875, -2.99072265625, -2.7021484375, -2.41357421875, -2.125, -1.83642578125, -1.5478515625, -1.25927734375, -0.970703125, -0.68212890625, -0.3935546875, -0.10498046875, 0.18359375, 0.47216796875, 0.7607421875, 1.04931640625, 1.337890625, 1.62646484375, 1.9150390625, 2.20361328125, 2.4921875, 2.78076171875, 3.0693359375, 3.35791015625, 3.646484375, 3.93505859375, 4.2236328125, 4.51220703125, 4.80078125, 5.08935546875, 5.3779296875, 5.66650390625, 5.955078125, 6.24365234375, 6.5322265625, 6.82080078125, 7.109375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 6.0, 55.0, 413.0, 3344.0, 219.0, 39.0, 13.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.312744140625, -0.2545433044433594, -0.19634246826171875, -0.13814163208007812, -0.0799407958984375, -0.021739959716796875, 0.03646087646484375, 0.09466171264648438, 0.152862548828125, 0.21106338500976562, 0.26926422119140625, 0.3274650573730469, 0.3856658935546875, 0.4438667297363281, 0.5020675659179688, 0.5602684020996094, 0.61846923828125, 0.6766700744628906, 0.7348709106445312, 0.7930717468261719, 0.8512725830078125, 0.9094734191894531, 0.9676742553710938, 1.0258750915527344, 1.084075927734375, 1.1422767639160156, 1.2004776000976562, 1.2586784362792969, 1.3168792724609375, 1.3750801086425781, 1.4332809448242188, 1.4914817810058594, 1.5496826171875, 1.6078834533691406, 1.6660842895507812, 1.7242851257324219, 1.7824859619140625, 1.8406867980957031, 1.8988876342773438, 1.9570884704589844, 2.015289306640625, 2.0734901428222656, 2.1316909790039062, 2.189891815185547, 2.2480926513671875, 2.306293487548828, 2.3644943237304688, 2.4226951599121094, 2.48089599609375, 2.5390968322753906, 2.5972976684570312, 2.655498504638672, 2.7136993408203125, 2.771900177001953, 2.8301010131835938, 2.8883018493652344, 2.946502685546875, 3.0047035217285156, 3.0629043579101562, 3.121105194091797, 3.1793060302734375, 3.237506866455078, 3.2957077026367188, 3.3539085388183594, 3.412109375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 15.0, 418.0, 564.0, 14.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.514610290527344, -22.494400024414062, -21.47418785095215, -20.453975677490234, -19.433765411376953, -18.413555145263672, -17.393342971801758, -16.373130798339844, -15.352920532226562, -14.332709312438965, -13.312498092651367, -12.29228687286377, -11.272075653076172, -10.251864433288574, -9.231653213500977, -8.211441993713379, -7.191230773925781, -6.171019554138184, -5.150808334350586, -4.130597114562988, -3.1103858947753906, -2.090174674987793, -1.0699634552001953, -0.049752235412597656, 0.970458984375, 1.9906702041625977, 3.0108814239501953, 4.031092643737793, 5.051303863525391, 6.071515083312988, 7.091726303100586, 8.111937522888184, 9.132148742675781, 10.152359962463379, 11.172571182250977, 12.192782402038574, 13.212993621826172, 14.23320484161377, 15.253416061401367, 16.27362823486328, 17.293838500976562, 18.314048767089844, 19.334260940551758, 20.354473114013672, 21.374683380126953, 22.394893646240234, 23.41510581970215, 24.435317993164062, 25.455528259277344, 26.475738525390625, 27.49595069885254, 28.516162872314453, 29.536373138427734, 30.556583404541016, 31.57679557800293, 32.597007751464844, 33.617218017578125, 34.637428283691406, 35.65763854980469, 36.677852630615234, 37.698062896728516, 38.7182731628418, 39.738487243652344, 40.758697509765625, 41.778907775878906]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 28.0, 102.0, 163.0, 247.0, 222.0, 147.0, 56.0, 23.0, 8.0, 7.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.795660972595215, -7.550102233886719, -7.304543972015381, -7.058985233306885, -6.813426494598389, -6.567868232727051, -6.322309494018555, -6.076750755310059, -5.8311920166015625, -5.585633277893066, -5.3400750160217285, -5.094516277313232, -4.848957538604736, -4.603399276733398, -4.357840538024902, -4.112281799316406, -3.8667232990264893, -3.6211647987365723, -3.375606060028076, -3.130047559738159, -2.884488821029663, -2.638930320739746, -2.39337158203125, -2.147813081741333, -1.9022544622421265, -1.65669584274292, -1.4111372232437134, -1.1655786037445068, -0.9200200438499451, -0.6744614839553833, -0.42890286445617676, -0.18334424495697021, 0.06221437454223633, 0.30777299404144287, 0.5533316135406494, 0.7988901734352112, 1.0444488525390625, 1.2900073528289795, 1.535565972328186, 1.7811245918273926, 2.0266833305358887, 2.2722418308258057, 2.5178005695343018, 2.7633590698242188, 3.008917808532715, 3.254476308822632, 3.500034809112549, 3.745593547821045, 3.991152048110962, 4.236710548400879, 4.482269287109375, 4.727828025817871, 4.973386287689209, 5.218945026397705, 5.464503765106201, 5.710062026977539, 5.955620765686035, 6.201179504394531, 6.446737766265869, 6.692296504974365, 6.937855243682861, 7.183413505554199, 7.428972244262695, 7.674530982971191, 7.9200897216796875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 5.0, 3.0, 3.0, 10.0, 5.0, 11.0, 11.0, 17.0, 22.0, 25.0, 30.0, 58.0, 52.0, 88.0, 114.0, 146.0, 193.0, 320.0, 437.0, 748.0, 1647.0, 4071.0, 14459.0, 71888.0, 383818.0, 452045.0, 91667.0, 17609.0, 4785.0, 1754.0, 868.0, 501.0, 295.0, 220.0, 161.0, 106.0, 86.0, 62.0, 55.0, 31.0, 32.0, 24.0, 18.0, 22.0, 11.0, 12.0, 5.0, 5.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.369140625, -1.326446533203125, -1.28375244140625, -1.241058349609375, -1.1983642578125, -1.155670166015625, -1.11297607421875, -1.070281982421875, -1.027587890625, -0.984893798828125, -0.94219970703125, -0.899505615234375, -0.8568115234375, -0.814117431640625, -0.77142333984375, -0.728729248046875, -0.68603515625, -0.643341064453125, -0.60064697265625, -0.557952880859375, -0.5152587890625, -0.472564697265625, -0.42987060546875, -0.387176513671875, -0.344482421875, -0.301788330078125, -0.25909423828125, -0.216400146484375, -0.1737060546875, -0.131011962890625, -0.08831787109375, -0.045623779296875, -0.0029296875, 0.039764404296875, 0.08245849609375, 0.125152587890625, 0.1678466796875, 0.210540771484375, 0.25323486328125, 0.295928955078125, 0.338623046875, 0.381317138671875, 0.42401123046875, 0.466705322265625, 0.5093994140625, 0.552093505859375, 0.59478759765625, 0.637481689453125, 0.68017578125, 0.722869873046875, 0.76556396484375, 0.808258056640625, 0.8509521484375, 0.893646240234375, 0.93634033203125, 0.979034423828125, 1.021728515625, 1.064422607421875, 1.10711669921875, 1.149810791015625, 1.1925048828125, 1.235198974609375, 1.27789306640625, 1.320587158203125, 1.36328125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 9.0, 26.0, 33.0, 56.0, 74.0, 112.0, 127.0, 132.0, 99.0, 106.0, 70.0, 59.0, 31.0, 31.0, 13.0, 14.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23095703125, -0.22116851806640625, -0.2113800048828125, -0.20159149169921875, -0.191802978515625, -0.18201446533203125, -0.1722259521484375, -0.16243743896484375, -0.15264892578125, -0.14286041259765625, -0.1330718994140625, -0.12328338623046875, -0.113494873046875, -0.10370635986328125, -0.0939178466796875, -0.08412933349609375, -0.0743408203125, -0.06455230712890625, -0.0547637939453125, -0.04497528076171875, -0.035186767578125, -0.02539825439453125, -0.0156097412109375, -0.00582122802734375, 0.00396728515625, 0.01375579833984375, 0.0235443115234375, 0.03333282470703125, 0.043121337890625, 0.05290985107421875, 0.0626983642578125, 0.07248687744140625, 0.082275390625, 0.09206390380859375, 0.1018524169921875, 0.11164093017578125, 0.121429443359375, 0.13121795654296875, 0.1410064697265625, 0.15079498291015625, 0.16058349609375, 0.17037200927734375, 0.1801605224609375, 0.18994903564453125, 0.199737548828125, 0.20952606201171875, 0.2193145751953125, 0.22910308837890625, 0.2388916015625, 0.24868011474609375, 0.2584686279296875, 0.26825714111328125, 0.278045654296875, 0.28783416748046875, 0.2976226806640625, 0.30741119384765625, 0.31719970703125, 0.32698822021484375, 0.3367767333984375, 0.34656524658203125, 0.356353759765625, 0.36614227294921875, 0.3759307861328125, 0.38571929931640625, 0.3955078125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 5.0, 5.0, 4.0, 8.0, 12.0, 16.0, 22.0, 38.0, 34.0, 63.0, 87.0, 121.0, 203.0, 331.0, 561.0, 1111.0, 2135.0, 4593.0, 10903.0, 27920.0, 76585.0, 200099.0, 350379.0, 227734.0, 89768.0, 32946.0, 12473.0, 5090.0, 2394.0, 1147.0, 640.0, 396.0, 253.0, 159.0, 94.0, 65.0, 58.0, 27.0, 21.0, 23.0, 7.0, 11.0, 4.0, 6.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.548828125, -0.5302734375, -0.51171875, -0.4931640625, -0.474609375, -0.4560546875, -0.4375, -0.4189453125, -0.400390625, -0.3818359375, -0.36328125, -0.3447265625, -0.326171875, -0.3076171875, -0.2890625, -0.2705078125, -0.251953125, -0.2333984375, -0.21484375, -0.1962890625, -0.177734375, -0.1591796875, -0.140625, -0.1220703125, -0.103515625, -0.0849609375, -0.06640625, -0.0478515625, -0.029296875, -0.0107421875, 0.0078125, 0.0263671875, 0.044921875, 0.0634765625, 0.08203125, 0.1005859375, 0.119140625, 0.1376953125, 0.15625, 0.1748046875, 0.193359375, 0.2119140625, 0.23046875, 0.2490234375, 0.267578125, 0.2861328125, 0.3046875, 0.3232421875, 0.341796875, 0.3603515625, 0.37890625, 0.3974609375, 0.416015625, 0.4345703125, 0.453125, 0.4716796875, 0.490234375, 0.5087890625, 0.52734375, 0.5458984375, 0.564453125, 0.5830078125, 0.6015625, 0.6201171875, 0.638671875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 4.0, 5.0, 14.0, 10.0, 16.0, 9.0, 17.0, 19.0, 31.0, 20.0, 30.0, 33.0, 48.0, 45.0, 52.0, 41.0, 49.0, 47.0, 51.0, 60.0, 36.0, 46.0, 47.0, 41.0, 28.0, 32.0, 30.0, 32.0, 22.0, 13.0, 12.0, 15.0, 13.0, 6.0, 10.0, 6.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.525390625, -0.5058746337890625, -0.486358642578125, -0.4668426513671875, -0.44732666015625, -0.4278106689453125, -0.408294677734375, -0.3887786865234375, -0.3692626953125, -0.3497467041015625, -0.330230712890625, -0.3107147216796875, -0.29119873046875, -0.2716827392578125, -0.252166748046875, -0.2326507568359375, -0.213134765625, -0.1936187744140625, -0.174102783203125, -0.1545867919921875, -0.13507080078125, -0.1155548095703125, -0.096038818359375, -0.0765228271484375, -0.0570068359375, -0.0374908447265625, -0.017974853515625, 0.0015411376953125, 0.02105712890625, 0.0405731201171875, 0.060089111328125, 0.0796051025390625, 0.09912109375, 0.1186370849609375, 0.138153076171875, 0.1576690673828125, 0.17718505859375, 0.1967010498046875, 0.216217041015625, 0.2357330322265625, 0.2552490234375, 0.2747650146484375, 0.294281005859375, 0.3137969970703125, 0.33331298828125, 0.3528289794921875, 0.372344970703125, 0.3918609619140625, 0.411376953125, 0.4308929443359375, 0.450408935546875, 0.4699249267578125, 0.48944091796875, 0.5089569091796875, 0.528472900390625, 0.5479888916015625, 0.5675048828125, 0.5870208740234375, 0.606536865234375, 0.6260528564453125, 0.64556884765625, 0.6650848388671875, 0.684600830078125, 0.7041168212890625, 0.7236328125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 7.0, 7.0, 6.0, 13.0, 31.0, 38.0, 62.0, 93.0, 137.0, 288.0, 431.0, 865.0, 1833.0, 4804.0, 22762.0, 284584.0, 654974.0, 63633.0, 8678.0, 2678.0, 1164.0, 598.0, 320.0, 205.0, 116.0, 78.0, 51.0, 27.0, 20.0, 14.0, 9.0, 10.0, 3.0, 2.0, 2.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67236328125, -0.6527175903320312, -0.6330718994140625, -0.6134262084960938, -0.593780517578125, -0.5741348266601562, -0.5544891357421875, -0.5348434448242188, -0.51519775390625, -0.49555206298828125, -0.4759063720703125, -0.45626068115234375, -0.436614990234375, -0.41696929931640625, -0.3973236083984375, -0.37767791748046875, -0.3580322265625, -0.33838653564453125, -0.3187408447265625, -0.29909515380859375, -0.279449462890625, -0.25980377197265625, -0.2401580810546875, -0.22051239013671875, -0.20086669921875, -0.18122100830078125, -0.1615753173828125, -0.14192962646484375, -0.122283935546875, -0.10263824462890625, -0.0829925537109375, -0.06334686279296875, -0.043701171875, -0.02405548095703125, -0.0044097900390625, 0.01523590087890625, 0.034881591796875, 0.05452728271484375, 0.0741729736328125, 0.09381866455078125, 0.11346435546875, 0.13311004638671875, 0.1527557373046875, 0.17240142822265625, 0.192047119140625, 0.21169281005859375, 0.2313385009765625, 0.25098419189453125, 0.2706298828125, 0.29027557373046875, 0.3099212646484375, 0.32956695556640625, 0.349212646484375, 0.36885833740234375, 0.3885040283203125, 0.40814971923828125, 0.42779541015625, 0.44744110107421875, 0.4670867919921875, 0.48673248291015625, 0.506378173828125, 0.5260238647460938, 0.5456695556640625, 0.5653152465820312, 0.5849609375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 7.0, 4.0, 7.0, 9.0, 12.0, 33.0, 54.0, 91.0, 126.0, 166.0, 166.0, 134.0, 74.0, 48.0, 26.0, 22.0, 9.0, 8.0, 3.0, 5.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011342763900756836, -0.00010887999087572098, -0.0001043323427438736, -9.978469461202621e-05, -9.523704648017883e-05, -9.068939834833145e-05, -8.614175021648407e-05, -8.159410208463669e-05, -7.70464539527893e-05, -7.249880582094193e-05, -6.795115768909454e-05, -6.340350955724716e-05, -5.885586142539978e-05, -5.43082132935524e-05, -4.976056516170502e-05, -4.5212917029857635e-05, -4.0665268898010254e-05, -3.611762076616287e-05, -3.156997263431549e-05, -2.702232450246811e-05, -2.2474676370620728e-05, -1.7927028238773346e-05, -1.3379380106925964e-05, -8.831731975078583e-06, -4.284083843231201e-06, 2.635642886161804e-07, 4.811212420463562e-06, 9.358860552310944e-06, 1.3906508684158325e-05, 1.8454156816005707e-05, 2.300180494785309e-05, 2.754945307970047e-05, 3.209710121154785e-05, 3.664474934339523e-05, 4.1192397475242615e-05, 4.5740045607089996e-05, 5.028769373893738e-05, 5.483534187078476e-05, 5.938299000263214e-05, 6.393063813447952e-05, 6.84782862663269e-05, 7.302593439817429e-05, 7.757358253002167e-05, 8.212123066186905e-05, 8.666887879371643e-05, 9.121652692556381e-05, 9.57641750574112e-05, 0.00010031182318925858, 0.00010485947132110596, 0.00010940711945295334, 0.00011395476758480072, 0.0001185024157166481, 0.00012305006384849548, 0.00012759771198034286, 0.00013214536011219025, 0.00013669300824403763, 0.000141240656375885, 0.0001457883045077324, 0.00015033595263957977, 0.00015488360077142715, 0.00015943124890327454, 0.00016397889703512192, 0.0001685265451669693, 0.00017307419329881668, 0.00017762184143066406]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 8.0, 2.0, 12.0, 15.0, 18.0, 36.0, 50.0, 72.0, 127.0, 212.0, 367.0, 764.0, 1809.0, 4990.0, 19790.0, 138384.0, 632434.0, 211140.0, 27991.0, 6220.0, 2187.0, 881.0, 464.0, 207.0, 122.0, 84.0, 55.0, 35.0, 23.0, 10.0, 15.0, 12.0, 3.0, 5.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.48779296875, -0.47369384765625, -0.4595947265625, -0.44549560546875, -0.431396484375, -0.41729736328125, -0.4031982421875, -0.38909912109375, -0.375, -0.36090087890625, -0.3468017578125, -0.33270263671875, -0.318603515625, -0.30450439453125, -0.2904052734375, -0.27630615234375, -0.26220703125, -0.24810791015625, -0.2340087890625, -0.21990966796875, -0.205810546875, -0.19171142578125, -0.1776123046875, -0.16351318359375, -0.1494140625, -0.13531494140625, -0.1212158203125, -0.10711669921875, -0.093017578125, -0.07891845703125, -0.0648193359375, -0.05072021484375, -0.03662109375, -0.02252197265625, -0.0084228515625, 0.00567626953125, 0.019775390625, 0.03387451171875, 0.0479736328125, 0.06207275390625, 0.076171875, 0.09027099609375, 0.1043701171875, 0.11846923828125, 0.132568359375, 0.14666748046875, 0.1607666015625, 0.17486572265625, 0.18896484375, 0.20306396484375, 0.2171630859375, 0.23126220703125, 0.245361328125, 0.25946044921875, 0.2735595703125, 0.28765869140625, 0.3017578125, 0.31585693359375, 0.3299560546875, 0.34405517578125, 0.358154296875, 0.37225341796875, 0.3863525390625, 0.40045166015625, 0.41455078125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 1.0, 7.0, 13.0, 3.0, 11.0, 20.0, 35.0, 50.0, 59.0, 72.0, 76.0, 102.0, 91.0, 109.0, 82.0, 63.0, 50.0, 43.0, 41.0, 23.0, 14.0, 6.0, 8.0, 6.0, 4.0, 2.0, 2.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3896484375, -0.3786659240722656, -0.36768341064453125, -0.3567008972167969, -0.3457183837890625, -0.3347358703613281, -0.32375335693359375, -0.3127708435058594, -0.301788330078125, -0.2908058166503906, -0.27982330322265625, -0.2688407897949219, -0.2578582763671875, -0.24687576293945312, -0.23589324951171875, -0.22491073608398438, -0.21392822265625, -0.20294570922851562, -0.19196319580078125, -0.18098068237304688, -0.1699981689453125, -0.15901565551757812, -0.14803314208984375, -0.13705062866210938, -0.126068115234375, -0.11508560180664062, -0.10410308837890625, -0.09312057495117188, -0.0821380615234375, -0.07115554809570312, -0.06017303466796875, -0.049190521240234375, -0.0382080078125, -0.027225494384765625, -0.01624298095703125, -0.005260467529296875, 0.0057220458984375, 0.016704559326171875, 0.02768707275390625, 0.038669586181640625, 0.049652099609375, 0.060634613037109375, 0.07161712646484375, 0.08259963989257812, 0.0935821533203125, 0.10456466674804688, 0.11554718017578125, 0.12652969360351562, 0.13751220703125, 0.14849472045898438, 0.15947723388671875, 0.17045974731445312, 0.1814422607421875, 0.19242477416992188, 0.20340728759765625, 0.21438980102539062, 0.225372314453125, 0.23635482788085938, 0.24733734130859375, 0.2583198547363281, 0.2693023681640625, 0.2802848815917969, 0.29126739501953125, 0.3022499084472656, 0.313232421875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 6.0, 24.0, 29.0, 65.0, 132.0, 205.0, 231.0, 137.0, 80.0, 46.0, 25.0, 6.0, 6.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.12966537475586, -8.84589672088623, -8.562128067016602, -8.278360366821289, -7.99459171295166, -7.710823059082031, -7.4270548820495605, -7.14328670501709, -6.859518051147461, -6.575749397277832, -6.291981220245361, -6.008213043212891, -5.724444389343262, -5.440675735473633, -5.156907558441162, -4.873139381408691, -4.5893707275390625, -4.305602073669434, -4.021833896636963, -3.738065481185913, -3.4542970657348633, -3.1705286502838135, -2.8867602348327637, -2.602991819381714, -2.319223403930664, -2.0354549884796143, -1.7516865730285645, -1.4679181575775146, -1.1841497421264648, -0.900381326675415, -0.6166129112243652, -0.33284449577331543, -0.049076080322265625, 0.23469233512878418, 0.518460750579834, 0.8022291660308838, 1.0859975814819336, 1.3697659969329834, 1.6535344123840332, 1.937302827835083, 2.221071243286133, 2.5048396587371826, 2.7886080741882324, 3.0723764896392822, 3.356144905090332, 3.639913320541382, 3.9236817359924316, 4.207449913024902, 4.491218566894531, 4.77498722076416, 5.058755397796631, 5.342523574829102, 5.6262922286987305, 5.910060882568359, 6.19382905960083, 6.477597236633301, 6.76136589050293, 7.045134544372559, 7.328902721405029, 7.6126708984375, 7.896439552307129, 8.180208206176758, 8.46397590637207, 8.7477445602417, 9.031513214111328]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 9.0, 4.0, 5.0, 12.0, 8.0, 7.0, 8.0, 17.0, 14.0, 8.0, 27.0, 20.0, 23.0, 27.0, 21.0, 33.0, 29.0, 29.0, 43.0, 40.0, 45.0, 34.0, 43.0, 30.0, 61.0, 31.0, 40.0, 34.0, 39.0, 29.0, 21.0, 32.0, 24.0, 24.0, 22.0, 13.0, 14.0, 19.0, 18.0, 15.0, 7.0, 4.0, 8.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.2159557342529297, -3.117790460586548, -3.019625186920166, -2.9214601516723633, -2.8232948780059814, -2.7251296043395996, -2.6269643306732178, -2.528799057006836, -2.430633783340454, -2.3324685096740723, -2.2343032360076904, -2.1361379623413086, -2.037972927093506, -1.939807653427124, -1.8416423797607422, -1.7434771060943604, -1.645311951637268, -1.5471466779708862, -1.448981523513794, -1.350816249847412, -1.2526509761810303, -1.1544857025146484, -1.0563205480575562, -0.9581552743911743, -0.8599900603294373, -0.7618248462677002, -0.6636595726013184, -0.5654943585395813, -0.46732911467552185, -0.3691638708114624, -0.27099865674972534, -0.1728333830833435, -0.07466816902160645, 0.023497067391872406, 0.12166230380535126, 0.2198275327682495, 0.31799277663230896, 0.4161580204963684, 0.5143232345581055, 0.6124885082244873, 0.7106537222862244, 0.8088189363479614, 0.9069842100143433, 1.0051493644714355, 1.1033146381378174, 1.2014799118041992, 1.299645185470581, 1.397810459136963, 1.4959756135940552, 1.594140887260437, 1.6923060417175293, 1.7904713153839111, 1.888636589050293, 1.9868018627166748, 2.0849671363830566, 2.1831321716308594, 2.281297445297241, 2.379462718963623, 2.477627992630005, 2.5757932662963867, 2.6739583015441895, 2.7721235752105713, 2.870288848876953, 2.968454122543335, 3.066619396209717]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 6.0, 8.0, 17.0, 18.0, 19.0, 34.0, 58.0, 79.0, 126.0, 204.0, 313.0, 623.0, 1272.0, 3190.0, 12583.0, 84874.0, 3743744.0, 310437.0, 26970.0, 5492.0, 1867.0, 879.0, 464.0, 293.0, 197.0, 126.0, 104.0, 62.0, 49.0, 31.0, 31.0, 29.0, 23.0, 13.0, 12.0, 8.0, 6.0, 6.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3232421875, -1.2697296142578125, -1.216217041015625, -1.1627044677734375, -1.10919189453125, -1.0556793212890625, -1.002166748046875, -0.9486541748046875, -0.8951416015625, -0.8416290283203125, -0.788116455078125, -0.7346038818359375, -0.68109130859375, -0.6275787353515625, -0.574066162109375, -0.5205535888671875, -0.467041015625, -0.4135284423828125, -0.360015869140625, -0.3065032958984375, -0.25299072265625, -0.1994781494140625, -0.145965576171875, -0.0924530029296875, -0.0389404296875, 0.0145721435546875, 0.068084716796875, 0.1215972900390625, 0.17510986328125, 0.2286224365234375, 0.282135009765625, 0.3356475830078125, 0.38916015625, 0.4426727294921875, 0.496185302734375, 0.5496978759765625, 0.60321044921875, 0.6567230224609375, 0.710235595703125, 0.7637481689453125, 0.8172607421875, 0.8707733154296875, 0.924285888671875, 0.9777984619140625, 1.03131103515625, 1.0848236083984375, 1.138336181640625, 1.1918487548828125, 1.245361328125, 1.2988739013671875, 1.352386474609375, 1.4058990478515625, 1.45941162109375, 1.5129241943359375, 1.566436767578125, 1.6199493408203125, 1.6734619140625, 1.7269744873046875, 1.780487060546875, 1.8339996337890625, 1.88751220703125, 1.9410247802734375, 1.994537353515625, 2.0480499267578125, 2.1015625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 5.0, 3.0, 6.0, 13.0, 12.0, 19.0, 26.0, 46.0, 78.0, 75.0, 85.0, 90.0, 96.0, 113.0, 82.0, 66.0, 46.0, 40.0, 49.0, 15.0, 15.0, 12.0, 8.0, 4.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2257080078125, -0.21648597717285156, -0.20726394653320312, -0.1980419158935547, -0.18881988525390625, -0.1795978546142578, -0.17037582397460938, -0.16115379333496094, -0.1519317626953125, -0.14270973205566406, -0.13348770141601562, -0.12426567077636719, -0.11504364013671875, -0.10582160949707031, -0.09659957885742188, -0.08737754821777344, -0.078155517578125, -0.06893348693847656, -0.059711456298828125, -0.05048942565917969, -0.04126739501953125, -0.03204536437988281, -0.022823333740234375, -0.013601303100585938, -0.0043792724609375, 0.0048427581787109375, 0.014064788818359375, 0.023286819458007812, 0.03250885009765625, 0.04173088073730469, 0.050952911376953125, 0.06017494201660156, 0.06939697265625, 0.07861900329589844, 0.08784103393554688, 0.09706306457519531, 0.10628509521484375, 0.11550712585449219, 0.12472915649414062, 0.13395118713378906, 0.1431732177734375, 0.15239524841308594, 0.16161727905273438, 0.1708393096923828, 0.18006134033203125, 0.1892833709716797, 0.19850540161132812, 0.20772743225097656, 0.216949462890625, 0.22617149353027344, 0.23539352416992188, 0.2446155548095703, 0.25383758544921875, 0.2630596160888672, 0.2722816467285156, 0.28150367736816406, 0.2907257080078125, 0.29994773864746094, 0.3091697692871094, 0.3183917999267578, 0.32761383056640625, 0.3368358612060547, 0.3460578918457031, 0.35527992248535156, 0.364501953125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 6.0, 5.0, 9.0, 8.0, 15.0, 29.0, 31.0, 40.0, 50.0, 103.0, 185.0, 330.0, 898.0, 2385.0, 9872.0, 67014.0, 3482397.0, 588440.0, 33130.0, 6091.0, 1757.0, 714.0, 331.0, 153.0, 87.0, 57.0, 45.0, 19.0, 20.0, 17.0, 12.0, 14.0, 6.0, 8.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.9033203125, -1.8530120849609375, -1.802703857421875, -1.7523956298828125, -1.70208740234375, -1.6517791748046875, -1.601470947265625, -1.5511627197265625, -1.5008544921875, -1.4505462646484375, -1.400238037109375, -1.3499298095703125, -1.29962158203125, -1.2493133544921875, -1.199005126953125, -1.1486968994140625, -1.098388671875, -1.0480804443359375, -0.997772216796875, -0.9474639892578125, -0.89715576171875, -0.8468475341796875, -0.796539306640625, -0.7462310791015625, -0.6959228515625, -0.6456146240234375, -0.595306396484375, -0.5449981689453125, -0.49468994140625, -0.4443817138671875, -0.394073486328125, -0.3437652587890625, -0.29345703125, -0.2431488037109375, -0.192840576171875, -0.1425323486328125, -0.09222412109375, -0.0419158935546875, 0.008392333984375, 0.0587005615234375, 0.1090087890625, 0.1593170166015625, 0.209625244140625, 0.2599334716796875, 0.31024169921875, 0.3605499267578125, 0.410858154296875, 0.4611663818359375, 0.511474609375, 0.5617828369140625, 0.612091064453125, 0.6623992919921875, 0.71270751953125, 0.7630157470703125, 0.813323974609375, 0.8636322021484375, 0.9139404296875, 0.9642486572265625, 1.014556884765625, 1.0648651123046875, 1.11517333984375, 1.1654815673828125, 1.215789794921875, 1.2660980224609375, 1.31640625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 1.0, 1.0, 4.0, 0.0, 3.0, 10.0, 8.0, 11.0, 27.0, 39.0, 62.0, 121.0, 187.0, 440.0, 1454.0, 894.0, 331.0, 183.0, 87.0, 62.0, 46.0, 26.0, 21.0, 10.0, 14.0, 7.0, 9.0, 0.0, 6.0, 6.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.302734375, -0.28823089599609375, -0.2737274169921875, -0.25922393798828125, -0.244720458984375, -0.23021697998046875, -0.2157135009765625, -0.20121002197265625, -0.18670654296875, -0.17220306396484375, -0.1576995849609375, -0.14319610595703125, -0.128692626953125, -0.11418914794921875, -0.0996856689453125, -0.08518218994140625, -0.0706787109375, -0.05617523193359375, -0.0416717529296875, -0.02716827392578125, -0.012664794921875, 0.00183868408203125, 0.0163421630859375, 0.03084564208984375, 0.04534912109375, 0.05985260009765625, 0.0743560791015625, 0.08885955810546875, 0.103363037109375, 0.11786651611328125, 0.1323699951171875, 0.14687347412109375, 0.161376953125, 0.17588043212890625, 0.1903839111328125, 0.20488739013671875, 0.219390869140625, 0.23389434814453125, 0.2483978271484375, 0.26290130615234375, 0.27740478515625, 0.29190826416015625, 0.3064117431640625, 0.32091522216796875, 0.335418701171875, 0.34992218017578125, 0.3644256591796875, 0.37892913818359375, 0.3934326171875, 0.40793609619140625, 0.4224395751953125, 0.43694305419921875, 0.451446533203125, 0.46595001220703125, 0.4804534912109375, 0.49495697021484375, 0.50946044921875, 0.5239639282226562, 0.5384674072265625, 0.5529708862304688, 0.567474365234375, 0.5819778442382812, 0.5964813232421875, 0.6109848022460938, 0.62548828125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 4.0, 7.0, 6.0, 16.0, 20.0, 67.0, 114.0, 164.0, 188.0, 156.0, 96.0, 68.0, 44.0, 12.0, 10.0, 9.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.503411293029785, -3.3913064002990723, -3.2792015075683594, -3.1670966148376465, -3.0549917221069336, -2.9428868293762207, -2.830781936645508, -2.718677043914795, -2.606572151184082, -2.494467258453369, -2.3823623657226562, -2.2702574729919434, -2.1581525802612305, -2.0460476875305176, -1.9339427947998047, -1.8218379020690918, -1.709733009338379, -1.597628116607666, -1.4855232238769531, -1.3734183311462402, -1.2613134384155273, -1.1492085456848145, -1.0371036529541016, -0.9249987602233887, -0.8128938674926758, -0.7007889747619629, -0.58868408203125, -0.4765791893005371, -0.3644742965698242, -0.25236940383911133, -0.14026451110839844, -0.028159618377685547, 0.08394527435302734, 0.19605016708374023, 0.3081550598144531, 0.420259952545166, 0.5323648452758789, 0.6444697380065918, 0.7565746307373047, 0.8686795234680176, 0.9807844161987305, 1.0928893089294434, 1.2049942016601562, 1.3170990943908691, 1.429203987121582, 1.541308879852295, 1.6534137725830078, 1.7655186653137207, 1.8776235580444336, 1.9897284507751465, 2.1018333435058594, 2.2139382362365723, 2.326043128967285, 2.438148021697998, 2.550252914428711, 2.662357807159424, 2.7744626998901367, 2.8865675926208496, 2.9986724853515625, 3.1107773780822754, 3.2228822708129883, 3.334987163543701, 3.447092056274414, 3.559196949005127, 3.67130184173584]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 8.0, 6.0, 10.0, 11.0, 10.0, 29.0, 25.0, 31.0, 50.0, 32.0, 34.0, 33.0, 49.0, 50.0, 56.0, 44.0, 47.0, 47.0, 50.0, 40.0, 43.0, 44.0, 46.0, 33.0, 33.0, 26.0, 13.0, 20.0, 20.0, 17.0, 6.0, 6.0, 6.0, 11.0, 4.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4813545942306519, -1.4335582256317139, -1.3857619762420654, -1.3379656076431274, -1.2901692390441895, -1.242372989654541, -1.194576621055603, -1.146780252456665, -1.0989840030670166, -1.0511876344680786, -1.0033913850784302, -0.9555950164794922, -0.907798707485199, -0.8600023984909058, -0.8122060298919678, -0.7644097208976746, -0.7166134119033813, -0.6688171029090881, -0.6210207939147949, -0.5732244253158569, -0.5254281163215637, -0.4776318073272705, -0.4298354685306549, -0.3820391297340393, -0.3342428207397461, -0.2864465117454529, -0.23865017294883728, -0.19085384905338287, -0.14305752515792847, -0.09526120126247406, -0.04746487736701965, 0.00033146142959594727, 0.04812788963317871, 0.09592421352863312, 0.14372053742408752, 0.19151686131954193, 0.23931318521499634, 0.28710949420928955, 0.33490583300590515, 0.38270217180252075, 0.43049848079681396, 0.4782947897911072, 0.5260910987854004, 0.5738874673843384, 0.6216837763786316, 0.6694800853729248, 0.7172764539718628, 0.765072762966156, 0.8128690719604492, 0.8606653809547424, 0.9084616899490356, 0.9562580585479736, 1.004054307937622, 1.05185067653656, 1.099647045135498, 1.1474432945251465, 1.1952396631240845, 1.2430360317230225, 1.290832281112671, 1.3386286497116089, 1.3864250183105469, 1.4342212677001953, 1.4820176362991333, 1.5298140048980713, 1.5776102542877197]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 10.0, 8.0, 13.0, 15.0, 24.0, 35.0, 84.0, 182.0, 337.0, 851.0, 2831.0, 19343.0, 380639.0, 608520.0, 29966.0, 3862.0, 1009.0, 399.0, 184.0, 98.0, 56.0, 35.0, 17.0, 9.0, 12.0, 8.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.828125, -2.749755859375, -2.67138671875, -2.593017578125, -2.5146484375, -2.436279296875, -2.35791015625, -2.279541015625, -2.201171875, -2.122802734375, -2.04443359375, -1.966064453125, -1.8876953125, -1.809326171875, -1.73095703125, -1.652587890625, -1.57421875, -1.495849609375, -1.41748046875, -1.339111328125, -1.2607421875, -1.182373046875, -1.10400390625, -1.025634765625, -0.947265625, -0.868896484375, -0.79052734375, -0.712158203125, -0.6337890625, -0.555419921875, -0.47705078125, -0.398681640625, -0.3203125, -0.241943359375, -0.16357421875, -0.085205078125, -0.0068359375, 0.071533203125, 0.14990234375, 0.228271484375, 0.306640625, 0.385009765625, 0.46337890625, 0.541748046875, 0.6201171875, 0.698486328125, 0.77685546875, 0.855224609375, 0.93359375, 1.011962890625, 1.09033203125, 1.168701171875, 1.2470703125, 1.325439453125, 1.40380859375, 1.482177734375, 1.560546875, 1.638916015625, 1.71728515625, 1.795654296875, 1.8740234375, 1.952392578125, 2.03076171875, 2.109130859375, 2.1875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 7.0, 11.0, 13.0, 29.0, 32.0, 55.0, 63.0, 94.0, 104.0, 96.0, 128.0, 84.0, 76.0, 71.0, 44.0, 37.0, 23.0, 13.0, 6.0, 4.0, 5.0, 9.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22119140625, -0.21104049682617188, -0.20088958740234375, -0.19073867797851562, -0.1805877685546875, -0.17043685913085938, -0.16028594970703125, -0.15013504028320312, -0.139984130859375, -0.12983322143554688, -0.11968231201171875, -0.10953140258789062, -0.0993804931640625, -0.08922958374023438, -0.07907867431640625, -0.06892776489257812, -0.05877685546875, -0.048625946044921875, -0.03847503662109375, -0.028324127197265625, -0.0181732177734375, -0.008022308349609375, 0.00212860107421875, 0.012279510498046875, 0.022430419921875, 0.032581329345703125, 0.04273223876953125, 0.052883148193359375, 0.0630340576171875, 0.07318496704101562, 0.08333587646484375, 0.09348678588867188, 0.1036376953125, 0.11378860473632812, 0.12393951416015625, 0.13409042358398438, 0.1442413330078125, 0.15439224243164062, 0.16454315185546875, 0.17469406127929688, 0.184844970703125, 0.19499588012695312, 0.20514678955078125, 0.21529769897460938, 0.2254486083984375, 0.23559951782226562, 0.24575042724609375, 0.2559013366699219, 0.26605224609375, 0.2762031555175781, 0.28635406494140625, 0.2965049743652344, 0.3066558837890625, 0.3168067932128906, 0.32695770263671875, 0.3371086120605469, 0.347259521484375, 0.3574104309082031, 0.36756134033203125, 0.3777122497558594, 0.3878631591796875, 0.3980140686035156, 0.40816497802734375, 0.4183158874511719, 0.428466796875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 9.0, 9.0, 13.0, 16.0, 20.0, 17.0, 30.0, 37.0, 75.0, 129.0, 242.0, 457.0, 1010.0, 2904.0, 9280.0, 39662.0, 208538.0, 564934.0, 174709.0, 33849.0, 8253.0, 2456.0, 939.0, 405.0, 214.0, 127.0, 64.0, 48.0, 35.0, 23.0, 19.0, 12.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.1171875, -1.0856704711914062, -1.0541534423828125, -1.0226364135742188, -0.991119384765625, -0.9596023559570312, -0.9280853271484375, -0.8965682983398438, -0.86505126953125, -0.8335342407226562, -0.8020172119140625, -0.7705001831054688, -0.738983154296875, -0.7074661254882812, -0.6759490966796875, -0.6444320678710938, -0.6129150390625, -0.5813980102539062, -0.5498809814453125, -0.5183639526367188, -0.486846923828125, -0.45532989501953125, -0.4238128662109375, -0.39229583740234375, -0.36077880859375, -0.32926177978515625, -0.2977447509765625, -0.26622772216796875, -0.234710693359375, -0.20319366455078125, -0.1716766357421875, -0.14015960693359375, -0.108642578125, -0.07712554931640625, -0.0456085205078125, -0.01409149169921875, 0.017425537109375, 0.04894256591796875, 0.0804595947265625, 0.11197662353515625, 0.14349365234375, 0.17501068115234375, 0.2065277099609375, 0.23804473876953125, 0.269561767578125, 0.30107879638671875, 0.3325958251953125, 0.36411285400390625, 0.3956298828125, 0.42714691162109375, 0.4586639404296875, 0.49018096923828125, 0.521697998046875, 0.5532150268554688, 0.5847320556640625, 0.6162490844726562, 0.64776611328125, 0.6792831420898438, 0.7108001708984375, 0.7423171997070312, 0.773834228515625, 0.8053512573242188, 0.8368682861328125, 0.8683853149414062, 0.89990234375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 0.0, 2.0, 3.0, 6.0, 6.0, 5.0, 16.0, 5.0, 15.0, 14.0, 11.0, 19.0, 23.0, 41.0, 27.0, 31.0, 39.0, 38.0, 45.0, 40.0, 50.0, 48.0, 55.0, 58.0, 51.0, 41.0, 40.0, 46.0, 31.0, 29.0, 22.0, 21.0, 26.0, 19.0, 22.0, 8.0, 12.0, 7.0, 12.0, 4.0, 8.0, 2.0, 2.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5869140625, -0.5660629272460938, -0.5452117919921875, -0.5243606567382812, -0.503509521484375, -0.48265838623046875, -0.4618072509765625, -0.44095611572265625, -0.42010498046875, -0.39925384521484375, -0.3784027099609375, -0.35755157470703125, -0.336700439453125, -0.31584930419921875, -0.2949981689453125, -0.27414703369140625, -0.2532958984375, -0.23244476318359375, -0.2115936279296875, -0.19074249267578125, -0.169891357421875, -0.14904022216796875, -0.1281890869140625, -0.10733795166015625, -0.08648681640625, -0.06563568115234375, -0.0447845458984375, -0.02393341064453125, -0.003082275390625, 0.01776885986328125, 0.0386199951171875, 0.05947113037109375, 0.080322265625, 0.10117340087890625, 0.1220245361328125, 0.14287567138671875, 0.163726806640625, 0.18457794189453125, 0.2054290771484375, 0.22628021240234375, 0.24713134765625, 0.26798248291015625, 0.2888336181640625, 0.30968475341796875, 0.330535888671875, 0.35138702392578125, 0.3722381591796875, 0.39308929443359375, 0.4139404296875, 0.43479156494140625, 0.4556427001953125, 0.47649383544921875, 0.497344970703125, 0.5181961059570312, 0.5390472412109375, 0.5598983764648438, 0.58074951171875, 0.6016006469726562, 0.6224517822265625, 0.6433029174804688, 0.664154052734375, 0.6850051879882812, 0.7058563232421875, 0.7267074584960938, 0.74755859375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 7.0, 11.0, 17.0, 53.0, 168.0, 415.0, 3352.0, 876505.0, 165968.0, 1585.0, 280.0, 124.0, 46.0, 13.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.888671875, -1.831207275390625, -1.77374267578125, -1.716278076171875, -1.6588134765625, -1.601348876953125, -1.54388427734375, -1.486419677734375, -1.428955078125, -1.371490478515625, -1.31402587890625, -1.256561279296875, -1.1990966796875, -1.141632080078125, -1.08416748046875, -1.026702880859375, -0.96923828125, -0.911773681640625, -0.85430908203125, -0.796844482421875, -0.7393798828125, -0.681915283203125, -0.62445068359375, -0.566986083984375, -0.509521484375, -0.452056884765625, -0.39459228515625, -0.337127685546875, -0.2796630859375, -0.222198486328125, -0.16473388671875, -0.107269287109375, -0.0498046875, 0.007659912109375, 0.06512451171875, 0.122589111328125, 0.1800537109375, 0.237518310546875, 0.29498291015625, 0.352447509765625, 0.409912109375, 0.467376708984375, 0.52484130859375, 0.582305908203125, 0.6397705078125, 0.697235107421875, 0.75469970703125, 0.812164306640625, 0.86962890625, 0.927093505859375, 0.98455810546875, 1.042022705078125, 1.0994873046875, 1.156951904296875, 1.21441650390625, 1.271881103515625, 1.329345703125, 1.386810302734375, 1.44427490234375, 1.501739501953125, 1.5592041015625, 1.616668701171875, 1.67413330078125, 1.731597900390625, 1.7890625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 4.0, 11.0, 11.0, 21.0, 26.0, 49.0, 75.0, 91.0, 137.0, 162.0, 126.0, 108.0, 66.0, 49.0, 27.0, 17.0, 7.0, 10.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.259845733642578e-05, -6.901286542415619e-05, -6.54272735118866e-05, -6.1841681599617e-05, -5.825608968734741e-05, -5.467049777507782e-05, -5.108490586280823e-05, -4.7499313950538635e-05, -4.391372203826904e-05, -4.032813012599945e-05, -3.674253821372986e-05, -3.3156946301460266e-05, -2.9571354389190674e-05, -2.598576247692108e-05, -2.240017056465149e-05, -1.8814578652381897e-05, -1.5228986740112305e-05, -1.1643394827842712e-05, -8.05780291557312e-06, -4.472211003303528e-06, -8.866190910339355e-07, 2.6989728212356567e-06, 6.284564733505249e-06, 9.870156645774841e-06, 1.3455748558044434e-05, 1.7041340470314026e-05, 2.0626932382583618e-05, 2.421252429485321e-05, 2.7798116207122803e-05, 3.1383708119392395e-05, 3.496930003166199e-05, 3.855489194393158e-05, 4.214048385620117e-05, 4.5726075768470764e-05, 4.9311667680740356e-05, 5.289725959300995e-05, 5.648285150527954e-05, 6.006844341754913e-05, 6.365403532981873e-05, 6.723962724208832e-05, 7.082521915435791e-05, 7.44108110666275e-05, 7.79964029788971e-05, 8.158199489116669e-05, 8.516758680343628e-05, 8.875317871570587e-05, 9.233877062797546e-05, 9.592436254024506e-05, 9.950995445251465e-05, 0.00010309554636478424, 0.00010668113827705383, 0.00011026673018932343, 0.00011385232210159302, 0.00011743791401386261, 0.0001210235059261322, 0.0001246090978384018, 0.0001281946897506714, 0.00013178028166294098, 0.00013536587357521057, 0.00013895146548748016, 0.00014253705739974976, 0.00014612264931201935, 0.00014970824122428894, 0.00015329383313655853, 0.00015687942504882812]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 19.0, 55.0, 119.0, 346.0, 3380.0, 1033962.0, 9997.0, 424.0, 165.0, 61.0, 19.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.345703125, -2.26904296875, -2.1923828125, -2.11572265625, -2.0390625, -1.96240234375, -1.8857421875, -1.80908203125, -1.732421875, -1.65576171875, -1.5791015625, -1.50244140625, -1.42578125, -1.34912109375, -1.2724609375, -1.19580078125, -1.119140625, -1.04248046875, -0.9658203125, -0.88916015625, -0.8125, -0.73583984375, -0.6591796875, -0.58251953125, -0.505859375, -0.42919921875, -0.3525390625, -0.27587890625, -0.19921875, -0.12255859375, -0.0458984375, 0.03076171875, 0.107421875, 0.18408203125, 0.2607421875, 0.33740234375, 0.4140625, 0.49072265625, 0.5673828125, 0.64404296875, 0.720703125, 0.79736328125, 0.8740234375, 0.95068359375, 1.02734375, 1.10400390625, 1.1806640625, 1.25732421875, 1.333984375, 1.41064453125, 1.4873046875, 1.56396484375, 1.640625, 1.71728515625, 1.7939453125, 1.87060546875, 1.947265625, 2.02392578125, 2.1005859375, 2.17724609375, 2.25390625, 2.33056640625, 2.4072265625, 2.48388671875, 2.560546875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 9.0, 12.0, 95.0, 331.0, 406.0, 127.0, 20.0, 9.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.544921875, -1.4935455322265625, -1.442169189453125, -1.3907928466796875, -1.33941650390625, -1.2880401611328125, -1.236663818359375, -1.1852874755859375, -1.1339111328125, -1.0825347900390625, -1.031158447265625, -0.9797821044921875, -0.92840576171875, -0.8770294189453125, -0.825653076171875, -0.7742767333984375, -0.722900390625, -0.6715240478515625, -0.620147705078125, -0.5687713623046875, -0.51739501953125, -0.4660186767578125, -0.414642333984375, -0.3632659912109375, -0.3118896484375, -0.2605133056640625, -0.209136962890625, -0.1577606201171875, -0.10638427734375, -0.0550079345703125, -0.003631591796875, 0.0477447509765625, 0.09912109375, 0.1504974365234375, 0.201873779296875, 0.2532501220703125, 0.30462646484375, 0.3560028076171875, 0.407379150390625, 0.4587554931640625, 0.5101318359375, 0.5615081787109375, 0.612884521484375, 0.6642608642578125, 0.71563720703125, 0.7670135498046875, 0.818389892578125, 0.8697662353515625, 0.921142578125, 0.9725189208984375, 1.023895263671875, 1.0752716064453125, 1.12664794921875, 1.1780242919921875, 1.229400634765625, 1.2807769775390625, 1.3321533203125, 1.3835296630859375, 1.434906005859375, 1.4862823486328125, 1.53765869140625, 1.5890350341796875, 1.640411376953125, 1.6917877197265625, 1.7431640625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 8.0, 12.0, 25.0, 95.0, 213.0, 310.0, 208.0, 87.0, 26.0, 16.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.107353210449219, -7.7137064933776855, -7.3200602531433105, -6.926413536071777, -6.532767295837402, -6.139120578765869, -5.745473861694336, -5.351827621459961, -4.958180904388428, -4.5645341873168945, -4.1708879470825195, -3.7772412300109863, -3.3835947513580322, -2.989948272705078, -2.596301555633545, -2.202655076980591, -1.8090085983276367, -1.4153621196746826, -1.021715521812439, -0.6280689239501953, -0.2344224452972412, 0.1592240333557129, 0.5528707504272461, 0.9465172290802002, 1.3401637077331543, 1.7338101863861084, 2.1274566650390625, 2.5211033821105957, 2.91474986076355, 3.308396339416504, 3.702043056488037, 4.09568977355957, 4.489336013793945, 4.8829827308654785, 5.2766289710998535, 5.670275688171387, 6.063921928405762, 6.457568645477295, 6.851215362548828, 7.244861602783203, 7.638508319854736, 8.03215503692627, 8.425801277160645, 8.819448471069336, 9.213094711303711, 9.606740951538086, 10.000387191772461, 10.394034385681152, 10.787680625915527, 11.181326866149902, 11.574974060058594, 11.968620300292969, 12.362266540527344, 12.755912780761719, 13.14955997467041, 13.543206214904785, 13.936853408813477, 14.330499649047852, 14.724146842956543, 15.117793083190918, 15.511439323425293, 15.905086517333984, 16.29873275756836, 16.692378997802734, 17.08602523803711]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 2.0, 1.0, 8.0, 10.0, 5.0, 13.0, 15.0, 7.0, 14.0, 23.0, 24.0, 21.0, 28.0, 29.0, 23.0, 38.0, 40.0, 35.0, 43.0, 36.0, 50.0, 32.0, 40.0, 43.0, 39.0, 36.0, 54.0, 39.0, 31.0, 34.0, 23.0, 27.0, 24.0, 21.0, 24.0, 12.0, 11.0, 7.0, 10.0, 6.0, 8.0, 3.0, 4.0, 3.0, 1.0, 4.0, 1.0, 5.0], "bins": [-3.5458197593688965, -3.450713872909546, -3.3556082248687744, -3.260502338409424, -3.1653966903686523, -3.0702908039093018, -2.975184917449951, -2.8800792694091797, -2.784973621368408, -2.6898677349090576, -2.594762086868286, -2.4996562004089355, -2.404550552368164, -2.3094446659088135, -2.214338779449463, -2.1192331314086914, -2.024127244949341, -1.9290214776992798, -1.8339157104492188, -1.7388098239898682, -1.6437041759490967, -1.548598289489746, -1.453492522239685, -1.358386754989624, -1.263280987739563, -1.168175220489502, -1.073069453239441, -0.9779636263847351, -0.8828578591346741, -0.787752091884613, -0.6926462650299072, -0.5975404977798462, -0.502434492111206, -0.407328724861145, -0.3122229278087616, -0.21711713075637817, -0.12201136350631714, -0.026905596256256104, 0.06820023059844971, 0.16330599784851074, 0.2584117650985718, 0.3535175323486328, 0.44862332940101624, 0.5437291264533997, 0.6388348937034607, 0.7339406609535217, 0.8290464878082275, 0.9241522550582886, 1.0192580223083496, 1.1143637895584106, 1.2094695568084717, 1.3045754432678223, 1.3996810913085938, 1.4947869777679443, 1.5898927450180054, 1.6849985122680664, 1.7801042795181274, 1.8752100467681885, 1.9703158140182495, 2.0654215812683105, 2.160527467727661, 2.2556331157684326, 2.350739002227783, 2.4458446502685547, 2.5409505367279053]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 4.0, 2.0, 9.0, 3.0, 11.0, 26.0, 31.0, 36.0, 62.0, 131.0, 196.0, 404.0, 861.0, 2048.0, 7225.0, 37962.0, 1496392.0, 2598875.0, 38647.0, 7203.0, 2167.0, 832.0, 411.0, 216.0, 147.0, 97.0, 61.0, 61.0, 39.0, 28.0, 22.0, 18.0, 15.0, 7.0, 9.0, 4.0, 4.0, 4.0, 8.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.4150390625, -1.3645172119140625, -1.313995361328125, -1.2634735107421875, -1.21295166015625, -1.1624298095703125, -1.111907958984375, -1.0613861083984375, -1.0108642578125, -0.9603424072265625, -0.909820556640625, -0.8592987060546875, -0.80877685546875, -0.7582550048828125, -0.707733154296875, -0.6572113037109375, -0.606689453125, -0.5561676025390625, -0.505645751953125, -0.4551239013671875, -0.40460205078125, -0.3540802001953125, -0.303558349609375, -0.2530364990234375, -0.2025146484375, -0.1519927978515625, -0.101470947265625, -0.0509490966796875, -0.00042724609375, 0.0500946044921875, 0.100616455078125, 0.1511383056640625, 0.20166015625, 0.2521820068359375, 0.302703857421875, 0.3532257080078125, 0.40374755859375, 0.4542694091796875, 0.504791259765625, 0.5553131103515625, 0.6058349609375, 0.6563568115234375, 0.706878662109375, 0.7574005126953125, 0.80792236328125, 0.8584442138671875, 0.908966064453125, 0.9594879150390625, 1.010009765625, 1.0605316162109375, 1.111053466796875, 1.1615753173828125, 1.21209716796875, 1.2626190185546875, 1.313140869140625, 1.3636627197265625, 1.4141845703125, 1.4647064208984375, 1.515228271484375, 1.5657501220703125, 1.61627197265625, 1.6667938232421875, 1.717315673828125, 1.7678375244140625, 1.818359375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 5.0, 6.0, 6.0, 8.0, 17.0, 14.0, 31.0, 63.0, 94.0, 98.0, 94.0, 112.0, 110.0, 77.0, 74.0, 72.0, 41.0, 37.0, 26.0, 12.0, 7.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2607421875, -0.2492218017578125, -0.237701416015625, -0.2261810302734375, -0.21466064453125, -0.2031402587890625, -0.191619873046875, -0.1800994873046875, -0.1685791015625, -0.1570587158203125, -0.145538330078125, -0.1340179443359375, -0.12249755859375, -0.1109771728515625, -0.099456787109375, -0.0879364013671875, -0.076416015625, -0.0648956298828125, -0.053375244140625, -0.0418548583984375, -0.03033447265625, -0.0188140869140625, -0.007293701171875, 0.0042266845703125, 0.0157470703125, 0.0272674560546875, 0.038787841796875, 0.0503082275390625, 0.06182861328125, 0.0733489990234375, 0.084869384765625, 0.0963897705078125, 0.10791015625, 0.1194305419921875, 0.130950927734375, 0.1424713134765625, 0.15399169921875, 0.1655120849609375, 0.177032470703125, 0.1885528564453125, 0.2000732421875, 0.2115936279296875, 0.223114013671875, 0.2346343994140625, 0.24615478515625, 0.2576751708984375, 0.269195556640625, 0.2807159423828125, 0.292236328125, 0.3037567138671875, 0.315277099609375, 0.3267974853515625, 0.33831787109375, 0.3498382568359375, 0.361358642578125, 0.3728790283203125, 0.3843994140625, 0.3959197998046875, 0.407440185546875, 0.4189605712890625, 0.43048095703125, 0.4420013427734375, 0.453521728515625, 0.4650421142578125, 0.4765625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 5.0, 4.0, 9.0, 9.0, 22.0, 34.0, 63.0, 107.0, 184.0, 431.0, 876.0, 2335.0, 9067.0, 87146.0, 3931138.0, 145602.0, 12395.0, 2928.0, 1033.0, 448.0, 210.0, 108.0, 65.0, 35.0, 16.0, 10.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.5546875, -2.496063232421875, -2.43743896484375, -2.378814697265625, -2.3201904296875, -2.261566162109375, -2.20294189453125, -2.144317626953125, -2.085693359375, -2.027069091796875, -1.96844482421875, -1.909820556640625, -1.8511962890625, -1.792572021484375, -1.73394775390625, -1.675323486328125, -1.61669921875, -1.558074951171875, -1.49945068359375, -1.440826416015625, -1.3822021484375, -1.323577880859375, -1.26495361328125, -1.206329345703125, -1.147705078125, -1.089080810546875, -1.03045654296875, -0.971832275390625, -0.9132080078125, -0.854583740234375, -0.79595947265625, -0.737335205078125, -0.6787109375, -0.620086669921875, -0.56146240234375, -0.502838134765625, -0.4442138671875, -0.385589599609375, -0.32696533203125, -0.268341064453125, -0.209716796875, -0.151092529296875, -0.09246826171875, -0.033843994140625, 0.0247802734375, 0.083404541015625, 0.14202880859375, 0.200653076171875, 0.25927734375, 0.317901611328125, 0.37652587890625, 0.435150146484375, 0.4937744140625, 0.552398681640625, 0.61102294921875, 0.669647216796875, 0.728271484375, 0.786895751953125, 0.84552001953125, 0.904144287109375, 0.9627685546875, 1.021392822265625, 1.08001708984375, 1.138641357421875, 1.197265625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 16.0, 15.0, 33.0, 51.0, 97.0, 272.0, 1411.0, 1590.0, 294.0, 106.0, 59.0, 53.0, 34.0, 10.0, 11.0, 4.0, 5.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64208984375, -0.623748779296875, -0.60540771484375, -0.587066650390625, -0.5687255859375, -0.550384521484375, -0.53204345703125, -0.513702392578125, -0.495361328125, -0.477020263671875, -0.45867919921875, -0.440338134765625, -0.4219970703125, -0.403656005859375, -0.38531494140625, -0.366973876953125, -0.3486328125, -0.330291748046875, -0.31195068359375, -0.293609619140625, -0.2752685546875, -0.256927490234375, -0.23858642578125, -0.220245361328125, -0.201904296875, -0.183563232421875, -0.16522216796875, -0.146881103515625, -0.1285400390625, -0.110198974609375, -0.09185791015625, -0.073516845703125, -0.05517578125, -0.036834716796875, -0.01849365234375, -0.000152587890625, 0.0181884765625, 0.036529541015625, 0.05487060546875, 0.073211669921875, 0.091552734375, 0.109893798828125, 0.12823486328125, 0.146575927734375, 0.1649169921875, 0.183258056640625, 0.20159912109375, 0.219940185546875, 0.23828125, 0.256622314453125, 0.27496337890625, 0.293304443359375, 0.3116455078125, 0.329986572265625, 0.34832763671875, 0.366668701171875, 0.385009765625, 0.403350830078125, 0.42169189453125, 0.440032958984375, 0.4583740234375, 0.476715087890625, 0.49505615234375, 0.513397216796875, 0.53173828125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 1.0, 7.0, 27.0, 105.0, 409.0, 342.0, 84.0, 18.0, 5.0, 7.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.522583961486816, -4.281192302703857, -4.039801120758057, -3.7984094619750977, -3.5570180416107178, -3.315626621246338, -3.074235200881958, -2.832843780517578, -2.591452121734619, -2.3500607013702393, -2.1086692810058594, -1.86727774143219, -1.6258862018585205, -1.3844947814941406, -1.1431033611297607, -0.9017118215560913, -0.660320520401001, -0.4189290404319763, -0.17753759026527405, 0.06385385990142822, 0.3052453398704529, 0.5466368198394775, 0.7880282402038574, 1.0294197797775269, 1.2708112001419067, 1.5122026205062866, 1.753594160079956, 1.994985580444336, 2.236377000808716, 2.4777684211730957, 2.7191600799560547, 2.9605515003204346, 3.2019429206848145, 3.4433343410491943, 3.684725761413574, 3.926117420196533, 4.167508602142334, 4.408900260925293, 4.650291442871094, 4.891683101654053, 5.133074760437012, 5.374466419219971, 5.6158576011657715, 5.8572492599487305, 6.098640441894531, 6.34003210067749, 6.581423759460449, 6.82281494140625, 7.064206123352051, 7.30559778213501, 7.5469889640808105, 7.7883806228637695, 8.02977180480957, 8.271163940429688, 8.512555122375488, 8.753946304321289, 8.995338439941406, 9.236729621887207, 9.478121757507324, 9.719512939453125, 9.960904121398926, 10.202295303344727, 10.443687438964844, 10.685078620910645, 10.926469802856445]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 6.0, 9.0, 13.0, 17.0, 27.0, 39.0, 37.0, 57.0, 66.0, 74.0, 74.0, 84.0, 81.0, 89.0, 75.0, 56.0, 56.0, 30.0, 31.0, 31.0, 21.0, 12.0, 4.0, 4.0, 5.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9352753162384033, -1.8642559051513672, -1.7932363748550415, -1.7222169637680054, -1.6511974334716797, -1.5801780223846436, -1.5091586112976074, -1.4381392002105713, -1.3671196699142456, -1.2961002588272095, -1.2250807285308838, -1.1540613174438477, -1.0830419063568115, -1.0120223760604858, -0.9410029649734497, -0.8699834942817688, -0.7989640235900879, -0.727944552898407, -0.6569250822067261, -0.5859056711196899, -0.514886200428009, -0.4438667297363281, -0.3728472888469696, -0.3018278479576111, -0.23080837726593018, -0.15978892147541046, -0.08876946568489075, -0.017750009894371033, 0.05326944589614868, 0.12428891658782959, 0.1953083574771881, 0.26632779836654663, 0.33734703063964844, 0.40836650133132935, 0.47938594222068787, 0.5504053831100464, 0.6214248538017273, 0.6924443244934082, 0.7634637355804443, 0.8344832062721252, 0.9055026769638062, 0.9765221476554871, 1.047541618347168, 1.118561029434204, 1.1895804405212402, 1.260599970817566, 1.331619381904602, 1.4026389122009277, 1.4736583232879639, 1.544677734375, 1.6156972646713257, 1.6867166757583618, 1.7577362060546875, 1.8287556171417236, 1.8997750282287598, 1.970794439315796, 2.041813850402832, 2.112833261489868, 2.1838526725769043, 2.2548723220825195, 2.3258917331695557, 2.396911144256592, 2.467930555343628, 2.538949966430664, 2.6099696159362793]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 9.0, 5.0, 8.0, 12.0, 16.0, 24.0, 42.0, 69.0, 73.0, 136.0, 223.0, 394.0, 888.0, 2432.0, 10022.0, 64780.0, 515307.0, 394771.0, 47751.0, 7851.0, 2055.0, 787.0, 353.0, 197.0, 102.0, 88.0, 42.0, 40.0, 22.0, 14.0, 9.0, 10.0, 9.0, 4.0, 5.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1728515625, -1.1216888427734375, -1.070526123046875, -1.0193634033203125, -0.96820068359375, -0.9170379638671875, -0.865875244140625, -0.8147125244140625, -0.7635498046875, -0.7123870849609375, -0.661224365234375, -0.6100616455078125, -0.55889892578125, -0.5077362060546875, -0.456573486328125, -0.4054107666015625, -0.354248046875, -0.3030853271484375, -0.251922607421875, -0.2007598876953125, -0.14959716796875, -0.0984344482421875, -0.047271728515625, 0.0038909912109375, 0.0550537109375, 0.1062164306640625, 0.157379150390625, 0.2085418701171875, 0.25970458984375, 0.3108673095703125, 0.362030029296875, 0.4131927490234375, 0.46435546875, 0.5155181884765625, 0.566680908203125, 0.6178436279296875, 0.66900634765625, 0.7201690673828125, 0.771331787109375, 0.8224945068359375, 0.8736572265625, 0.9248199462890625, 0.975982666015625, 1.0271453857421875, 1.07830810546875, 1.1294708251953125, 1.180633544921875, 1.2317962646484375, 1.282958984375, 1.3341217041015625, 1.385284423828125, 1.4364471435546875, 1.48760986328125, 1.5387725830078125, 1.589935302734375, 1.6410980224609375, 1.6922607421875, 1.7434234619140625, 1.794586181640625, 1.8457489013671875, 1.89691162109375, 1.9480743408203125, 1.999237060546875, 2.0503997802734375, 2.1015625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 7.0, 11.0, 21.0, 31.0, 56.0, 74.0, 100.0, 105.0, 120.0, 127.0, 76.0, 100.0, 67.0, 45.0, 29.0, 17.0, 9.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.281982421875, -0.2683906555175781, -0.25479888916015625, -0.24120712280273438, -0.2276153564453125, -0.21402359008789062, -0.20043182373046875, -0.18684005737304688, -0.173248291015625, -0.15965652465820312, -0.14606475830078125, -0.13247299194335938, -0.1188812255859375, -0.10528945922851562, -0.09169769287109375, -0.07810592651367188, -0.06451416015625, -0.050922393798828125, -0.03733062744140625, -0.023738861083984375, -0.0101470947265625, 0.003444671630859375, 0.01703643798828125, 0.030628204345703125, 0.044219970703125, 0.057811737060546875, 0.07140350341796875, 0.08499526977539062, 0.0985870361328125, 0.11217880249023438, 0.12577056884765625, 0.13936233520507812, 0.1529541015625, 0.16654586791992188, 0.18013763427734375, 0.19372940063476562, 0.2073211669921875, 0.22091293334960938, 0.23450469970703125, 0.24809646606445312, 0.261688232421875, 0.2752799987792969, 0.28887176513671875, 0.3024635314941406, 0.3160552978515625, 0.3296470642089844, 0.34323883056640625, 0.3568305969238281, 0.37042236328125, 0.3840141296386719, 0.39760589599609375, 0.4111976623535156, 0.4247894287109375, 0.4383811950683594, 0.45197296142578125, 0.4655647277832031, 0.479156494140625, 0.4927482604980469, 0.5063400268554688, 0.5199317932128906, 0.5335235595703125, 0.5471153259277344, 0.5607070922851562, 0.5742988586425781, 0.587890625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 9.0, 9.0, 13.0, 10.0, 28.0, 29.0, 45.0, 63.0, 113.0, 172.0, 352.0, 674.0, 1676.0, 4958.0, 17921.0, 73710.0, 318234.0, 466619.0, 122869.0, 28864.0, 7829.0, 2429.0, 931.0, 423.0, 195.0, 126.0, 74.0, 47.0, 39.0, 30.0, 15.0, 9.0, 11.0, 7.0, 4.0, 3.0, 1.0, 0.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.9931640625, -0.9649276733398438, -0.9366912841796875, -0.9084548950195312, -0.880218505859375, -0.8519821166992188, -0.8237457275390625, -0.7955093383789062, -0.76727294921875, -0.7390365600585938, -0.7108001708984375, -0.6825637817382812, -0.654327392578125, -0.6260910034179688, -0.5978546142578125, -0.5696182250976562, -0.5413818359375, -0.5131454467773438, -0.4849090576171875, -0.45667266845703125, -0.428436279296875, -0.40019989013671875, -0.3719635009765625, -0.34372711181640625, -0.31549072265625, -0.28725433349609375, -0.2590179443359375, -0.23078155517578125, -0.202545166015625, -0.17430877685546875, -0.1460723876953125, -0.11783599853515625, -0.089599609375, -0.06136322021484375, -0.0331268310546875, -0.00489044189453125, 0.023345947265625, 0.05158233642578125, 0.0798187255859375, 0.10805511474609375, 0.13629150390625, 0.16452789306640625, 0.1927642822265625, 0.22100067138671875, 0.249237060546875, 0.27747344970703125, 0.3057098388671875, 0.33394622802734375, 0.3621826171875, 0.39041900634765625, 0.4186553955078125, 0.44689178466796875, 0.475128173828125, 0.5033645629882812, 0.5316009521484375, 0.5598373413085938, 0.58807373046875, 0.6163101196289062, 0.6445465087890625, 0.6727828979492188, 0.701019287109375, 0.7292556762695312, 0.7574920654296875, 0.7857284545898438, 0.81396484375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 0.0, 1.0, 3.0, 5.0, 3.0, 5.0, 8.0, 4.0, 8.0, 6.0, 14.0, 14.0, 18.0, 18.0, 28.0, 25.0, 24.0, 30.0, 35.0, 46.0, 45.0, 54.0, 46.0, 45.0, 40.0, 39.0, 40.0, 41.0, 38.0, 47.0, 34.0, 30.0, 36.0, 18.0, 29.0, 25.0, 23.0, 16.0, 19.0, 13.0, 7.0, 5.0, 6.0, 5.0, 6.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.67919921875, -0.6577529907226562, -0.6363067626953125, -0.6148605346679688, -0.593414306640625, -0.5719680786132812, -0.5505218505859375, -0.5290756225585938, -0.50762939453125, -0.48618316650390625, -0.4647369384765625, -0.44329071044921875, -0.421844482421875, -0.40039825439453125, -0.3789520263671875, -0.35750579833984375, -0.3360595703125, -0.31461334228515625, -0.2931671142578125, -0.27172088623046875, -0.250274658203125, -0.22882843017578125, -0.2073822021484375, -0.18593597412109375, -0.16448974609375, -0.14304351806640625, -0.1215972900390625, -0.10015106201171875, -0.078704833984375, -0.05725860595703125, -0.0358123779296875, -0.01436614990234375, 0.007080078125, 0.02852630615234375, 0.0499725341796875, 0.07141876220703125, 0.092864990234375, 0.11431121826171875, 0.1357574462890625, 0.15720367431640625, 0.17864990234375, 0.20009613037109375, 0.2215423583984375, 0.24298858642578125, 0.264434814453125, 0.28588104248046875, 0.3073272705078125, 0.32877349853515625, 0.3502197265625, 0.37166595458984375, 0.3931121826171875, 0.41455841064453125, 0.436004638671875, 0.45745086669921875, 0.4788970947265625, 0.5003433227539062, 0.52178955078125, 0.5432357788085938, 0.5646820068359375, 0.5861282348632812, 0.607574462890625, 0.6290206909179688, 0.6504669189453125, 0.6719131469726562, 0.693359375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 10.0, 4.0, 10.0, 18.0, 18.0, 33.0, 58.0, 62.0, 113.0, 194.0, 427.0, 932.0, 3172.0, 19614.0, 243758.0, 692029.0, 76896.0, 8172.0, 1704.0, 592.0, 263.0, 159.0, 108.0, 67.0, 44.0, 38.0, 15.0, 16.0, 13.0, 3.0, 8.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.392578125, -0.3757171630859375, -0.358856201171875, -0.3419952392578125, -0.32513427734375, -0.3082733154296875, -0.291412353515625, -0.2745513916015625, -0.2576904296875, -0.2408294677734375, -0.223968505859375, -0.2071075439453125, -0.19024658203125, -0.1733856201171875, -0.156524658203125, -0.1396636962890625, -0.122802734375, -0.1059417724609375, -0.089080810546875, -0.0722198486328125, -0.05535888671875, -0.0384979248046875, -0.021636962890625, -0.0047760009765625, 0.0120849609375, 0.0289459228515625, 0.045806884765625, 0.0626678466796875, 0.07952880859375, 0.0963897705078125, 0.113250732421875, 0.1301116943359375, 0.14697265625, 0.1638336181640625, 0.180694580078125, 0.1975555419921875, 0.21441650390625, 0.2312774658203125, 0.248138427734375, 0.2649993896484375, 0.2818603515625, 0.2987213134765625, 0.315582275390625, 0.3324432373046875, 0.34930419921875, 0.3661651611328125, 0.383026123046875, 0.3998870849609375, 0.416748046875, 0.4336090087890625, 0.450469970703125, 0.4673309326171875, 0.48419189453125, 0.5010528564453125, 0.517913818359375, 0.5347747802734375, 0.5516357421875, 0.5684967041015625, 0.585357666015625, 0.6022186279296875, 0.61907958984375, 0.6359405517578125, 0.652801513671875, 0.6696624755859375, 0.6865234375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 7.0, 9.0, 19.0, 32.0, 49.0, 79.0, 144.0, 202.0, 182.0, 126.0, 71.0, 49.0, 15.0, 11.0, 4.0, 8.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.577108383178711e-05, -8.091423660516739e-05, -7.605738937854767e-05, -7.120054215192795e-05, -6.634369492530823e-05, -6.148684769868851e-05, -5.663000047206879e-05, -5.1773153245449066e-05, -4.6916306018829346e-05, -4.2059458792209625e-05, -3.7202611565589905e-05, -3.2345764338970184e-05, -2.7488917112350464e-05, -2.2632069885730743e-05, -1.7775222659111023e-05, -1.2918375432491302e-05, -8.061528205871582e-06, -3.2046809792518616e-06, 1.6521662473678589e-06, 6.509013473987579e-06, 1.13658607006073e-05, 1.622270792722702e-05, 2.107955515384674e-05, 2.593640238046646e-05, 3.079324960708618e-05, 3.56500968337059e-05, 4.050694406032562e-05, 4.536379128694534e-05, 5.0220638513565063e-05, 5.5077485740184784e-05, 5.9934332966804504e-05, 6.479118019342422e-05, 6.964802742004395e-05, 7.450487464666367e-05, 7.936172187328339e-05, 8.42185690999031e-05, 8.907541632652283e-05, 9.393226355314255e-05, 9.878911077976227e-05, 0.00010364595800638199, 0.00010850280523300171, 0.00011335965245962143, 0.00011821649968624115, 0.00012307334691286087, 0.0001279301941394806, 0.0001327870413661003, 0.00013764388859272003, 0.00014250073581933975, 0.00014735758304595947, 0.0001522144302725792, 0.00015707127749919891, 0.00016192812472581863, 0.00016678497195243835, 0.00017164181917905807, 0.0001764986664056778, 0.00018135551363229752, 0.00018621236085891724, 0.00019106920808553696, 0.00019592605531215668, 0.0002007829025387764, 0.00020563974976539612, 0.00021049659699201584, 0.00021535344421863556, 0.00022021029144525528, 0.000225067138671875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 13.0, 18.0, 24.0, 69.0, 131.0, 320.0, 876.0, 4033.0, 59561.0, 861998.0, 113617.0, 6103.0, 1105.0, 368.0, 171.0, 74.0, 35.0, 16.0, 12.0, 5.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85009765625, -0.827484130859375, -0.80487060546875, -0.782257080078125, -0.7596435546875, -0.737030029296875, -0.71441650390625, -0.691802978515625, -0.669189453125, -0.646575927734375, -0.62396240234375, -0.601348876953125, -0.5787353515625, -0.556121826171875, -0.53350830078125, -0.510894775390625, -0.48828125, -0.465667724609375, -0.44305419921875, -0.420440673828125, -0.3978271484375, -0.375213623046875, -0.35260009765625, -0.329986572265625, -0.307373046875, -0.284759521484375, -0.26214599609375, -0.239532470703125, -0.2169189453125, -0.194305419921875, -0.17169189453125, -0.149078369140625, -0.12646484375, -0.103851318359375, -0.08123779296875, -0.058624267578125, -0.0360107421875, -0.013397216796875, 0.00921630859375, 0.031829833984375, 0.054443359375, 0.077056884765625, 0.09967041015625, 0.122283935546875, 0.1448974609375, 0.167510986328125, 0.19012451171875, 0.212738037109375, 0.2353515625, 0.257965087890625, 0.28057861328125, 0.303192138671875, 0.3258056640625, 0.348419189453125, 0.37103271484375, 0.393646240234375, 0.416259765625, 0.438873291015625, 0.46148681640625, 0.484100341796875, 0.5067138671875, 0.529327392578125, 0.55194091796875, 0.574554443359375, 0.59716796875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 7.0, 12.0, 16.0, 31.0, 66.0, 121.0, 211.0, 217.0, 128.0, 95.0, 47.0, 25.0, 11.0, 9.0, 5.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9072265625, -0.8871574401855469, -0.8670883178710938, -0.8470191955566406, -0.8269500732421875, -0.8068809509277344, -0.7868118286132812, -0.7667427062988281, -0.746673583984375, -0.7266044616699219, -0.7065353393554688, -0.6864662170410156, -0.6663970947265625, -0.6463279724121094, -0.6262588500976562, -0.6061897277832031, -0.58612060546875, -0.5660514831542969, -0.5459823608398438, -0.5259132385253906, -0.5058441162109375, -0.4857749938964844, -0.46570587158203125, -0.4456367492675781, -0.425567626953125, -0.4054985046386719, -0.38542938232421875, -0.3653602600097656, -0.3452911376953125, -0.3252220153808594, -0.30515289306640625, -0.2850837707519531, -0.2650146484375, -0.24494552612304688, -0.22487640380859375, -0.20480728149414062, -0.1847381591796875, -0.16466903686523438, -0.14459991455078125, -0.12453079223632812, -0.104461669921875, -0.08439254760742188, -0.06432342529296875, -0.044254302978515625, -0.0241851806640625, -0.004116058349609375, 0.01595306396484375, 0.036022186279296875, 0.05609130859375, 0.07616043090820312, 0.09622955322265625, 0.11629867553710938, 0.1363677978515625, 0.15643692016601562, 0.17650604248046875, 0.19657516479492188, 0.216644287109375, 0.23671340942382812, 0.25678253173828125, 0.2768516540527344, 0.2969207763671875, 0.3169898986816406, 0.33705902099609375, 0.3571281433105469, 0.377197265625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 5.0, 4.0, 7.0, 10.0, 15.0, 23.0, 47.0, 53.0, 84.0, 100.0, 141.0, 133.0, 117.0, 108.0, 54.0, 34.0, 25.0, 22.0, 6.0, 10.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.417672157287598, -7.24643611907959, -7.075200080871582, -6.903964042663574, -6.732728004455566, -6.561491966247559, -6.390255928039551, -6.219019889831543, -6.047783851623535, -5.876547813415527, -5.7053117752075195, -5.534075736999512, -5.362839698791504, -5.191603660583496, -5.020367622375488, -4.8491315841674805, -4.677895545959473, -4.506659507751465, -4.335423469543457, -4.164187431335449, -3.9929513931274414, -3.8217153549194336, -3.650479316711426, -3.479243278503418, -3.308006763458252, -3.136770725250244, -2.9655346870422363, -2.7942986488342285, -2.6230626106262207, -2.451826572418213, -2.280590534210205, -2.1093544960021973, -1.9381182193756104, -1.7668821811676025, -1.5956461429595947, -1.424410104751587, -1.253174066543579, -1.0819380283355713, -0.9107018709182739, -0.7394658327102661, -0.5682297945022583, -0.3969937562942505, -0.2257576882839203, -0.05452162027359009, 0.11671441793441772, 0.28795045614242554, 0.4591865539550781, 0.6304225921630859, 0.8016586303710938, 0.9728946685791016, 1.1441307067871094, 1.3153667449951172, 1.486602783203125, 1.6578388214111328, 1.8290749788284302, 2.0003108978271484, 2.1715469360351562, 2.342782974243164, 2.514019012451172, 2.6852550506591797, 2.8564910888671875, 3.0277271270751953, 3.198963165283203, 3.370199203491211, 3.541435480117798]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 5.0, 4.0, 3.0, 8.0, 5.0, 7.0, 4.0, 9.0, 10.0, 18.0, 16.0, 15.0, 19.0, 26.0, 35.0, 47.0, 43.0, 43.0, 54.0, 43.0, 63.0, 36.0, 44.0, 43.0, 46.0, 37.0, 37.0, 38.0, 45.0, 34.0, 31.0, 25.0, 14.0, 27.0, 15.0, 12.0, 12.0, 10.0, 6.0, 5.0, 4.0, 8.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.011470794677734, -3.9004287719726562, -3.7893869876861572, -3.678344964981079, -3.56730318069458, -3.456261157989502, -3.345219135284424, -3.2341771125793457, -3.1231353282928467, -3.0120933055877686, -2.9010515213012695, -2.7900094985961914, -2.6789674758911133, -2.5679256916046143, -2.456883668899536, -2.345841884613037, -2.234799861907959, -2.123757839202881, -2.012716054916382, -1.9016740322113037, -1.7906321287155151, -1.6795902252197266, -1.5685482025146484, -1.4575062990188599, -1.3464643955230713, -1.2354224920272827, -1.1243805885314941, -1.013338565826416, -0.9022966623306274, -0.7912547588348389, -0.6802127957344055, -0.5691708326339722, -0.4581291675567627, -0.34708723425865173, -0.23604530096054077, -0.1250033676624298, -0.013961434364318848, 0.09708046913146973, 0.20812243223190308, 0.3191643953323364, 0.430206298828125, 0.5412482023239136, 0.6522901654243469, 0.7633321285247803, 0.8743740320205688, 0.9854159355163574, 1.0964579582214355, 1.2074998617172241, 1.3185417652130127, 1.4295836687088013, 1.5406255722045898, 1.651667594909668, 1.7627094984054565, 1.8737514019012451, 1.9847934246063232, 2.0958352088928223, 2.2068772315979004, 2.3179192543029785, 2.4289610385894775, 2.5400030612945557, 2.6510448455810547, 2.762086868286133, 2.873128890991211, 2.984170913696289, 3.095212697982788]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 6.0, 13.0, 6.0, 13.0, 39.0, 63.0, 101.0, 196.0, 384.0, 731.0, 1827.0, 5312.0, 24543.0, 286135.0, 3809320.0, 51449.0, 9171.0, 2628.0, 1067.0, 479.0, 275.0, 138.0, 110.0, 66.0, 49.0, 49.0, 23.0, 23.0, 17.0, 16.0, 9.0, 8.0, 6.0, 5.0, 1.0, 6.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.396484375, -1.333587646484375, -1.27069091796875, -1.207794189453125, -1.1448974609375, -1.082000732421875, -1.01910400390625, -0.956207275390625, -0.893310546875, -0.830413818359375, -0.76751708984375, -0.704620361328125, -0.6417236328125, -0.578826904296875, -0.51593017578125, -0.453033447265625, -0.39013671875, -0.327239990234375, -0.26434326171875, -0.201446533203125, -0.1385498046875, -0.075653076171875, -0.01275634765625, 0.050140380859375, 0.113037109375, 0.175933837890625, 0.23883056640625, 0.301727294921875, 0.3646240234375, 0.427520751953125, 0.49041748046875, 0.553314208984375, 0.6162109375, 0.679107666015625, 0.74200439453125, 0.804901123046875, 0.8677978515625, 0.930694580078125, 0.99359130859375, 1.056488037109375, 1.119384765625, 1.182281494140625, 1.24517822265625, 1.308074951171875, 1.3709716796875, 1.433868408203125, 1.49676513671875, 1.559661865234375, 1.62255859375, 1.685455322265625, 1.74835205078125, 1.811248779296875, 1.8741455078125, 1.937042236328125, 1.99993896484375, 2.062835693359375, 2.125732421875, 2.188629150390625, 2.25152587890625, 2.314422607421875, 2.3773193359375, 2.440216064453125, 2.50311279296875, 2.566009521484375, 2.62890625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 6.0, 13.0, 12.0, 25.0, 48.0, 52.0, 68.0, 80.0, 95.0, 94.0, 86.0, 94.0, 78.0, 72.0, 51.0, 40.0, 32.0, 23.0, 13.0, 13.0, 1.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.255615234375, -0.24350357055664062, -0.23139190673828125, -0.21928024291992188, -0.2071685791015625, -0.19505691528320312, -0.18294525146484375, -0.17083358764648438, -0.158721923828125, -0.14661026000976562, -0.13449859619140625, -0.12238693237304688, -0.1102752685546875, -0.09816360473632812, -0.08605194091796875, -0.07394027709960938, -0.06182861328125, -0.049716949462890625, -0.03760528564453125, -0.025493621826171875, -0.0133819580078125, -0.001270294189453125, 0.01084136962890625, 0.022953033447265625, 0.035064697265625, 0.047176361083984375, 0.05928802490234375, 0.07139968872070312, 0.0835113525390625, 0.09562301635742188, 0.10773468017578125, 0.11984634399414062, 0.1319580078125, 0.14406967163085938, 0.15618133544921875, 0.16829299926757812, 0.1804046630859375, 0.19251632690429688, 0.20462799072265625, 0.21673965454101562, 0.228851318359375, 0.24096298217773438, 0.25307464599609375, 0.2651863098144531, 0.2772979736328125, 0.2894096374511719, 0.30152130126953125, 0.3136329650878906, 0.32574462890625, 0.3378562927246094, 0.34996795654296875, 0.3620796203613281, 0.3741912841796875, 0.3863029479980469, 0.39841461181640625, 0.4105262756347656, 0.422637939453125, 0.4347496032714844, 0.44686126708984375, 0.4589729309082031, 0.4710845947265625, 0.4831962585449219, 0.49530792236328125, 0.5074195861816406, 0.51953125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 9.0, 5.0, 8.0, 12.0, 24.0, 31.0, 39.0, 40.0, 91.0, 141.0, 251.0, 625.0, 2122.0, 9936.0, 79346.0, 3905699.0, 175619.0, 15778.0, 2922.0, 803.0, 327.0, 171.0, 87.0, 77.0, 36.0, 29.0, 22.0, 7.0, 13.0, 7.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-2.623046875, -2.5600433349609375, -2.497039794921875, -2.4340362548828125, -2.37103271484375, -2.3080291748046875, -2.245025634765625, -2.1820220947265625, -2.1190185546875, -2.0560150146484375, -1.993011474609375, -1.9300079345703125, -1.86700439453125, -1.8040008544921875, -1.740997314453125, -1.6779937744140625, -1.614990234375, -1.5519866943359375, -1.488983154296875, -1.4259796142578125, -1.36297607421875, -1.2999725341796875, -1.236968994140625, -1.1739654541015625, -1.1109619140625, -1.0479583740234375, -0.984954833984375, -0.9219512939453125, -0.85894775390625, -0.7959442138671875, -0.732940673828125, -0.6699371337890625, -0.60693359375, -0.5439300537109375, -0.480926513671875, -0.4179229736328125, -0.35491943359375, -0.2919158935546875, -0.228912353515625, -0.1659088134765625, -0.1029052734375, -0.0399017333984375, 0.023101806640625, 0.0861053466796875, 0.14910888671875, 0.2121124267578125, 0.275115966796875, 0.3381195068359375, 0.401123046875, 0.4641265869140625, 0.527130126953125, 0.5901336669921875, 0.65313720703125, 0.7161407470703125, 0.779144287109375, 0.8421478271484375, 0.9051513671875, 0.9681549072265625, 1.031158447265625, 1.0941619873046875, 1.15716552734375, 1.2201690673828125, 1.283172607421875, 1.3461761474609375, 1.4091796875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 2.0, 4.0, 3.0, 3.0, 5.0, 9.0, 3.0, 5.0, 17.0, 14.0, 21.0, 23.0, 46.0, 47.0, 94.0, 188.0, 381.0, 2179.0, 534.0, 205.0, 100.0, 59.0, 42.0, 31.0, 16.0, 13.0, 10.0, 5.0, 7.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.461669921875, -0.4483299255371094, -0.43498992919921875, -0.4216499328613281, -0.4083099365234375, -0.3949699401855469, -0.38162994384765625, -0.3682899475097656, -0.354949951171875, -0.3416099548339844, -0.32826995849609375, -0.3149299621582031, -0.3015899658203125, -0.2882499694824219, -0.27490997314453125, -0.2615699768066406, -0.24822998046875, -0.23488998413085938, -0.22154998779296875, -0.20820999145507812, -0.1948699951171875, -0.18152999877929688, -0.16819000244140625, -0.15485000610351562, -0.141510009765625, -0.12817001342773438, -0.11483001708984375, -0.10149002075195312, -0.0881500244140625, -0.07481002807617188, -0.06147003173828125, -0.048130035400390625, -0.0347900390625, -0.021450042724609375, -0.00811004638671875, 0.005229949951171875, 0.0185699462890625, 0.031909942626953125, 0.04524993896484375, 0.058589935302734375, 0.071929931640625, 0.08526992797851562, 0.09860992431640625, 0.11194992065429688, 0.1252899169921875, 0.13862991333007812, 0.15196990966796875, 0.16530990600585938, 0.17864990234375, 0.19198989868164062, 0.20532989501953125, 0.21866989135742188, 0.2320098876953125, 0.24534988403320312, 0.25868988037109375, 0.2720298767089844, 0.285369873046875, 0.2987098693847656, 0.31204986572265625, 0.3253898620605469, 0.3387298583984375, 0.3520698547363281, 0.36540985107421875, 0.3787498474121094, 0.39208984375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 4.0, 9.0, 25.0, 100.0, 291.0, 348.0, 154.0, 38.0, 13.0, 3.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.679964065551758, -7.4977874755859375, -7.315610885620117, -7.133434295654297, -6.951257705688477, -6.769081115722656, -6.586904525756836, -6.404727458953857, -6.222550868988037, -6.040374279022217, -5.8581976890563965, -5.676021099090576, -5.493844509124756, -5.311667442321777, -5.129490852355957, -4.947314262390137, -4.765137672424316, -4.582961082458496, -4.400784492492676, -4.2186079025268555, -4.036431312561035, -3.8542544841766357, -3.6720778942108154, -3.489901065826416, -3.307724952697754, -3.1255483627319336, -2.9433717727661133, -2.761195182800293, -2.5790183544158936, -2.3968417644500732, -2.214665174484253, -2.0324883460998535, -1.8503117561340332, -1.668135166168213, -1.485958456993103, -1.3037818670272827, -1.1216051578521729, -0.9394285678863525, -0.7572519779205322, -0.5750752687454224, -0.39289867877960205, -0.21072204411029816, -0.028545409440994263, 0.15363121032714844, 0.3358078598976135, 0.5179845094680786, 0.7001610994338989, 0.8823378086090088, 1.064514398574829, 1.2466909885406494, 1.4288676977157593, 1.6110442876815796, 1.7932209968566895, 1.9753975868225098, 2.15757417678833, 2.3397507667541504, 2.5219273567199707, 2.704103946685791, 2.8862805366516113, 3.0684571266174316, 3.250633955001831, 3.4328105449676514, 3.6149871349334717, 3.797163963317871, 3.9793405532836914]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 9.0, 2.0, 1.0, 12.0, 7.0, 11.0, 11.0, 14.0, 19.0, 19.0, 27.0, 25.0, 39.0, 29.0, 38.0, 37.0, 41.0, 50.0, 57.0, 58.0, 49.0, 40.0, 38.0, 43.0, 37.0, 34.0, 31.0, 21.0, 18.0, 39.0, 27.0, 26.0, 14.0, 12.0, 14.0, 7.0, 8.0, 6.0, 8.0, 4.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.9652738571166992, -0.9320940971374512, -0.8989143371582031, -0.8657345771789551, -0.832554817199707, -0.799375057220459, -0.7661952376365662, -0.7330154776573181, -0.6998357176780701, -0.666655957698822, -0.633476197719574, -0.6002964377403259, -0.5671166181564331, -0.5339368581771851, -0.500757098197937, -0.46757733821868896, -0.4343975782394409, -0.40121781826019287, -0.3680380582809448, -0.3348582684993744, -0.30167850852012634, -0.2684987485408783, -0.23531897366046906, -0.20213919878005981, -0.16895943880081177, -0.13577967882156372, -0.10259990394115448, -0.06942013651132584, -0.03624036908149719, -0.0030606091022491455, 0.030119165778160095, 0.06329894065856934, 0.09647881984710693, 0.12965857982635498, 0.16283835470676422, 0.19601812958717346, 0.2291978895664215, 0.26237764954566956, 0.29555743932724, 0.32873719930648804, 0.3619169592857361, 0.39509671926498413, 0.4282764792442322, 0.4614562690258026, 0.49463602900505066, 0.5278158187866211, 0.5609955787658691, 0.5941753387451172, 0.6273550987243652, 0.6605348587036133, 0.6937146186828613, 0.7268943786621094, 0.7600741386413574, 0.7932538986206055, 0.8264337182044983, 0.8596134781837463, 0.8927932381629944, 0.9259729981422424, 0.9591527581214905, 0.9923325181007385, 1.0255123376846313, 1.0586920976638794, 1.0918718576431274, 1.1250516176223755, 1.1582313776016235]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 5.0, 13.0, 26.0, 31.0, 39.0, 56.0, 70.0, 136.0, 229.0, 457.0, 922.0, 2628.0, 10068.0, 55531.0, 366282.0, 505056.0, 86754.0, 14443.0, 3468.0, 1138.0, 500.0, 248.0, 163.0, 109.0, 61.0, 35.0, 23.0, 16.0, 16.0, 9.0, 6.0, 6.0, 5.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7939453125, -1.74285888671875, -1.6917724609375, -1.64068603515625, -1.589599609375, -1.53851318359375, -1.4874267578125, -1.43634033203125, -1.38525390625, -1.33416748046875, -1.2830810546875, -1.23199462890625, -1.180908203125, -1.12982177734375, -1.0787353515625, -1.02764892578125, -0.9765625, -0.92547607421875, -0.8743896484375, -0.82330322265625, -0.772216796875, -0.72113037109375, -0.6700439453125, -0.61895751953125, -0.56787109375, -0.51678466796875, -0.4656982421875, -0.41461181640625, -0.363525390625, -0.31243896484375, -0.2613525390625, -0.21026611328125, -0.1591796875, -0.10809326171875, -0.0570068359375, -0.00592041015625, 0.045166015625, 0.09625244140625, 0.1473388671875, 0.19842529296875, 0.24951171875, 0.30059814453125, 0.3516845703125, 0.40277099609375, 0.453857421875, 0.50494384765625, 0.5560302734375, 0.60711669921875, 0.658203125, 0.70928955078125, 0.7603759765625, 0.81146240234375, 0.862548828125, 0.91363525390625, 0.9647216796875, 1.01580810546875, 1.06689453125, 1.11798095703125, 1.1690673828125, 1.22015380859375, 1.271240234375, 1.32232666015625, 1.3734130859375, 1.42449951171875, 1.4755859375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 4.0, 11.0, 18.0, 20.0, 27.0, 42.0, 71.0, 69.0, 83.0, 80.0, 82.0, 102.0, 88.0, 66.0, 51.0, 50.0, 49.0, 28.0, 21.0, 16.0, 15.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2425537109375, -0.23035621643066406, -0.21815872192382812, -0.2059612274169922, -0.19376373291015625, -0.1815662384033203, -0.16936874389648438, -0.15717124938964844, -0.1449737548828125, -0.13277626037597656, -0.12057876586914062, -0.10838127136230469, -0.09618377685546875, -0.08398628234863281, -0.07178878784179688, -0.05959129333496094, -0.047393798828125, -0.03519630432128906, -0.022998809814453125, -0.010801315307617188, 0.00139617919921875, 0.013593673706054688, 0.025791168212890625, 0.03798866271972656, 0.0501861572265625, 0.06238365173339844, 0.07458114624023438, 0.08677864074707031, 0.09897613525390625, 0.11117362976074219, 0.12337112426757812, 0.13556861877441406, 0.14776611328125, 0.15996360778808594, 0.17216110229492188, 0.1843585968017578, 0.19655609130859375, 0.2087535858154297, 0.22095108032226562, 0.23314857482910156, 0.2453460693359375, 0.25754356384277344, 0.2697410583496094, 0.2819385528564453, 0.29413604736328125, 0.3063335418701172, 0.3185310363769531, 0.33072853088378906, 0.342926025390625, 0.35512351989746094, 0.3673210144042969, 0.3795185089111328, 0.39171600341796875, 0.4039134979248047, 0.4161109924316406, 0.42830848693847656, 0.4405059814453125, 0.45270347595214844, 0.4649009704589844, 0.4770984649658203, 0.48929595947265625, 0.5014934539794922, 0.5136909484863281, 0.5258884429931641, 0.5380859375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 7.0, 5.0, 11.0, 20.0, 19.0, 50.0, 59.0, 58.0, 114.0, 139.0, 231.0, 368.0, 624.0, 1043.0, 2085.0, 4271.0, 10501.0, 27113.0, 76137.0, 203748.0, 355504.0, 227574.0, 86225.0, 30853.0, 11790.0, 4867.0, 2253.0, 1129.0, 619.0, 383.0, 222.0, 170.0, 120.0, 83.0, 45.0, 30.0, 18.0, 17.0, 19.0, 15.0, 8.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6474609375, -0.6269454956054688, -0.6064300537109375, -0.5859146118164062, -0.565399169921875, -0.5448837280273438, -0.5243682861328125, -0.5038528442382812, -0.48333740234375, -0.46282196044921875, -0.4423065185546875, -0.42179107666015625, -0.401275634765625, -0.38076019287109375, -0.3602447509765625, -0.33972930908203125, -0.3192138671875, -0.29869842529296875, -0.2781829833984375, -0.25766754150390625, -0.237152099609375, -0.21663665771484375, -0.1961212158203125, -0.17560577392578125, -0.15509033203125, -0.13457489013671875, -0.1140594482421875, -0.09354400634765625, -0.073028564453125, -0.05251312255859375, -0.0319976806640625, -0.01148223876953125, 0.009033203125, 0.02954864501953125, 0.0500640869140625, 0.07057952880859375, 0.091094970703125, 0.11161041259765625, 0.1321258544921875, 0.15264129638671875, 0.17315673828125, 0.19367218017578125, 0.2141876220703125, 0.23470306396484375, 0.255218505859375, 0.27573394775390625, 0.2962493896484375, 0.31676483154296875, 0.3372802734375, 0.35779571533203125, 0.3783111572265625, 0.39882659912109375, 0.419342041015625, 0.43985748291015625, 0.4603729248046875, 0.48088836669921875, 0.50140380859375, 0.5219192504882812, 0.5424346923828125, 0.5629501342773438, 0.583465576171875, 0.6039810180664062, 0.6244964599609375, 0.6450119018554688, 0.66552734375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 6.0, 3.0, 2.0, 6.0, 10.0, 9.0, 9.0, 16.0, 19.0, 14.0, 22.0, 28.0, 28.0, 37.0, 34.0, 38.0, 41.0, 35.0, 53.0, 41.0, 53.0, 50.0, 37.0, 44.0, 31.0, 52.0, 39.0, 33.0, 29.0, 32.0, 32.0, 24.0, 19.0, 14.0, 9.0, 14.0, 6.0, 6.0, 5.0, 10.0, 6.0, 2.0, 3.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.05078125, -1.0204391479492188, -0.9900970458984375, -0.9597549438476562, -0.929412841796875, -0.8990707397460938, -0.8687286376953125, -0.8383865356445312, -0.80804443359375, -0.7777023315429688, -0.7473602294921875, -0.7170181274414062, -0.686676025390625, -0.6563339233398438, -0.6259918212890625, -0.5956497192382812, -0.5653076171875, -0.5349655151367188, -0.5046234130859375, -0.47428131103515625, -0.443939208984375, -0.41359710693359375, -0.3832550048828125, -0.35291290283203125, -0.32257080078125, -0.29222869873046875, -0.2618865966796875, -0.23154449462890625, -0.201202392578125, -0.17086029052734375, -0.1405181884765625, -0.11017608642578125, -0.079833984375, -0.04949188232421875, -0.0191497802734375, 0.01119232177734375, 0.041534423828125, 0.07187652587890625, 0.1022186279296875, 0.13256072998046875, 0.16290283203125, 0.19324493408203125, 0.2235870361328125, 0.25392913818359375, 0.284271240234375, 0.31461334228515625, 0.3449554443359375, 0.37529754638671875, 0.4056396484375, 0.43598175048828125, 0.4663238525390625, 0.49666595458984375, 0.527008056640625, 0.5573501586914062, 0.5876922607421875, 0.6180343627929688, 0.64837646484375, 0.6787185668945312, 0.7090606689453125, 0.7394027709960938, 0.769744873046875, 0.8000869750976562, 0.8304290771484375, 0.8607711791992188, 0.89111328125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 11.0, 11.0, 13.0, 35.0, 79.0, 113.0, 231.0, 521.0, 1242.0, 4732.0, 31110.0, 359428.0, 579385.0, 61319.0, 7338.0, 1726.0, 638.0, 307.0, 149.0, 68.0, 50.0, 19.0, 13.0, 9.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64453125, -0.626190185546875, -0.60784912109375, -0.589508056640625, -0.5711669921875, -0.552825927734375, -0.53448486328125, -0.516143798828125, -0.497802734375, -0.479461669921875, -0.46112060546875, -0.442779541015625, -0.4244384765625, -0.406097412109375, -0.38775634765625, -0.369415283203125, -0.35107421875, -0.332733154296875, -0.31439208984375, -0.296051025390625, -0.2777099609375, -0.259368896484375, -0.24102783203125, -0.222686767578125, -0.204345703125, -0.186004638671875, -0.16766357421875, -0.149322509765625, -0.1309814453125, -0.112640380859375, -0.09429931640625, -0.075958251953125, -0.0576171875, -0.039276123046875, -0.02093505859375, -0.002593994140625, 0.0157470703125, 0.034088134765625, 0.05242919921875, 0.070770263671875, 0.089111328125, 0.107452392578125, 0.12579345703125, 0.144134521484375, 0.1624755859375, 0.180816650390625, 0.19915771484375, 0.217498779296875, 0.23583984375, 0.254180908203125, 0.27252197265625, 0.290863037109375, 0.3092041015625, 0.327545166015625, 0.34588623046875, 0.364227294921875, 0.382568359375, 0.400909423828125, 0.41925048828125, 0.437591552734375, 0.4559326171875, 0.474273681640625, 0.49261474609375, 0.510955810546875, 0.529296875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 2.0, 4.0, 5.0, 7.0, 8.0, 17.0, 15.0, 14.0, 19.0, 20.0, 30.0, 35.0, 40.0, 53.0, 57.0, 41.0, 73.0, 65.0, 73.0, 50.0, 70.0, 56.0, 39.0, 46.0, 21.0, 23.0, 19.0, 20.0, 19.0, 7.0, 6.0, 9.0, 7.0, 7.0, 5.0, 7.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.079673767089844e-05, -5.902908742427826e-05, -5.726143717765808e-05, -5.54937869310379e-05, -5.3726136684417725e-05, -5.1958486437797546e-05, -5.019083619117737e-05, -4.842318594455719e-05, -4.665553569793701e-05, -4.4887885451316833e-05, -4.3120235204696655e-05, -4.135258495807648e-05, -3.95849347114563e-05, -3.781728446483612e-05, -3.604963421821594e-05, -3.4281983971595764e-05, -3.2514333724975586e-05, -3.074668347835541e-05, -2.897903323173523e-05, -2.721138298511505e-05, -2.5443732738494873e-05, -2.3676082491874695e-05, -2.1908432245254517e-05, -2.014078199863434e-05, -1.837313175201416e-05, -1.6605481505393982e-05, -1.4837831258773804e-05, -1.3070181012153625e-05, -1.1302530765533447e-05, -9.534880518913269e-06, -7.76723027229309e-06, -5.999580025672913e-06, -4.231929779052734e-06, -2.464279532432556e-06, -6.966292858123779e-07, 1.0710209608078003e-06, 2.8386712074279785e-06, 4.606321454048157e-06, 6.373971700668335e-06, 8.141621947288513e-06, 9.909272193908691e-06, 1.167692244052887e-05, 1.3444572687149048e-05, 1.5212222933769226e-05, 1.6979873180389404e-05, 1.8747523427009583e-05, 2.051517367362976e-05, 2.228282392024994e-05, 2.4050474166870117e-05, 2.5818124413490295e-05, 2.7585774660110474e-05, 2.9353424906730652e-05, 3.112107515335083e-05, 3.288872539997101e-05, 3.4656375646591187e-05, 3.6424025893211365e-05, 3.819167613983154e-05, 3.995932638645172e-05, 4.17269766330719e-05, 4.349462687969208e-05, 4.5262277126312256e-05, 4.7029927372932434e-05, 4.879757761955261e-05, 5.056522786617279e-05, 5.233287811279297e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 6.0, 8.0, 13.0, 25.0, 33.0, 66.0, 110.0, 242.0, 428.0, 1153.0, 3507.0, 14737.0, 85230.0, 428693.0, 414948.0, 80004.0, 13810.0, 3457.0, 1117.0, 423.0, 229.0, 121.0, 79.0, 52.0, 21.0, 10.0, 18.0, 7.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.56005859375, -0.5456924438476562, -0.5313262939453125, -0.5169601440429688, -0.502593994140625, -0.48822784423828125, -0.4738616943359375, -0.45949554443359375, -0.44512939453125, -0.43076324462890625, -0.4163970947265625, -0.40203094482421875, -0.387664794921875, -0.37329864501953125, -0.3589324951171875, -0.34456634521484375, -0.3302001953125, -0.31583404541015625, -0.3014678955078125, -0.28710174560546875, -0.272735595703125, -0.25836944580078125, -0.2440032958984375, -0.22963714599609375, -0.21527099609375, -0.20090484619140625, -0.1865386962890625, -0.17217254638671875, -0.157806396484375, -0.14344024658203125, -0.1290740966796875, -0.11470794677734375, -0.100341796875, -0.08597564697265625, -0.0716094970703125, -0.05724334716796875, -0.042877197265625, -0.02851104736328125, -0.0141448974609375, 0.00022125244140625, 0.01458740234375, 0.02895355224609375, 0.0433197021484375, 0.05768585205078125, 0.072052001953125, 0.08641815185546875, 0.1007843017578125, 0.11515045166015625, 0.1295166015625, 0.14388275146484375, 0.1582489013671875, 0.17261505126953125, 0.186981201171875, 0.20134735107421875, 0.2157135009765625, 0.23007965087890625, 0.24444580078125, 0.25881195068359375, 0.2731781005859375, 0.28754425048828125, 0.301910400390625, 0.31627655029296875, 0.3306427001953125, 0.34500885009765625, 0.359375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 2.0, 2.0, 7.0, 8.0, 3.0, 11.0, 13.0, 14.0, 23.0, 22.0, 26.0, 32.0, 43.0, 42.0, 69.0, 68.0, 62.0, 64.0, 69.0, 65.0, 59.0, 50.0, 47.0, 34.0, 44.0, 30.0, 21.0, 13.0, 18.0, 18.0, 9.0, 7.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.342529296875, -0.3314857482910156, -0.32044219970703125, -0.3093986511230469, -0.2983551025390625, -0.2873115539550781, -0.27626800537109375, -0.2652244567871094, -0.254180908203125, -0.24313735961914062, -0.23209381103515625, -0.22105026245117188, -0.2100067138671875, -0.19896316528320312, -0.18791961669921875, -0.17687606811523438, -0.16583251953125, -0.15478897094726562, -0.14374542236328125, -0.13270187377929688, -0.1216583251953125, -0.11061477661132812, -0.09957122802734375, -0.08852767944335938, -0.077484130859375, -0.06644058227539062, -0.05539703369140625, -0.044353485107421875, -0.0333099365234375, -0.022266387939453125, -0.01122283935546875, -0.000179290771484375, 0.0108642578125, 0.021907806396484375, 0.03295135498046875, 0.043994903564453125, 0.0550384521484375, 0.06608200073242188, 0.07712554931640625, 0.08816909790039062, 0.099212646484375, 0.11025619506835938, 0.12129974365234375, 0.13234329223632812, 0.1433868408203125, 0.15443038940429688, 0.16547393798828125, 0.17651748657226562, 0.18756103515625, 0.19860458374023438, 0.20964813232421875, 0.22069168090820312, 0.2317352294921875, 0.24277877807617188, 0.25382232666015625, 0.2648658752441406, 0.275909423828125, 0.2869529724121094, 0.29799652099609375, 0.3090400695800781, 0.3200836181640625, 0.3311271667480469, 0.34217071533203125, 0.3532142639160156, 0.3642578125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 5.0, 4.0, 12.0, 9.0, 18.0, 21.0, 37.0, 54.0, 70.0, 114.0, 119.0, 140.0, 125.0, 84.0, 69.0, 45.0, 22.0, 25.0, 9.0, 9.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-10.03009033203125, -9.813689231872559, -9.597288131713867, -9.380887031555176, -9.164485931396484, -8.948084831237793, -8.731683731079102, -8.515283584594727, -8.298882484436035, -8.082481384277344, -7.866080284118652, -7.649679183959961, -7.433278560638428, -7.216877460479736, -7.000476360321045, -6.7840752601623535, -6.567673683166504, -6.3512725830078125, -6.134871482849121, -5.91847038269043, -5.7020697593688965, -5.485668659210205, -5.269267559051514, -5.052866458892822, -4.836465835571289, -4.620064735412598, -4.403663635253906, -4.187262535095215, -3.9708616733551025, -3.7544608116149902, -3.538059711456299, -3.3216586112976074, -3.105257272720337, -2.8888561725616455, -2.672455310821533, -2.456054210662842, -2.2396531105041504, -2.023252010345459, -1.8068511486053467, -1.5904500484466553, -1.3740490674972534, -1.1576480865478516, -0.9412469863891602, -0.7248460054397583, -0.5084449648857117, -0.29204392433166504, -0.07564294338226318, 0.14075815677642822, 0.3571591377258301, 0.5735601782798767, 0.7899612188339233, 1.0063621997833252, 1.2227632999420166, 1.4391642808914185, 1.6555652618408203, 1.8719663619995117, 2.088367462158203, 2.3047685623168945, 2.521169424057007, 2.7375705242156982, 2.9539716243743896, 3.170372486114502, 3.3867735862731934, 3.6031746864318848, 3.819575548171997]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 4.0, 2.0, 9.0, 13.0, 10.0, 9.0, 17.0, 22.0, 10.0, 26.0, 35.0, 28.0, 21.0, 28.0, 38.0, 35.0, 40.0, 34.0, 39.0, 50.0, 34.0, 37.0, 43.0, 39.0, 37.0, 38.0, 31.0, 31.0, 34.0, 29.0, 30.0, 19.0, 29.0, 13.0, 17.0, 15.0, 8.0, 12.0, 6.0, 12.0, 8.0, 6.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.842136383056641, -4.691004753112793, -4.5398736000061035, -4.388741970062256, -4.237610816955566, -4.086479187011719, -3.935347557067871, -3.7842161655426025, -3.633084774017334, -3.4819533824920654, -3.330821990966797, -3.179690361022949, -3.0285589694976807, -2.877427577972412, -2.7262959480285645, -2.575164556503296, -2.4240331649780273, -2.272901773452759, -2.1217703819274902, -1.9706387519836426, -1.819507360458374, -1.6683759689331055, -1.5172444581985474, -1.3661129474639893, -1.2149815559387207, -1.0638501644134521, -0.912718653678894, -0.7615872025489807, -0.6104557514190674, -0.45932430028915405, -0.3081928491592407, -0.15706133842468262, -0.0059299468994140625, 0.14520150423049927, 0.2963329553604126, 0.4474644064903259, 0.5985958576202393, 0.7497273087501526, 0.9008587598800659, 1.051990270614624, 1.2031216621398926, 1.3542530536651611, 1.5053845643997192, 1.6565160751342773, 1.807647466659546, 1.9587788581848145, 2.109910488128662, 2.2610418796539307, 2.412173271179199, 2.5633046627044678, 2.7144360542297363, 2.865567684173584, 3.0166990756988525, 3.167830467224121, 3.3189620971679688, 3.4700934886932373, 3.621224880218506, 3.7723562717437744, 3.923487663269043, 4.074619293212891, 4.225750923156738, 4.376882076263428, 4.528013706207275, 4.679144859313965, 4.8302764892578125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 8.0, 6.0, 7.0, 15.0, 16.0, 33.0, 82.0, 126.0, 293.0, 626.0, 1538.0, 4097.0, 14983.0, 91163.0, 3857692.0, 191567.0, 22471.0, 5678.0, 1926.0, 802.0, 440.0, 230.0, 138.0, 98.0, 68.0, 44.0, 35.0, 19.0, 26.0, 19.0, 9.0, 9.0, 8.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.8408203125, -1.7807464599609375, -1.720672607421875, -1.6605987548828125, -1.60052490234375, -1.5404510498046875, -1.480377197265625, -1.4203033447265625, -1.3602294921875, -1.3001556396484375, -1.240081787109375, -1.1800079345703125, -1.11993408203125, -1.0598602294921875, -0.999786376953125, -0.9397125244140625, -0.879638671875, -0.8195648193359375, -0.759490966796875, -0.6994171142578125, -0.63934326171875, -0.5792694091796875, -0.519195556640625, -0.4591217041015625, -0.3990478515625, -0.3389739990234375, -0.278900146484375, -0.2188262939453125, -0.15875244140625, -0.0986785888671875, -0.038604736328125, 0.0214691162109375, 0.08154296875, 0.1416168212890625, 0.201690673828125, 0.2617645263671875, 0.32183837890625, 0.3819122314453125, 0.441986083984375, 0.5020599365234375, 0.5621337890625, 0.6222076416015625, 0.682281494140625, 0.7423553466796875, 0.80242919921875, 0.8625030517578125, 0.922576904296875, 0.9826507568359375, 1.042724609375, 1.1027984619140625, 1.162872314453125, 1.2229461669921875, 1.28302001953125, 1.3430938720703125, 1.403167724609375, 1.4632415771484375, 1.5233154296875, 1.5833892822265625, 1.643463134765625, 1.7035369873046875, 1.76361083984375, 1.8236846923828125, 1.883758544921875, 1.9438323974609375, 2.00390625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 8.0, 8.0, 11.0, 14.0, 6.0, 18.0, 40.0, 39.0, 54.0, 63.0, 68.0, 71.0, 73.0, 63.0, 81.0, 71.0, 76.0, 54.0, 41.0, 39.0, 36.0, 27.0, 10.0, 12.0, 9.0, 8.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26220703125, -0.2499847412109375, -0.237762451171875, -0.2255401611328125, -0.21331787109375, -0.2010955810546875, -0.188873291015625, -0.1766510009765625, -0.1644287109375, -0.1522064208984375, -0.139984130859375, -0.1277618408203125, -0.11553955078125, -0.1033172607421875, -0.091094970703125, -0.0788726806640625, -0.066650390625, -0.0544281005859375, -0.042205810546875, -0.0299835205078125, -0.01776123046875, -0.0055389404296875, 0.006683349609375, 0.0189056396484375, 0.0311279296875, 0.0433502197265625, 0.055572509765625, 0.0677947998046875, 0.08001708984375, 0.0922393798828125, 0.104461669921875, 0.1166839599609375, 0.12890625, 0.1411285400390625, 0.153350830078125, 0.1655731201171875, 0.17779541015625, 0.1900177001953125, 0.202239990234375, 0.2144622802734375, 0.2266845703125, 0.2389068603515625, 0.251129150390625, 0.2633514404296875, 0.27557373046875, 0.2877960205078125, 0.300018310546875, 0.3122406005859375, 0.324462890625, 0.3366851806640625, 0.348907470703125, 0.3611297607421875, 0.37335205078125, 0.3855743408203125, 0.397796630859375, 0.4100189208984375, 0.4222412109375, 0.4344635009765625, 0.446685791015625, 0.4589080810546875, 0.47113037109375, 0.4833526611328125, 0.495574951171875, 0.5077972412109375, 0.52001953125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 6.0, 4.0, 12.0, 14.0, 14.0, 27.0, 43.0, 57.0, 84.0, 102.0, 148.0, 215.0, 304.0, 480.0, 833.0, 1623.0, 3656.0, 9095.0, 27929.0, 128337.0, 3483539.0, 456639.0, 54235.0, 15641.0, 5754.0, 2463.0, 1135.0, 637.0, 419.0, 244.0, 162.0, 135.0, 80.0, 65.0, 47.0, 25.0, 22.0, 20.0, 16.0, 6.0, 3.0, 4.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0], "bins": [-1.3486328125, -1.3119354248046875, -1.275238037109375, -1.2385406494140625, -1.20184326171875, -1.1651458740234375, -1.128448486328125, -1.0917510986328125, -1.0550537109375, -1.0183563232421875, -0.981658935546875, -0.9449615478515625, -0.90826416015625, -0.8715667724609375, -0.834869384765625, -0.7981719970703125, -0.761474609375, -0.7247772216796875, -0.688079833984375, -0.6513824462890625, -0.61468505859375, -0.5779876708984375, -0.541290283203125, -0.5045928955078125, -0.4678955078125, -0.4311981201171875, -0.394500732421875, -0.3578033447265625, -0.32110595703125, -0.2844085693359375, -0.247711181640625, -0.2110137939453125, -0.17431640625, -0.1376190185546875, -0.100921630859375, -0.0642242431640625, -0.02752685546875, 0.0091705322265625, 0.045867919921875, 0.0825653076171875, 0.1192626953125, 0.1559600830078125, 0.192657470703125, 0.2293548583984375, 0.26605224609375, 0.3027496337890625, 0.339447021484375, 0.3761444091796875, 0.412841796875, 0.4495391845703125, 0.486236572265625, 0.5229339599609375, 0.55963134765625, 0.5963287353515625, 0.633026123046875, 0.6697235107421875, 0.7064208984375, 0.7431182861328125, 0.779815673828125, 0.8165130615234375, 0.85321044921875, 0.8899078369140625, 0.926605224609375, 0.9633026123046875, 1.0]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 8.0, 13.0, 17.0, 35.0, 65.0, 110.0, 425.0, 2666.0, 473.0, 127.0, 51.0, 26.0, 22.0, 10.0, 6.0, 11.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7392578125, -0.7064208984375, -0.673583984375, -0.6407470703125, -0.60791015625, -0.5750732421875, -0.542236328125, -0.5093994140625, -0.4765625, -0.4437255859375, -0.410888671875, -0.3780517578125, -0.34521484375, -0.3123779296875, -0.279541015625, -0.2467041015625, -0.2138671875, -0.1810302734375, -0.148193359375, -0.1153564453125, -0.08251953125, -0.0496826171875, -0.016845703125, 0.0159912109375, 0.048828125, 0.0816650390625, 0.114501953125, 0.1473388671875, 0.18017578125, 0.2130126953125, 0.245849609375, 0.2786865234375, 0.3115234375, 0.3443603515625, 0.377197265625, 0.4100341796875, 0.44287109375, 0.4757080078125, 0.508544921875, 0.5413818359375, 0.57421875, 0.6070556640625, 0.639892578125, 0.6727294921875, 0.70556640625, 0.7384033203125, 0.771240234375, 0.8040771484375, 0.8369140625, 0.8697509765625, 0.902587890625, 0.9354248046875, 0.96826171875, 1.0010986328125, 1.033935546875, 1.0667724609375, 1.099609375, 1.1324462890625, 1.165283203125, 1.1981201171875, 1.23095703125, 1.2637939453125, 1.296630859375, 1.3294677734375, 1.3623046875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 4.0, 6.0, 4.0, 4.0, 22.0, 42.0, 131.0, 204.0, 236.0, 174.0, 90.0, 51.0, 12.0, 8.0, 1.0, 6.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.640812397003174, -5.475379943847656, -5.309947490692139, -5.144515037536621, -4.979082107543945, -4.813649654388428, -4.64821720123291, -4.482784748077393, -4.317352294921875, -4.151919841766357, -3.98648738861084, -3.821054697036743, -3.6556222438812256, -3.490189790725708, -3.3247570991516113, -3.1593246459960938, -2.993892192840576, -2.8284597396850586, -2.663027286529541, -2.4975945949554443, -2.3321621417999268, -2.166729688644409, -2.0012969970703125, -1.835864543914795, -1.6704320907592773, -1.5049996376037598, -1.3395670652389526, -1.1741344928741455, -1.008702039718628, -0.8432695269584656, -0.6778370141983032, -0.5124044418334961, -0.3469715118408203, -0.18153899908065796, -0.016106486320495605, 0.14932602643966675, 0.3147585391998291, 0.48019105195999146, 0.6456235647201538, 0.8110561370849609, 0.9764885902404785, 1.141921043395996, 1.3073536157608032, 1.4727861881256104, 1.638218641281128, 1.8036510944366455, 1.9690836668014526, 2.1345162391662598, 2.2999486923217773, 2.465381145477295, 2.6308135986328125, 2.796246290206909, 2.9616787433624268, 3.1271111965179443, 3.292543888092041, 3.4579763412475586, 3.623408794403076, 3.7888412475585938, 3.9542737007141113, 4.119706153869629, 4.285139083862305, 4.450571537017822, 4.61600399017334, 4.781436443328857, 4.946868896484375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 0.0, 4.0, 2.0, 6.0, 6.0, 8.0, 12.0, 14.0, 19.0, 21.0, 22.0, 21.0, 32.0, 30.0, 31.0, 45.0, 35.0, 37.0, 53.0, 52.0, 50.0, 40.0, 34.0, 47.0, 45.0, 32.0, 46.0, 45.0, 38.0, 27.0, 28.0, 8.0, 13.0, 16.0, 19.0, 14.0, 10.0, 19.0, 6.0, 8.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.945880651473999, -1.8837227821350098, -1.8215649127960205, -1.7594070434570312, -1.697249174118042, -1.6350913047790527, -1.5729334354400635, -1.5107754468917847, -1.4486175775527954, -1.3864597082138062, -1.324301838874817, -1.2621439695358276, -1.1999861001968384, -1.1378281116485596, -1.0756702423095703, -1.013512372970581, -0.9513545632362366, -0.8891966938972473, -0.8270388245582581, -0.764880895614624, -0.7027230262756348, -0.6405651569366455, -0.5784072875976562, -0.516249418258667, -0.45409151911735535, -0.3919336497783661, -0.32977575063705444, -0.2676178812980652, -0.20545999705791473, -0.14330211281776428, -0.08114424347877502, -0.01898634433746338, 0.04317152500152588, 0.10532940924167633, 0.16748729348182678, 0.22964516282081604, 0.2918030619621277, 0.35396093130111694, 0.4161188006401062, 0.47827669978141785, 0.5404345989227295, 0.6025924682617188, 0.664750337600708, 0.7269082069396973, 0.7890661358833313, 0.8512240052223206, 0.9133818745613098, 0.9755398035049438, 1.0376975536346436, 1.0998554229736328, 1.162013292312622, 1.2241711616516113, 1.2863290309906006, 1.3484869003295898, 1.410644769668579, 1.472802758216858, 1.5349606275558472, 1.5971184968948364, 1.6592763662338257, 1.721434235572815, 1.7835921049118042, 1.845750093460083, 1.9079079627990723, 1.9700658321380615, 2.032223701477051]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 2.0, 6.0, 6.0, 10.0, 6.0, 17.0, 14.0, 30.0, 44.0, 51.0, 90.0, 124.0, 211.0, 338.0, 650.0, 1336.0, 3216.0, 9036.0, 30256.0, 117819.0, 390587.0, 354929.0, 99997.0, 25977.0, 8103.0, 2935.0, 1288.0, 611.0, 327.0, 179.0, 122.0, 77.0, 50.0, 37.0, 22.0, 16.0, 11.0, 11.0, 4.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.345703125, -1.3035736083984375, -1.261444091796875, -1.2193145751953125, -1.17718505859375, -1.1350555419921875, -1.092926025390625, -1.0507965087890625, -1.0086669921875, -0.9665374755859375, -0.924407958984375, -0.8822784423828125, -0.84014892578125, -0.7980194091796875, -0.755889892578125, -0.7137603759765625, -0.671630859375, -0.6295013427734375, -0.587371826171875, -0.5452423095703125, -0.50311279296875, -0.4609832763671875, -0.418853759765625, -0.3767242431640625, -0.3345947265625, -0.2924652099609375, -0.250335693359375, -0.2082061767578125, -0.16607666015625, -0.1239471435546875, -0.081817626953125, -0.0396881103515625, 0.00244140625, 0.0445709228515625, 0.086700439453125, 0.1288299560546875, 0.17095947265625, 0.2130889892578125, 0.255218505859375, 0.2973480224609375, 0.3394775390625, 0.3816070556640625, 0.423736572265625, 0.4658660888671875, 0.50799560546875, 0.5501251220703125, 0.592254638671875, 0.6343841552734375, 0.676513671875, 0.7186431884765625, 0.760772705078125, 0.8029022216796875, 0.84503173828125, 0.8871612548828125, 0.929290771484375, 0.9714202880859375, 1.0135498046875, 1.0556793212890625, 1.097808837890625, 1.1399383544921875, 1.18206787109375, 1.2241973876953125, 1.266326904296875, 1.3084564208984375, 1.3505859375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 3.0, 4.0, 6.0, 9.0, 10.0, 11.0, 12.0, 21.0, 16.0, 28.0, 32.0, 50.0, 55.0, 67.0, 62.0, 62.0, 85.0, 73.0, 54.0, 62.0, 54.0, 52.0, 35.0, 41.0, 19.0, 25.0, 18.0, 9.0, 10.0, 10.0, 11.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2431640625, -0.2308502197265625, -0.218536376953125, -0.2062225341796875, -0.19390869140625, -0.1815948486328125, -0.169281005859375, -0.1569671630859375, -0.1446533203125, -0.1323394775390625, -0.120025634765625, -0.1077117919921875, -0.09539794921875, -0.0830841064453125, -0.070770263671875, -0.0584564208984375, -0.046142578125, -0.0338287353515625, -0.021514892578125, -0.0092010498046875, 0.00311279296875, 0.0154266357421875, 0.027740478515625, 0.0400543212890625, 0.0523681640625, 0.0646820068359375, 0.076995849609375, 0.0893096923828125, 0.10162353515625, 0.1139373779296875, 0.126251220703125, 0.1385650634765625, 0.15087890625, 0.1631927490234375, 0.175506591796875, 0.1878204345703125, 0.20013427734375, 0.2124481201171875, 0.224761962890625, 0.2370758056640625, 0.2493896484375, 0.2617034912109375, 0.274017333984375, 0.2863311767578125, 0.29864501953125, 0.3109588623046875, 0.323272705078125, 0.3355865478515625, 0.347900390625, 0.3602142333984375, 0.372528076171875, 0.3848419189453125, 0.39715576171875, 0.4094696044921875, 0.421783447265625, 0.4340972900390625, 0.4464111328125, 0.4587249755859375, 0.471038818359375, 0.4833526611328125, 0.49566650390625, 0.5079803466796875, 0.520294189453125, 0.5326080322265625, 0.544921875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 6.0, 9.0, 8.0, 15.0, 18.0, 32.0, 55.0, 139.0, 340.0, 877.0, 3184.0, 14923.0, 97405.0, 598087.0, 286312.0, 37650.0, 6798.0, 1654.0, 567.0, 226.0, 100.0, 61.0, 34.0, 15.0, 14.0, 9.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.09375, -2.0367889404296875, -1.979827880859375, -1.9228668212890625, -1.86590576171875, -1.8089447021484375, -1.751983642578125, -1.6950225830078125, -1.6380615234375, -1.5811004638671875, -1.524139404296875, -1.4671783447265625, -1.41021728515625, -1.3532562255859375, -1.296295166015625, -1.2393341064453125, -1.182373046875, -1.1254119873046875, -1.068450927734375, -1.0114898681640625, -0.95452880859375, -0.8975677490234375, -0.840606689453125, -0.7836456298828125, -0.7266845703125, -0.6697235107421875, -0.612762451171875, -0.5558013916015625, -0.49884033203125, -0.4418792724609375, -0.384918212890625, -0.3279571533203125, -0.27099609375, -0.2140350341796875, -0.157073974609375, -0.1001129150390625, -0.04315185546875, 0.0138092041015625, 0.070770263671875, 0.1277313232421875, 0.1846923828125, 0.2416534423828125, 0.298614501953125, 0.3555755615234375, 0.41253662109375, 0.4694976806640625, 0.526458740234375, 0.5834197998046875, 0.640380859375, 0.6973419189453125, 0.754302978515625, 0.8112640380859375, 0.86822509765625, 0.9251861572265625, 0.982147216796875, 1.0391082763671875, 1.0960693359375, 1.1530303955078125, 1.209991455078125, 1.2669525146484375, 1.32391357421875, 1.3808746337890625, 1.437835693359375, 1.4947967529296875, 1.5517578125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 3.0, 10.0, 6.0, 8.0, 9.0, 16.0, 14.0, 24.0, 18.0, 19.0, 35.0, 38.0, 48.0, 42.0, 36.0, 40.0, 44.0, 73.0, 56.0, 65.0, 47.0, 40.0, 44.0, 40.0, 39.0, 30.0, 37.0, 17.0, 23.0, 16.0, 17.0, 17.0, 10.0, 7.0, 3.0, 5.0, 3.0, 4.0, 0.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6591796875, -1.6095428466796875, -1.559906005859375, -1.5102691650390625, -1.46063232421875, -1.4109954833984375, -1.361358642578125, -1.3117218017578125, -1.2620849609375, -1.2124481201171875, -1.162811279296875, -1.1131744384765625, -1.06353759765625, -1.0139007568359375, -0.964263916015625, -0.9146270751953125, -0.864990234375, -0.8153533935546875, -0.765716552734375, -0.7160797119140625, -0.66644287109375, -0.6168060302734375, -0.567169189453125, -0.5175323486328125, -0.4678955078125, -0.4182586669921875, -0.368621826171875, -0.3189849853515625, -0.26934814453125, -0.2197113037109375, -0.170074462890625, -0.1204376220703125, -0.07080078125, -0.0211639404296875, 0.028472900390625, 0.0781097412109375, 0.12774658203125, 0.1773834228515625, 0.227020263671875, 0.2766571044921875, 0.3262939453125, 0.3759307861328125, 0.425567626953125, 0.4752044677734375, 0.52484130859375, 0.5744781494140625, 0.624114990234375, 0.6737518310546875, 0.723388671875, 0.7730255126953125, 0.822662353515625, 0.8722991943359375, 0.92193603515625, 0.9715728759765625, 1.021209716796875, 1.0708465576171875, 1.1204833984375, 1.1701202392578125, 1.219757080078125, 1.2693939208984375, 1.31903076171875, 1.3686676025390625, 1.418304443359375, 1.4679412841796875, 1.517578125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 6.0, 7.0, 10.0, 14.0, 20.0, 48.0, 83.0, 144.0, 282.0, 565.0, 1452.0, 5571.0, 42230.0, 560387.0, 401976.0, 29098.0, 4410.0, 1167.0, 495.0, 266.0, 126.0, 80.0, 46.0, 32.0, 16.0, 13.0, 3.0, 1.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90234375, -0.8731613159179688, -0.8439788818359375, -0.8147964477539062, -0.785614013671875, -0.7564315795898438, -0.7272491455078125, -0.6980667114257812, -0.66888427734375, -0.6397018432617188, -0.6105194091796875, -0.5813369750976562, -0.552154541015625, -0.5229721069335938, -0.4937896728515625, -0.46460723876953125, -0.4354248046875, -0.40624237060546875, -0.3770599365234375, -0.34787750244140625, -0.318695068359375, -0.28951263427734375, -0.2603302001953125, -0.23114776611328125, -0.20196533203125, -0.17278289794921875, -0.1436004638671875, -0.11441802978515625, -0.085235595703125, -0.05605316162109375, -0.0268707275390625, 0.00231170654296875, 0.031494140625, 0.06067657470703125, 0.0898590087890625, 0.11904144287109375, 0.148223876953125, 0.17740631103515625, 0.2065887451171875, 0.23577117919921875, 0.26495361328125, 0.29413604736328125, 0.3233184814453125, 0.35250091552734375, 0.381683349609375, 0.41086578369140625, 0.4400482177734375, 0.46923065185546875, 0.4984130859375, 0.5275955200195312, 0.5567779541015625, 0.5859603881835938, 0.615142822265625, 0.6443252563476562, 0.6735076904296875, 0.7026901245117188, 0.73187255859375, 0.7610549926757812, 0.7902374267578125, 0.8194198608398438, 0.848602294921875, 0.8777847290039062, 0.9069671630859375, 0.9361495971679688, 0.96533203125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 7.0, 2.0, 5.0, 4.0, 5.0, 11.0, 14.0, 16.0, 31.0, 33.0, 33.0, 51.0, 60.0, 83.0, 91.0, 91.0, 78.0, 95.0, 63.0, 59.0, 44.0, 38.0, 16.0, 22.0, 16.0, 10.0, 4.0, 5.0, 4.0, 7.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011032819747924805, -0.0001070583239197731, -0.00010378845036029816, -0.00010051857680082321, -9.724870324134827e-05, -9.397882968187332e-05, -9.070895612239838e-05, -8.743908256292343e-05, -8.416920900344849e-05, -8.089933544397354e-05, -7.76294618844986e-05, -7.435958832502365e-05, -7.10897147655487e-05, -6.781984120607376e-05, -6.454996764659882e-05, -6.128009408712387e-05, -5.8010220527648926e-05, -5.474034696817398e-05, -5.1470473408699036e-05, -4.820059984922409e-05, -4.4930726289749146e-05, -4.16608527302742e-05, -3.8390979170799255e-05, -3.512110561132431e-05, -3.1851232051849365e-05, -2.858135849237442e-05, -2.5311484932899475e-05, -2.204161137342453e-05, -1.8771737813949585e-05, -1.550186425447464e-05, -1.2231990694999695e-05, -8.96211713552475e-06, -5.692243576049805e-06, -2.4223700165748596e-06, 8.475035429000854e-07, 4.1173771023750305e-06, 7.387250661849976e-06, 1.065712422132492e-05, 1.3926997780799866e-05, 1.719687134027481e-05, 2.0466744899749756e-05, 2.37366184592247e-05, 2.7006492018699646e-05, 3.027636557817459e-05, 3.3546239137649536e-05, 3.681611269712448e-05, 4.0085986256599426e-05, 4.335585981607437e-05, 4.6625733375549316e-05, 4.989560693502426e-05, 5.3165480494499207e-05, 5.643535405397415e-05, 5.97052276134491e-05, 6.297510117292404e-05, 6.624497473239899e-05, 6.951484829187393e-05, 7.278472185134888e-05, 7.605459541082382e-05, 7.932446897029877e-05, 8.259434252977371e-05, 8.586421608924866e-05, 8.91340896487236e-05, 9.240396320819855e-05, 9.567383676767349e-05, 9.894371032714844e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 6.0, 12.0, 17.0, 24.0, 45.0, 64.0, 88.0, 165.0, 238.0, 449.0, 845.0, 1801.0, 4846.0, 17208.0, 82133.0, 407130.0, 420703.0, 86377.0, 17492.0, 4945.0, 1858.0, 911.0, 500.0, 272.0, 163.0, 81.0, 62.0, 37.0, 18.0, 16.0, 8.0, 10.0, 6.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4931640625, -0.476165771484375, -0.45916748046875, -0.442169189453125, -0.4251708984375, -0.408172607421875, -0.39117431640625, -0.374176025390625, -0.357177734375, -0.340179443359375, -0.32318115234375, -0.306182861328125, -0.2891845703125, -0.272186279296875, -0.25518798828125, -0.238189697265625, -0.22119140625, -0.204193115234375, -0.18719482421875, -0.170196533203125, -0.1531982421875, -0.136199951171875, -0.11920166015625, -0.102203369140625, -0.085205078125, -0.068206787109375, -0.05120849609375, -0.034210205078125, -0.0172119140625, -0.000213623046875, 0.01678466796875, 0.033782958984375, 0.05078125, 0.067779541015625, 0.08477783203125, 0.101776123046875, 0.1187744140625, 0.135772705078125, 0.15277099609375, 0.169769287109375, 0.186767578125, 0.203765869140625, 0.22076416015625, 0.237762451171875, 0.2547607421875, 0.271759033203125, 0.28875732421875, 0.305755615234375, 0.32275390625, 0.339752197265625, 0.35675048828125, 0.373748779296875, 0.3907470703125, 0.407745361328125, 0.42474365234375, 0.441741943359375, 0.458740234375, 0.475738525390625, 0.49273681640625, 0.509735107421875, 0.5267333984375, 0.543731689453125, 0.56072998046875, 0.577728271484375, 0.5947265625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 5.0, 6.0, 7.0, 13.0, 14.0, 18.0, 24.0, 30.0, 43.0, 71.0, 82.0, 127.0, 120.0, 121.0, 95.0, 64.0, 47.0, 40.0, 21.0, 18.0, 13.0, 8.0, 5.0, 2.0, 4.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.88134765625, -0.8557205200195312, -0.8300933837890625, -0.8044662475585938, -0.778839111328125, -0.7532119750976562, -0.7275848388671875, -0.7019577026367188, -0.67633056640625, -0.6507034301757812, -0.6250762939453125, -0.5994491577148438, -0.573822021484375, -0.5481948852539062, -0.5225677490234375, -0.49694061279296875, -0.4713134765625, -0.44568634033203125, -0.4200592041015625, -0.39443206787109375, -0.368804931640625, -0.34317779541015625, -0.3175506591796875, -0.29192352294921875, -0.26629638671875, -0.24066925048828125, -0.2150421142578125, -0.18941497802734375, -0.163787841796875, -0.13816070556640625, -0.1125335693359375, -0.08690643310546875, -0.061279296875, -0.03565216064453125, -0.0100250244140625, 0.01560211181640625, 0.041229248046875, 0.06685638427734375, 0.0924835205078125, 0.11811065673828125, 0.14373779296875, 0.16936492919921875, 0.1949920654296875, 0.22061920166015625, 0.246246337890625, 0.27187347412109375, 0.2975006103515625, 0.32312774658203125, 0.3487548828125, 0.37438201904296875, 0.4000091552734375, 0.42563629150390625, 0.451263427734375, 0.47689056396484375, 0.5025177001953125, 0.5281448364257812, 0.55377197265625, 0.5793991088867188, 0.6050262451171875, 0.6306533813476562, 0.656280517578125, 0.6819076538085938, 0.7075347900390625, 0.7331619262695312, 0.7587890625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 10.0, 14.0, 14.0, 37.0, 64.0, 84.0, 156.0, 148.0, 163.0, 115.0, 74.0, 52.0, 32.0, 26.0, 8.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.134284496307373, -5.749335289001465, -5.364386081695557, -4.979436874389648, -4.594487190246582, -4.209538459777832, -3.8245887756347656, -3.4396395683288574, -3.054690361022949, -2.669741153717041, -2.284791946411133, -1.8998425006866455, -1.5148932933807373, -1.129944086074829, -0.7449946403503418, -0.3600454330444336, 0.02490377426147461, 0.4098530411720276, 0.7948023080825806, 1.1797516345977783, 1.5647008419036865, 1.9496500492095947, 2.334599494934082, 2.7195487022399902, 3.1044979095458984, 3.4894471168518066, 3.874396324157715, 4.259346008300781, 4.644294738769531, 5.029244422912598, 5.414193630218506, 5.799142837524414, 6.184091567993164, 6.569040775299072, 6.9539899826049805, 7.338939666748047, 7.723888397216797, 8.108838081359863, 8.49378776550293, 8.87873649597168, 9.26368522644043, 9.648634910583496, 10.033583641052246, 10.418533325195312, 10.803482055664062, 11.188431739807129, 11.573381423950195, 11.958330154418945, 12.343279838562012, 12.728229522705078, 13.113178253173828, 13.498127937316895, 13.883076667785645, 14.268026351928711, 14.652975082397461, 15.037924766540527, 15.422874450683594, 15.80782413482666, 16.192773818969727, 16.577722549438477, 16.962671279907227, 17.347620010375977, 17.73257064819336, 18.11751937866211, 18.50246810913086]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 8.0, 2.0, 3.0, 5.0, 9.0, 8.0, 10.0, 19.0, 14.0, 16.0, 24.0, 34.0, 22.0, 31.0, 32.0, 44.0, 37.0, 41.0, 48.0, 44.0, 41.0, 40.0, 57.0, 38.0, 45.0, 35.0, 42.0, 24.0, 32.0, 36.0, 21.0, 23.0, 18.0, 25.0, 14.0, 19.0, 10.0, 6.0, 8.0, 7.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-8.193939208984375, -7.955328464508057, -7.7167181968688965, -7.478107452392578, -7.23949670791626, -7.0008864402771, -6.762275695800781, -6.523665428161621, -6.285054683685303, -6.046443939208984, -5.807833671569824, -5.569222927093506, -5.3306121826171875, -5.092001914978027, -4.853391170501709, -4.614780426025391, -4.3761701583862305, -4.137559413909912, -3.898948907852173, -3.6603384017944336, -3.4217278957366943, -3.183117389678955, -2.9445066452026367, -2.7058961391448975, -2.46728515625, -2.2286746501922607, -1.990064024925232, -1.7514533996582031, -1.5128428936004639, -1.274232268333435, -1.0356216430664062, -0.797011137008667, -0.5584006309509277, -0.3197900652885437, -0.08117946982383728, 0.15743112564086914, 0.3960416913032532, 0.6346522569656372, 0.873262882232666, 1.1118733882904053, 1.350484013557434, 1.589094638824463, 1.8277051448822021, 2.0663156509399414, 2.3049263954162598, 2.543536901473999, 2.7821474075317383, 3.0207581520080566, 3.259368658065796, 3.497979164123535, 3.7365899085998535, 3.9752004146575928, 4.213810920715332, 4.45242166519165, 4.691032409667969, 4.929642677307129, 5.168253421783447, 5.406864166259766, 5.645474433898926, 5.884085178375244, 6.1226959228515625, 6.361306190490723, 6.599916934967041, 6.838527679443359, 7.0771379470825195]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 7.0, 21.0, 40.0, 67.0, 195.0, 809.0, 7667.0, 4162969.0, 20573.0, 1454.0, 287.0, 93.0, 45.0, 20.0, 16.0, 9.0, 5.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.84765625, -5.6568603515625, -5.466064453125, -5.2752685546875, -5.08447265625, -4.8936767578125, -4.702880859375, -4.5120849609375, -4.3212890625, -4.1304931640625, -3.939697265625, -3.7489013671875, -3.55810546875, -3.3673095703125, -3.176513671875, -2.9857177734375, -2.794921875, -2.6041259765625, -2.413330078125, -2.2225341796875, -2.03173828125, -1.8409423828125, -1.650146484375, -1.4593505859375, -1.2685546875, -1.0777587890625, -0.886962890625, -0.6961669921875, -0.50537109375, -0.3145751953125, -0.123779296875, 0.0670166015625, 0.2578125, 0.4486083984375, 0.639404296875, 0.8302001953125, 1.02099609375, 1.2117919921875, 1.402587890625, 1.5933837890625, 1.7841796875, 1.9749755859375, 2.165771484375, 2.3565673828125, 2.54736328125, 2.7381591796875, 2.928955078125, 3.1197509765625, 3.310546875, 3.5013427734375, 3.692138671875, 3.8829345703125, 4.07373046875, 4.2645263671875, 4.455322265625, 4.6461181640625, 4.8369140625, 5.0277099609375, 5.218505859375, 5.4093017578125, 5.60009765625, 5.7908935546875, 5.981689453125, 6.1724853515625, 6.36328125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 6.0, 14.0, 9.0, 14.0, 18.0, 26.0, 28.0, 34.0, 39.0, 42.0, 51.0, 65.0, 50.0, 61.0, 56.0, 48.0, 52.0, 68.0, 57.0, 59.0, 55.0, 35.0, 28.0, 16.0, 17.0, 10.0, 11.0, 10.0, 5.0, 4.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34716796875, -0.3330841064453125, -0.319000244140625, -0.3049163818359375, -0.29083251953125, -0.2767486572265625, -0.262664794921875, -0.2485809326171875, -0.2344970703125, -0.2204132080078125, -0.206329345703125, -0.1922454833984375, -0.17816162109375, -0.1640777587890625, -0.149993896484375, -0.1359100341796875, -0.121826171875, -0.1077423095703125, -0.093658447265625, -0.0795745849609375, -0.06549072265625, -0.0514068603515625, -0.037322998046875, -0.0232391357421875, -0.0091552734375, 0.0049285888671875, 0.019012451171875, 0.0330963134765625, 0.04718017578125, 0.0612640380859375, 0.075347900390625, 0.0894317626953125, 0.103515625, 0.1175994873046875, 0.131683349609375, 0.1457672119140625, 0.15985107421875, 0.1739349365234375, 0.188018798828125, 0.2021026611328125, 0.2161865234375, 0.2302703857421875, 0.244354248046875, 0.2584381103515625, 0.27252197265625, 0.2866058349609375, 0.300689697265625, 0.3147735595703125, 0.328857421875, 0.3429412841796875, 0.357025146484375, 0.3711090087890625, 0.38519287109375, 0.3992767333984375, 0.413360595703125, 0.4274444580078125, 0.4415283203125, 0.4556121826171875, 0.469696044921875, 0.4837799072265625, 0.49786376953125, 0.5119476318359375, 0.526031494140625, 0.5401153564453125, 0.55419921875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 6.0, 5.0, 9.0, 11.0, 11.0, 30.0, 30.0, 36.0, 56.0, 78.0, 91.0, 150.0, 207.0, 268.0, 426.0, 671.0, 962.0, 1570.0, 2718.0, 5222.0, 11551.0, 40564.0, 3924259.0, 164373.0, 22715.0, 8103.0, 4003.0, 2185.0, 1297.0, 832.0, 542.0, 400.0, 241.0, 194.0, 132.0, 105.0, 78.0, 43.0, 33.0, 21.0, 18.0, 10.0, 12.0, 6.0, 5.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.53125, -1.48724365234375, -1.4432373046875, -1.39923095703125, -1.355224609375, -1.31121826171875, -1.2672119140625, -1.22320556640625, -1.17919921875, -1.13519287109375, -1.0911865234375, -1.04718017578125, -1.003173828125, -0.95916748046875, -0.9151611328125, -0.87115478515625, -0.8271484375, -0.78314208984375, -0.7391357421875, -0.69512939453125, -0.651123046875, -0.60711669921875, -0.5631103515625, -0.51910400390625, -0.47509765625, -0.43109130859375, -0.3870849609375, -0.34307861328125, -0.299072265625, -0.25506591796875, -0.2110595703125, -0.16705322265625, -0.123046875, -0.07904052734375, -0.0350341796875, 0.00897216796875, 0.052978515625, 0.09698486328125, 0.1409912109375, 0.18499755859375, 0.22900390625, 0.27301025390625, 0.3170166015625, 0.36102294921875, 0.405029296875, 0.44903564453125, 0.4930419921875, 0.53704833984375, 0.5810546875, 0.62506103515625, 0.6690673828125, 0.71307373046875, 0.757080078125, 0.80108642578125, 0.8450927734375, 0.88909912109375, 0.93310546875, 0.97711181640625, 1.0211181640625, 1.06512451171875, 1.109130859375, 1.15313720703125, 1.1971435546875, 1.24114990234375, 1.28515625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 8.0, 4.0, 7.0, 11.0, 20.0, 52.0, 137.0, 3525.0, 159.0, 57.0, 31.0, 10.0, 10.0, 14.0, 2.0, 5.0, 4.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.404052734375, -0.3926887512207031, -0.38132476806640625, -0.3699607849121094, -0.3585968017578125, -0.3472328186035156, -0.33586883544921875, -0.3245048522949219, -0.313140869140625, -0.3017768859863281, -0.29041290283203125, -0.2790489196777344, -0.2676849365234375, -0.2563209533691406, -0.24495697021484375, -0.23359298706054688, -0.22222900390625, -0.21086502075195312, -0.19950103759765625, -0.18813705444335938, -0.1767730712890625, -0.16540908813476562, -0.15404510498046875, -0.14268112182617188, -0.131317138671875, -0.11995315551757812, -0.10858917236328125, -0.09722518920898438, -0.0858612060546875, -0.07449722290039062, -0.06313323974609375, -0.051769256591796875, -0.0404052734375, -0.029041290283203125, -0.01767730712890625, -0.006313323974609375, 0.0050506591796875, 0.016414642333984375, 0.02777862548828125, 0.039142608642578125, 0.050506591796875, 0.061870574951171875, 0.07323455810546875, 0.08459854125976562, 0.0959625244140625, 0.10732650756835938, 0.11869049072265625, 0.13005447387695312, 0.14141845703125, 0.15278244018554688, 0.16414642333984375, 0.17551040649414062, 0.1868743896484375, 0.19823837280273438, 0.20960235595703125, 0.22096633911132812, 0.232330322265625, 0.24369430541992188, 0.25505828857421875, 0.2664222717285156, 0.2777862548828125, 0.2891502380371094, 0.30051422119140625, 0.3118782043457031, 0.3232421875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 10.0, 31.0, 92.0, 237.0, 289.0, 190.0, 99.0, 32.0, 16.0, 8.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0462324619293213, -0.9535099267959595, -0.8607873916625977, -0.7680649161338806, -0.6753423810005188, -0.582619845867157, -0.48989737033843994, -0.3971748352050781, -0.3044523000717163, -0.21172977983951569, -0.11900725960731506, -0.026284754276275635, 0.06643778085708618, 0.159160315990448, 0.25188279151916504, 0.34460532665252686, 0.43732786178588867, 0.5300503969192505, 0.6227729320526123, 0.7154954075813293, 0.8082179427146912, 0.900940477848053, 0.99366295337677, 1.0863854885101318, 1.1791080236434937, 1.2718305587768555, 1.3645530939102173, 1.457275629043579, 1.5499980449676514, 1.6427206993103027, 1.735443115234375, 1.8281656503677368, 1.9208884239196777, 2.01361083984375, 2.1063334941864014, 2.1990559101104736, 2.291778564453125, 2.3845009803771973, 2.4772233963012695, 2.569946050643921, 2.6626687049865723, 2.7553911209106445, 2.848113775253296, 2.940836191177368, 3.0335588455200195, 3.126281261444092, 3.219003677368164, 3.3117263317108154, 3.4044487476348877, 3.49717116355896, 3.5898938179016113, 3.6826162338256836, 3.775338888168335, 3.8680613040924072, 3.9607839584350586, 4.053506374359131, 4.146228790283203, 4.238951206207275, 4.331673622131348, 4.424396514892578, 4.51711893081665, 4.609841346740723, 4.702563762664795, 4.795286178588867, 4.888009071350098]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 5.0, 3.0, 5.0, 9.0, 11.0, 7.0, 13.0, 10.0, 11.0, 15.0, 12.0, 22.0, 34.0, 26.0, 31.0, 33.0, 43.0, 32.0, 52.0, 46.0, 66.0, 39.0, 38.0, 43.0, 37.0, 40.0, 36.0, 37.0, 33.0, 28.0, 24.0, 21.0, 28.0, 21.0, 22.0, 16.0, 14.0, 4.0, 11.0, 6.0, 2.0, 3.0, 7.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.7976868748664856, -0.7757668495178223, -0.7538468241691589, -0.7319267988204956, -0.7100067734718323, -0.688086748123169, -0.6661666631698608, -0.6442466974258423, -0.6223266124725342, -0.6004065871238708, -0.5784865617752075, -0.5565665364265442, -0.5346465110778809, -0.5127264857292175, -0.4908064305782318, -0.4688864052295685, -0.44696640968322754, -0.4250463843345642, -0.4031263589859009, -0.38120633363723755, -0.3592863082885742, -0.3373662829399109, -0.31544622778892517, -0.29352620244026184, -0.2716061770915985, -0.24968615174293518, -0.22776612639427185, -0.20584608614444733, -0.183926060795784, -0.16200603544712067, -0.14008599519729614, -0.11816596984863281, -0.09624588489532471, -0.07432585954666138, -0.05240582674741745, -0.030485793948173523, -0.008565768599510193, 0.013354256749153137, 0.03527429699897766, 0.05719432234764099, 0.07911434769630432, 0.10103437304496765, 0.12295440584421158, 0.1448744386434555, 0.16679446399211884, 0.18871448934078217, 0.2106345295906067, 0.23255455493927002, 0.25447458028793335, 0.2763946056365967, 0.29831463098526, 0.32023465633392334, 0.34215468168258667, 0.36407470703125, 0.3859947621822357, 0.40791478753089905, 0.4298348128795624, 0.4517548382282257, 0.47367486357688904, 0.49559491872787476, 0.5175149440765381, 0.5394349694252014, 0.5613549947738647, 0.5832750201225281, 0.6051950454711914]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 2.0, 3.0, 7.0, 11.0, 6.0, 10.0, 15.0, 22.0, 21.0, 34.0, 63.0, 86.0, 115.0, 178.0, 326.0, 562.0, 1114.0, 2232.0, 5050.0, 11364.0, 27631.0, 66528.0, 154987.0, 286040.0, 263722.0, 131824.0, 55557.0, 22732.0, 9754.0, 4228.0, 1966.0, 1009.0, 517.0, 280.0, 192.0, 111.0, 70.0, 51.0, 36.0, 28.0, 21.0, 18.0, 14.0, 6.0, 2.0, 1.0, 5.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96240234375, -0.9302139282226562, -0.8980255126953125, -0.8658370971679688, -0.833648681640625, -0.8014602661132812, -0.7692718505859375, -0.7370834350585938, -0.70489501953125, -0.6727066040039062, -0.6405181884765625, -0.6083297729492188, -0.576141357421875, -0.5439529418945312, -0.5117645263671875, -0.47957611083984375, -0.4473876953125, -0.41519927978515625, -0.3830108642578125, -0.35082244873046875, -0.318634033203125, -0.28644561767578125, -0.2542572021484375, -0.22206878662109375, -0.18988037109375, -0.15769195556640625, -0.1255035400390625, -0.09331512451171875, -0.061126708984375, -0.02893829345703125, 0.0032501220703125, 0.03543853759765625, 0.067626953125, 0.09981536865234375, 0.1320037841796875, 0.16419219970703125, 0.196380615234375, 0.22856903076171875, 0.2607574462890625, 0.29294586181640625, 0.32513427734375, 0.35732269287109375, 0.3895111083984375, 0.42169952392578125, 0.453887939453125, 0.48607635498046875, 0.5182647705078125, 0.5504531860351562, 0.5826416015625, 0.6148300170898438, 0.6470184326171875, 0.6792068481445312, 0.711395263671875, 0.7435836791992188, 0.7757720947265625, 0.8079605102539062, 0.84014892578125, 0.8723373413085938, 0.9045257568359375, 0.9367141723632812, 0.968902587890625, 1.0010910034179688, 1.0332794189453125, 1.0654678344726562, 1.09765625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 9.0, 7.0, 13.0, 11.0, 11.0, 19.0, 24.0, 30.0, 36.0, 27.0, 40.0, 45.0, 51.0, 67.0, 70.0, 54.0, 40.0, 50.0, 63.0, 53.0, 60.0, 48.0, 34.0, 32.0, 27.0, 19.0, 8.0, 12.0, 13.0, 4.0, 2.0, 7.0, 12.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38720703125, -0.37223052978515625, -0.3572540283203125, -0.34227752685546875, -0.327301025390625, -0.31232452392578125, -0.2973480224609375, -0.28237152099609375, -0.26739501953125, -0.25241851806640625, -0.2374420166015625, -0.22246551513671875, -0.207489013671875, -0.19251251220703125, -0.1775360107421875, -0.16255950927734375, -0.1475830078125, -0.13260650634765625, -0.1176300048828125, -0.10265350341796875, -0.087677001953125, -0.07270050048828125, -0.0577239990234375, -0.04274749755859375, -0.02777099609375, -0.01279449462890625, 0.0021820068359375, 0.01715850830078125, 0.032135009765625, 0.04711151123046875, 0.0620880126953125, 0.07706451416015625, 0.092041015625, 0.10701751708984375, 0.1219940185546875, 0.13697052001953125, 0.151947021484375, 0.16692352294921875, 0.1819000244140625, 0.19687652587890625, 0.21185302734375, 0.22682952880859375, 0.2418060302734375, 0.25678253173828125, 0.271759033203125, 0.28673553466796875, 0.3017120361328125, 0.31668853759765625, 0.3316650390625, 0.34664154052734375, 0.3616180419921875, 0.37659454345703125, 0.391571044921875, 0.40654754638671875, 0.4215240478515625, 0.43650054931640625, 0.45147705078125, 0.46645355224609375, 0.4814300537109375, 0.49640655517578125, 0.511383056640625, 0.5263595581054688, 0.5413360595703125, 0.5563125610351562, 0.5712890625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 7.0, 3.0, 4.0, 7.0, 9.0, 22.0, 34.0, 36.0, 64.0, 93.0, 181.0, 348.0, 685.0, 1655.0, 4231.0, 12371.0, 41516.0, 152567.0, 438159.0, 282486.0, 79953.0, 22241.0, 7146.0, 2598.0, 1071.0, 472.0, 225.0, 126.0, 85.0, 59.0, 38.0, 25.0, 5.0, 10.0, 6.0, 5.0, 2.0, 4.0, 7.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.49609375, -1.4517669677734375, -1.407440185546875, -1.3631134033203125, -1.31878662109375, -1.2744598388671875, -1.230133056640625, -1.1858062744140625, -1.1414794921875, -1.0971527099609375, -1.052825927734375, -1.0084991455078125, -0.96417236328125, -0.9198455810546875, -0.875518798828125, -0.8311920166015625, -0.786865234375, -0.7425384521484375, -0.698211669921875, -0.6538848876953125, -0.60955810546875, -0.5652313232421875, -0.520904541015625, -0.4765777587890625, -0.4322509765625, -0.3879241943359375, -0.343597412109375, -0.2992706298828125, -0.25494384765625, -0.2106170654296875, -0.166290283203125, -0.1219635009765625, -0.07763671875, -0.0333099365234375, 0.011016845703125, 0.0553436279296875, 0.09967041015625, 0.1439971923828125, 0.188323974609375, 0.2326507568359375, 0.2769775390625, 0.3213043212890625, 0.365631103515625, 0.4099578857421875, 0.45428466796875, 0.4986114501953125, 0.542938232421875, 0.5872650146484375, 0.631591796875, 0.6759185791015625, 0.720245361328125, 0.7645721435546875, 0.80889892578125, 0.8532257080078125, 0.897552490234375, 0.9418792724609375, 0.9862060546875, 1.0305328369140625, 1.074859619140625, 1.1191864013671875, 1.16351318359375, 1.2078399658203125, 1.252166748046875, 1.2964935302734375, 1.3408203125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 5.0, 6.0, 4.0, 11.0, 19.0, 12.0, 15.0, 22.0, 24.0, 28.0, 32.0, 39.0, 38.0, 46.0, 33.0, 46.0, 39.0, 55.0, 44.0, 50.0, 54.0, 55.0, 55.0, 35.0, 49.0, 26.0, 26.0, 19.0, 26.0, 23.0, 13.0, 9.0, 8.0, 10.0, 5.0, 5.0, 7.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8994140625, -1.8316192626953125, -1.763824462890625, -1.6960296630859375, -1.62823486328125, -1.5604400634765625, -1.492645263671875, -1.4248504638671875, -1.3570556640625, -1.2892608642578125, -1.221466064453125, -1.1536712646484375, -1.08587646484375, -1.0180816650390625, -0.950286865234375, -0.8824920654296875, -0.814697265625, -0.7469024658203125, -0.679107666015625, -0.6113128662109375, -0.54351806640625, -0.4757232666015625, -0.407928466796875, -0.3401336669921875, -0.2723388671875, -0.2045440673828125, -0.136749267578125, -0.0689544677734375, -0.00115966796875, 0.0666351318359375, 0.134429931640625, 0.2022247314453125, 0.27001953125, 0.3378143310546875, 0.405609130859375, 0.4734039306640625, 0.54119873046875, 0.6089935302734375, 0.676788330078125, 0.7445831298828125, 0.8123779296875, 0.8801727294921875, 0.947967529296875, 1.0157623291015625, 1.08355712890625, 1.1513519287109375, 1.219146728515625, 1.2869415283203125, 1.354736328125, 1.4225311279296875, 1.490325927734375, 1.5581207275390625, 1.62591552734375, 1.6937103271484375, 1.761505126953125, 1.8292999267578125, 1.8970947265625, 1.9648895263671875, 2.032684326171875, 2.1004791259765625, 2.16827392578125, 2.2360687255859375, 2.303863525390625, 2.3716583251953125, 2.439453125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 5.0, 7.0, 8.0, 27.0, 48.0, 128.0, 316.0, 1101.0, 8330.0, 332230.0, 690169.0, 13981.0, 1547.0, 387.0, 156.0, 64.0, 22.0, 15.0, 8.0, 6.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8671875, -1.8071441650390625, -1.747100830078125, -1.6870574951171875, -1.62701416015625, -1.5669708251953125, -1.506927490234375, -1.4468841552734375, -1.3868408203125, -1.3267974853515625, -1.266754150390625, -1.2067108154296875, -1.14666748046875, -1.0866241455078125, -1.026580810546875, -0.9665374755859375, -0.906494140625, -0.8464508056640625, -0.786407470703125, -0.7263641357421875, -0.66632080078125, -0.6062774658203125, -0.546234130859375, -0.4861907958984375, -0.4261474609375, -0.3661041259765625, -0.306060791015625, -0.2460174560546875, -0.18597412109375, -0.1259307861328125, -0.065887451171875, -0.0058441162109375, 0.05419921875, 0.1142425537109375, 0.174285888671875, 0.2343292236328125, 0.29437255859375, 0.3544158935546875, 0.414459228515625, 0.4745025634765625, 0.5345458984375, 0.5945892333984375, 0.654632568359375, 0.7146759033203125, 0.77471923828125, 0.8347625732421875, 0.894805908203125, 0.9548492431640625, 1.014892578125, 1.0749359130859375, 1.134979248046875, 1.1950225830078125, 1.25506591796875, 1.3151092529296875, 1.375152587890625, 1.4351959228515625, 1.4952392578125, 1.5552825927734375, 1.615325927734375, 1.6753692626953125, 1.73541259765625, 1.7954559326171875, 1.855499267578125, 1.9155426025390625, 1.9755859375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 2.0, 6.0, 9.0, 8.0, 10.0, 15.0, 29.0, 36.0, 38.0, 43.0, 65.0, 69.0, 70.0, 88.0, 86.0, 105.0, 86.0, 65.0, 53.0, 38.0, 17.0, 19.0, 10.0, 8.0, 11.0, 9.0, 1.0, 3.0, 3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010341405868530273, -9.95611771941185e-05, -9.570829570293427e-05, -9.185541421175003e-05, -8.80025327205658e-05, -8.414965122938156e-05, -8.029676973819733e-05, -7.644388824701309e-05, -7.259100675582886e-05, -6.873812526464462e-05, -6.488524377346039e-05, -6.1032362282276154e-05, -5.717948079109192e-05, -5.3326599299907684e-05, -4.947371780872345e-05, -4.5620836317539215e-05, -4.176795482635498e-05, -3.7915073335170746e-05, -3.406219184398651e-05, -3.0209310352802277e-05, -2.6356428861618042e-05, -2.2503547370433807e-05, -1.8650665879249573e-05, -1.4797784388065338e-05, -1.0944902896881104e-05, -7.092021405696869e-06, -3.2391399145126343e-06, 6.137415766716003e-07, 4.466623067855835e-06, 8.31950455904007e-06, 1.2172386050224304e-05, 1.602526754140854e-05, 1.9878149032592773e-05, 2.3731030523777008e-05, 2.7583912014961243e-05, 3.143679350614548e-05, 3.528967499732971e-05, 3.9142556488513947e-05, 4.299543797969818e-05, 4.6848319470882416e-05, 5.070120096206665e-05, 5.4554082453250885e-05, 5.840696394443512e-05, 6.225984543561935e-05, 6.611272692680359e-05, 6.996560841798782e-05, 7.381848990917206e-05, 7.767137140035629e-05, 8.152425289154053e-05, 8.537713438272476e-05, 8.9230015873909e-05, 9.308289736509323e-05, 9.693577885627747e-05, 0.0001007886603474617, 0.00010464154183864594, 0.00010849442332983017, 0.0001123473048210144, 0.00011620018631219864, 0.00012005306780338287, 0.0001239059492945671, 0.00012775883078575134, 0.00013161171227693558, 0.0001354645937681198, 0.00013931747525930405, 0.00014317035675048828]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 4.0, 14.0, 24.0, 37.0, 80.0, 211.0, 484.0, 1405.0, 5472.0, 38059.0, 505359.0, 455582.0, 34629.0, 5050.0, 1314.0, 433.0, 190.0, 92.0, 45.0, 18.0, 14.0, 16.0, 4.0, 8.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2314453125, -1.1981430053710938, -1.1648406982421875, -1.1315383911132812, -1.098236083984375, -1.0649337768554688, -1.0316314697265625, -0.9983291625976562, -0.96502685546875, -0.9317245483398438, -0.8984222412109375, -0.8651199340820312, -0.831817626953125, -0.7985153198242188, -0.7652130126953125, -0.7319107055664062, -0.6986083984375, -0.6653060913085938, -0.6320037841796875, -0.5987014770507812, -0.565399169921875, -0.5320968627929688, -0.4987945556640625, -0.46549224853515625, -0.43218994140625, -0.39888763427734375, -0.3655853271484375, -0.33228302001953125, -0.298980712890625, -0.26567840576171875, -0.2323760986328125, -0.19907379150390625, -0.165771484375, -0.13246917724609375, -0.0991668701171875, -0.06586456298828125, -0.032562255859375, 0.00074005126953125, 0.0340423583984375, 0.06734466552734375, 0.10064697265625, 0.13394927978515625, 0.1672515869140625, 0.20055389404296875, 0.233856201171875, 0.26715850830078125, 0.3004608154296875, 0.33376312255859375, 0.3670654296875, 0.40036773681640625, 0.4336700439453125, 0.46697235107421875, 0.500274658203125, 0.5335769653320312, 0.5668792724609375, 0.6001815795898438, 0.63348388671875, 0.6667861938476562, 0.7000885009765625, 0.7333908081054688, 0.766693115234375, 0.7999954223632812, 0.8332977294921875, 0.8666000366210938, 0.89990234375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 6.0, 5.0, 4.0, 1.0, 8.0, 8.0, 9.0, 19.0, 28.0, 38.0, 58.0, 75.0, 98.0, 101.0, 107.0, 107.0, 76.0, 66.0, 49.0, 38.0, 32.0, 19.0, 16.0, 7.0, 7.0, 9.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.1708984375, -1.138763427734375, -1.10662841796875, -1.074493408203125, -1.0423583984375, -1.010223388671875, -0.97808837890625, -0.945953369140625, -0.913818359375, -0.881683349609375, -0.84954833984375, -0.817413330078125, -0.7852783203125, -0.753143310546875, -0.72100830078125, -0.688873291015625, -0.65673828125, -0.624603271484375, -0.59246826171875, -0.560333251953125, -0.5281982421875, -0.496063232421875, -0.46392822265625, -0.431793212890625, -0.399658203125, -0.367523193359375, -0.33538818359375, -0.303253173828125, -0.2711181640625, -0.238983154296875, -0.20684814453125, -0.174713134765625, -0.142578125, -0.110443115234375, -0.07830810546875, -0.046173095703125, -0.0140380859375, 0.018096923828125, 0.05023193359375, 0.082366943359375, 0.114501953125, 0.146636962890625, 0.17877197265625, 0.210906982421875, 0.2430419921875, 0.275177001953125, 0.30731201171875, 0.339447021484375, 0.37158203125, 0.403717041015625, 0.43585205078125, 0.467987060546875, 0.5001220703125, 0.532257080078125, 0.56439208984375, 0.596527099609375, 0.628662109375, 0.660797119140625, 0.69293212890625, 0.725067138671875, 0.7572021484375, 0.789337158203125, 0.82147216796875, 0.853607177734375, 0.8857421875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 7.0, 10.0, 15.0, 34.0, 59.0, 71.0, 125.0, 130.0, 126.0, 144.0, 103.0, 63.0, 45.0, 22.0, 20.0, 8.0, 5.0, 11.0, 5.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.77946949005127, -10.329562187194824, -9.879655838012695, -9.42974853515625, -8.979841232299805, -8.52993392944336, -8.080026626586914, -7.630120277404785, -7.18021297454834, -6.7303056716918945, -6.280398845672607, -5.83049201965332, -5.380584716796875, -4.93067741394043, -4.480770587921143, -4.0308637619018555, -3.58095645904541, -3.131049394607544, -2.6811423301696777, -2.2312352657318115, -1.7813282012939453, -1.331421136856079, -0.8815140724182129, -0.4316070079803467, 0.01830005645751953, 0.46820712089538574, 0.918114185333252, 1.3680212497711182, 1.8179283142089844, 2.2678353786468506, 2.717742443084717, 3.167649507522583, 3.617555618286133, 4.067462921142578, 4.517369747161865, 4.967276573181152, 5.417183876037598, 5.867091178894043, 6.31699800491333, 6.766904830932617, 7.2168121337890625, 7.666719436645508, 8.116626739501953, 8.566533088684082, 9.016440391540527, 9.466347694396973, 9.916254043579102, 10.366161346435547, 10.816068649291992, 11.265975952148438, 11.715883255004883, 12.165789604187012, 12.615696907043457, 13.065604209899902, 13.515510559082031, 13.965417861938477, 14.415325164794922, 14.865232467651367, 15.315139770507812, 15.765046119689941, 16.214954376220703, 16.664859771728516, 17.11476707458496, 17.564674377441406, 18.01458168029785]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 9.0, 11.0, 13.0, 11.0, 2.0, 15.0, 13.0, 18.0, 28.0, 21.0, 29.0, 20.0, 42.0, 35.0, 45.0, 44.0, 42.0, 48.0, 46.0, 45.0, 52.0, 45.0, 41.0, 44.0, 40.0, 30.0, 34.0, 29.0, 24.0, 20.0, 16.0, 18.0, 12.0, 9.0, 10.0, 12.0, 7.0, 11.0, 2.0, 3.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.964408874511719, -9.643903732299805, -9.323399543762207, -9.002894401550293, -8.682389259338379, -8.361885070800781, -8.041379928588867, -7.720874786376953, -7.400370121002197, -7.079865455627441, -6.759360313415527, -6.4388556480407715, -6.118350982666016, -5.797845840454102, -5.477341175079346, -5.15683650970459, -4.836331367492676, -4.51582670211792, -4.195321559906006, -3.87481689453125, -3.554311990737915, -3.23380708694458, -2.913302421569824, -2.5927975177764893, -2.2722926139831543, -1.9517877101898193, -1.631282925605774, -1.3107781410217285, -0.9902732372283936, -0.6697683334350586, -0.3492635488510132, -0.028758764266967773, 0.2917461395263672, 0.6122509837150574, 0.9327558279037476, 1.253260612487793, 1.573765516281128, 1.894270420074463, 2.2147750854492188, 2.5352799892425537, 2.8557848930358887, 3.1762897968292236, 3.4967947006225586, 3.8172993659973145, 4.13780403137207, 4.458309173583984, 4.77881383895874, 5.099318504333496, 5.41982364654541, 5.740328311920166, 6.06083345413208, 6.381338119506836, 6.70184326171875, 7.022347927093506, 7.342852592468262, 7.663357734680176, 7.983862400054932, 8.304367065429688, 8.624872207641602, 8.945377349853516, 9.265881538391113, 9.586386680603027, 9.906891822814941, 10.227396011352539, 10.547901153564453]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 6.0, 10.0, 8.0, 16.0, 24.0, 31.0, 43.0, 66.0, 99.0, 192.0, 337.0, 602.0, 1214.0, 2793.0, 7386.0, 28560.0, 3951876.0, 171251.0, 19420.0, 5743.0, 2191.0, 1026.0, 510.0, 343.0, 197.0, 109.0, 61.0, 51.0, 37.0, 23.0, 15.0, 11.0, 10.0, 8.0, 6.0, 5.0, 0.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4375, -1.3819580078125, -1.326416015625, -1.2708740234375, -1.21533203125, -1.1597900390625, -1.104248046875, -1.0487060546875, -0.9931640625, -0.9376220703125, -0.882080078125, -0.8265380859375, -0.77099609375, -0.7154541015625, -0.659912109375, -0.6043701171875, -0.548828125, -0.4932861328125, -0.437744140625, -0.3822021484375, -0.32666015625, -0.2711181640625, -0.215576171875, -0.1600341796875, -0.1044921875, -0.0489501953125, 0.006591796875, 0.0621337890625, 0.11767578125, 0.1732177734375, 0.228759765625, 0.2843017578125, 0.33984375, 0.3953857421875, 0.450927734375, 0.5064697265625, 0.56201171875, 0.6175537109375, 0.673095703125, 0.7286376953125, 0.7841796875, 0.8397216796875, 0.895263671875, 0.9508056640625, 1.00634765625, 1.0618896484375, 1.117431640625, 1.1729736328125, 1.228515625, 1.2840576171875, 1.339599609375, 1.3951416015625, 1.45068359375, 1.5062255859375, 1.561767578125, 1.6173095703125, 1.6728515625, 1.7283935546875, 1.783935546875, 1.8394775390625, 1.89501953125, 1.9505615234375, 2.006103515625, 2.0616455078125, 2.1171875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 6.0, 5.0, 8.0, 11.0, 16.0, 19.0, 19.0, 31.0, 30.0, 43.0, 48.0, 41.0, 51.0, 69.0, 72.0, 72.0, 62.0, 49.0, 56.0, 45.0, 39.0, 45.0, 27.0, 32.0, 29.0, 19.0, 18.0, 9.0, 8.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.6240234375, -0.605438232421875, -0.58685302734375, -0.568267822265625, -0.5496826171875, -0.531097412109375, -0.51251220703125, -0.493927001953125, -0.475341796875, -0.456756591796875, -0.43817138671875, -0.419586181640625, -0.4010009765625, -0.382415771484375, -0.36383056640625, -0.345245361328125, -0.32666015625, -0.308074951171875, -0.28948974609375, -0.270904541015625, -0.2523193359375, -0.233734130859375, -0.21514892578125, -0.196563720703125, -0.177978515625, -0.159393310546875, -0.14080810546875, -0.122222900390625, -0.1036376953125, -0.085052490234375, -0.06646728515625, -0.047882080078125, -0.029296875, -0.010711669921875, 0.00787353515625, 0.026458740234375, 0.0450439453125, 0.063629150390625, 0.08221435546875, 0.100799560546875, 0.119384765625, 0.137969970703125, 0.15655517578125, 0.175140380859375, 0.1937255859375, 0.212310791015625, 0.23089599609375, 0.249481201171875, 0.26806640625, 0.286651611328125, 0.30523681640625, 0.323822021484375, 0.3424072265625, 0.360992431640625, 0.37957763671875, 0.398162841796875, 0.416748046875, 0.435333251953125, 0.45391845703125, 0.472503662109375, 0.4910888671875, 0.509674072265625, 0.52825927734375, 0.546844482421875, 0.5654296875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 4.0, 5.0, 10.0, 15.0, 17.0, 20.0, 28.0, 41.0, 59.0, 98.0, 141.0, 195.0, 296.0, 432.0, 664.0, 1064.0, 1658.0, 2761.0, 5155.0, 10648.0, 24686.0, 76959.0, 3766543.0, 223620.0, 44716.0, 16841.0, 7564.0, 3871.0, 2226.0, 1411.0, 801.0, 549.0, 394.0, 255.0, 187.0, 104.0, 70.0, 45.0, 37.0, 26.0, 29.0, 8.0, 11.0, 7.0, 5.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.1513671875, -1.115142822265625, -1.07891845703125, -1.042694091796875, -1.0064697265625, -0.970245361328125, -0.93402099609375, -0.897796630859375, -0.861572265625, -0.825347900390625, -0.78912353515625, -0.752899169921875, -0.7166748046875, -0.680450439453125, -0.64422607421875, -0.608001708984375, -0.57177734375, -0.535552978515625, -0.49932861328125, -0.463104248046875, -0.4268798828125, -0.390655517578125, -0.35443115234375, -0.318206787109375, -0.281982421875, -0.245758056640625, -0.20953369140625, -0.173309326171875, -0.1370849609375, -0.100860595703125, -0.06463623046875, -0.028411865234375, 0.0078125, 0.044036865234375, 0.08026123046875, 0.116485595703125, 0.1527099609375, 0.188934326171875, 0.22515869140625, 0.261383056640625, 0.297607421875, 0.333831787109375, 0.37005615234375, 0.406280517578125, 0.4425048828125, 0.478729248046875, 0.51495361328125, 0.551177978515625, 0.58740234375, 0.623626708984375, 0.65985107421875, 0.696075439453125, 0.7322998046875, 0.768524169921875, 0.80474853515625, 0.840972900390625, 0.877197265625, 0.913421630859375, 0.94964599609375, 0.985870361328125, 1.0220947265625, 1.058319091796875, 1.09454345703125, 1.130767822265625, 1.1669921875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 3.0, 6.0, 6.0, 8.0, 4.0, 16.0, 20.0, 25.0, 46.0, 77.0, 166.0, 3302.0, 173.0, 80.0, 32.0, 37.0, 19.0, 11.0, 14.0, 7.0, 7.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.494140625, -0.48131561279296875, -0.4684906005859375, -0.45566558837890625, -0.442840576171875, -0.43001556396484375, -0.4171905517578125, -0.40436553955078125, -0.39154052734375, -0.37871551513671875, -0.3658905029296875, -0.35306549072265625, -0.340240478515625, -0.32741546630859375, -0.3145904541015625, -0.30176544189453125, -0.2889404296875, -0.27611541748046875, -0.2632904052734375, -0.25046539306640625, -0.237640380859375, -0.22481536865234375, -0.2119903564453125, -0.19916534423828125, -0.18634033203125, -0.17351531982421875, -0.1606903076171875, -0.14786529541015625, -0.135040283203125, -0.12221527099609375, -0.1093902587890625, -0.09656524658203125, -0.083740234375, -0.07091522216796875, -0.0580902099609375, -0.04526519775390625, -0.032440185546875, -0.01961517333984375, -0.0067901611328125, 0.00603485107421875, 0.01885986328125, 0.03168487548828125, 0.0445098876953125, 0.05733489990234375, 0.070159912109375, 0.08298492431640625, 0.0958099365234375, 0.10863494873046875, 0.1214599609375, 0.13428497314453125, 0.1471099853515625, 0.15993499755859375, 0.172760009765625, 0.18558502197265625, 0.1984100341796875, 0.21123504638671875, 0.22406005859375, 0.23688507080078125, 0.2497100830078125, 0.26253509521484375, 0.275360107421875, 0.28818511962890625, 0.3010101318359375, 0.31383514404296875, 0.32666015625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 0.0, 21.0, 90.0, 167.0, 231.0, 242.0, 137.0, 77.0, 29.0, 6.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.519367218017578, -5.406399250030518, -5.293430805206299, -5.180462837219238, -5.0674943923950195, -4.954526424407959, -4.84155797958374, -4.72859001159668, -4.615621566772461, -4.5026535987854, -4.389685153961182, -4.276717185974121, -4.163748741149902, -4.050780773162842, -3.937812328338623, -3.8248443603515625, -3.711876153945923, -3.598907947540283, -3.4859397411346436, -3.372971534729004, -3.2600033283233643, -3.1470351219177246, -3.034067153930664, -2.9210987091064453, -2.8081307411193848, -2.695162534713745, -2.5821943283081055, -2.469226121902466, -2.356257915496826, -2.2432897090911865, -2.130321502685547, -2.0173535346984863, -1.9043848514556885, -1.7914166450500488, -1.6784484386444092, -1.5654802322387695, -1.4525120258331299, -1.3395438194274902, -1.2265757322311401, -1.1136075258255005, -1.0006393194198608, -0.8876711130142212, -0.7747029066085815, -0.6617347598075867, -0.548766553401947, -0.4357983469963074, -0.3228302001953125, -0.20986199378967285, -0.0968937873840332, 0.01607440412044525, 0.1290425956249237, 0.24201077222824097, 0.3549789786338806, 0.46794718503952026, 0.5809153318405151, 0.6938835382461548, 0.8068517446517944, 0.9198199510574341, 1.0327881574630737, 1.1457562446594238, 1.2587244510650635, 1.3716926574707031, 1.4846608638763428, 1.5976290702819824, 1.710597276687622]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 7.0, 2.0, 5.0, 6.0, 10.0, 10.0, 9.0, 8.0, 18.0, 12.0, 14.0, 15.0, 24.0, 26.0, 23.0, 23.0, 41.0, 33.0, 32.0, 36.0, 30.0, 44.0, 40.0, 51.0, 42.0, 41.0, 34.0, 40.0, 42.0, 33.0, 27.0, 22.0, 27.0, 29.0, 22.0, 28.0, 13.0, 16.0, 12.0, 11.0, 13.0, 10.0, 7.0, 8.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.7974575161933899, -0.7742125391960144, -0.7509675621986389, -0.7277225852012634, -0.7044776082038879, -0.6812326312065125, -0.657987654209137, -0.6347426772117615, -0.611497700214386, -0.5882527232170105, -0.565007746219635, -0.5417627692222595, -0.518517792224884, -0.49527281522750854, -0.47202783823013306, -0.44878286123275757, -0.42553791403770447, -0.402292937040329, -0.3790479600429535, -0.355802983045578, -0.3325580060482025, -0.309313029050827, -0.2860680818557739, -0.26282310485839844, -0.23957811295986176, -0.21633313596248627, -0.19308815896511078, -0.16984319686889648, -0.146598219871521, -0.12335323542356491, -0.10010826587677002, -0.07686328887939453, -0.05361831188201904, -0.030373336747288704, -0.007128361612558365, 0.016116611659526825, 0.03936158865690231, 0.0626065656542778, 0.08585153520107269, 0.10909651219844818, 0.13234148919582367, 0.15558646619319916, 0.17883144319057465, 0.20207640528678894, 0.22532138228416443, 0.24856635928153992, 0.2718113362789154, 0.2950563132762909, 0.3183012902736664, 0.34154626727104187, 0.36479124426841736, 0.38803622126579285, 0.41128119826316833, 0.4345261752605438, 0.4577711224555969, 0.4810160994529724, 0.5042610764503479, 0.5275060534477234, 0.5507510304450989, 0.5739960074424744, 0.5972409844398499, 0.6204859614372253, 0.6437309384346008, 0.6669759154319763, 0.6902208924293518]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 7.0, 9.0, 13.0, 14.0, 24.0, 28.0, 55.0, 77.0, 118.0, 177.0, 262.0, 448.0, 742.0, 1192.0, 2261.0, 3898.0, 7331.0, 14877.0, 31939.0, 71406.0, 157678.0, 270853.0, 246870.0, 128387.0, 57304.0, 26131.0, 12321.0, 6144.0, 3373.0, 1779.0, 1077.0, 634.0, 383.0, 253.0, 195.0, 77.0, 82.0, 46.0, 35.0, 22.0, 9.0, 8.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.9306640625, -0.9005126953125, -0.870361328125, -0.8402099609375, -0.81005859375, -0.7799072265625, -0.749755859375, -0.7196044921875, -0.689453125, -0.6593017578125, -0.629150390625, -0.5989990234375, -0.56884765625, -0.5386962890625, -0.508544921875, -0.4783935546875, -0.4482421875, -0.4180908203125, -0.387939453125, -0.3577880859375, -0.32763671875, -0.2974853515625, -0.267333984375, -0.2371826171875, -0.20703125, -0.1768798828125, -0.146728515625, -0.1165771484375, -0.08642578125, -0.0562744140625, -0.026123046875, 0.0040283203125, 0.0341796875, 0.0643310546875, 0.094482421875, 0.1246337890625, 0.15478515625, 0.1849365234375, 0.215087890625, 0.2452392578125, 0.275390625, 0.3055419921875, 0.335693359375, 0.3658447265625, 0.39599609375, 0.4261474609375, 0.456298828125, 0.4864501953125, 0.5166015625, 0.5467529296875, 0.576904296875, 0.6070556640625, 0.63720703125, 0.6673583984375, 0.697509765625, 0.7276611328125, 0.7578125, 0.7879638671875, 0.818115234375, 0.8482666015625, 0.87841796875, 0.9085693359375, 0.938720703125, 0.9688720703125, 0.9990234375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 7.0, 8.0, 11.0, 18.0, 16.0, 10.0, 16.0, 31.0, 32.0, 37.0, 38.0, 41.0, 47.0, 52.0, 59.0, 59.0, 48.0, 62.0, 54.0, 57.0, 46.0, 34.0, 37.0, 28.0, 32.0, 26.0, 16.0, 11.0, 16.0, 12.0, 10.0, 9.0, 2.0, 7.0, 2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5341796875, -0.5171279907226562, -0.5000762939453125, -0.48302459716796875, -0.465972900390625, -0.44892120361328125, -0.4318695068359375, -0.41481781005859375, -0.39776611328125, -0.38071441650390625, -0.3636627197265625, -0.34661102294921875, -0.329559326171875, -0.31250762939453125, -0.2954559326171875, -0.27840423583984375, -0.2613525390625, -0.24430084228515625, -0.2272491455078125, -0.21019744873046875, -0.193145751953125, -0.17609405517578125, -0.1590423583984375, -0.14199066162109375, -0.12493896484375, -0.10788726806640625, -0.0908355712890625, -0.07378387451171875, -0.056732177734375, -0.03968048095703125, -0.0226287841796875, -0.00557708740234375, 0.011474609375, 0.02852630615234375, 0.0455780029296875, 0.06262969970703125, 0.079681396484375, 0.09673309326171875, 0.1137847900390625, 0.13083648681640625, 0.14788818359375, 0.16493988037109375, 0.1819915771484375, 0.19904327392578125, 0.216094970703125, 0.23314666748046875, 0.2501983642578125, 0.26725006103515625, 0.2843017578125, 0.30135345458984375, 0.3184051513671875, 0.33545684814453125, 0.352508544921875, 0.36956024169921875, 0.3866119384765625, 0.40366363525390625, 0.42071533203125, 0.43776702880859375, 0.4548187255859375, 0.47187042236328125, 0.488922119140625, 0.5059738159179688, 0.5230255126953125, 0.5400772094726562, 0.55712890625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 10.0, 13.0, 24.0, 30.0, 29.0, 59.0, 72.0, 130.0, 214.0, 344.0, 677.0, 1508.0, 3974.0, 14159.0, 79042.0, 529606.0, 353847.0, 49202.0, 10021.0, 2994.0, 1216.0, 565.0, 312.0, 179.0, 99.0, 75.0, 50.0, 36.0, 16.0, 14.0, 8.0, 13.0, 2.0, 2.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.478515625, -2.409423828125, -2.34033203125, -2.271240234375, -2.2021484375, -2.133056640625, -2.06396484375, -1.994873046875, -1.92578125, -1.856689453125, -1.78759765625, -1.718505859375, -1.6494140625, -1.580322265625, -1.51123046875, -1.442138671875, -1.373046875, -1.303955078125, -1.23486328125, -1.165771484375, -1.0966796875, -1.027587890625, -0.95849609375, -0.889404296875, -0.8203125, -0.751220703125, -0.68212890625, -0.613037109375, -0.5439453125, -0.474853515625, -0.40576171875, -0.336669921875, -0.267578125, -0.198486328125, -0.12939453125, -0.060302734375, 0.0087890625, 0.077880859375, 0.14697265625, 0.216064453125, 0.28515625, 0.354248046875, 0.42333984375, 0.492431640625, 0.5615234375, 0.630615234375, 0.69970703125, 0.768798828125, 0.837890625, 0.906982421875, 0.97607421875, 1.045166015625, 1.1142578125, 1.183349609375, 1.25244140625, 1.321533203125, 1.390625, 1.459716796875, 1.52880859375, 1.597900390625, 1.6669921875, 1.736083984375, 1.80517578125, 1.874267578125, 1.943359375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 9.0, 5.0, 10.0, 9.0, 15.0, 18.0, 15.0, 23.0, 23.0, 32.0, 38.0, 38.0, 51.0, 41.0, 49.0, 60.0, 43.0, 58.0, 50.0, 48.0, 43.0, 58.0, 44.0, 39.0, 37.0, 25.0, 18.0, 18.0, 15.0, 11.0, 14.0, 15.0, 12.0, 6.0, 8.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.8671875, -2.789031982421875, -2.71087646484375, -2.632720947265625, -2.5545654296875, -2.476409912109375, -2.39825439453125, -2.320098876953125, -2.241943359375, -2.163787841796875, -2.08563232421875, -2.007476806640625, -1.9293212890625, -1.851165771484375, -1.77301025390625, -1.694854736328125, -1.61669921875, -1.538543701171875, -1.46038818359375, -1.382232666015625, -1.3040771484375, -1.225921630859375, -1.14776611328125, -1.069610595703125, -0.991455078125, -0.913299560546875, -0.83514404296875, -0.756988525390625, -0.6788330078125, -0.600677490234375, -0.52252197265625, -0.444366455078125, -0.3662109375, -0.288055419921875, -0.20989990234375, -0.131744384765625, -0.0535888671875, 0.024566650390625, 0.10272216796875, 0.180877685546875, 0.259033203125, 0.337188720703125, 0.41534423828125, 0.493499755859375, 0.5716552734375, 0.649810791015625, 0.72796630859375, 0.806121826171875, 0.88427734375, 0.962432861328125, 1.04058837890625, 1.118743896484375, 1.1968994140625, 1.275054931640625, 1.35321044921875, 1.431365966796875, 1.509521484375, 1.587677001953125, 1.66583251953125, 1.743988037109375, 1.8221435546875, 1.900299072265625, 1.97845458984375, 2.056610107421875, 2.134765625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 8.0, 13.0, 23.0, 35.0, 42.0, 85.0, 168.0, 373.0, 1198.0, 4844.0, 35516.0, 877468.0, 116884.0, 8941.0, 1988.0, 518.0, 192.0, 103.0, 54.0, 34.0, 24.0, 12.0, 10.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8681640625, -1.8030242919921875, -1.737884521484375, -1.6727447509765625, -1.60760498046875, -1.5424652099609375, -1.477325439453125, -1.4121856689453125, -1.3470458984375, -1.2819061279296875, -1.216766357421875, -1.1516265869140625, -1.08648681640625, -1.0213470458984375, -0.956207275390625, -0.8910675048828125, -0.825927734375, -0.7607879638671875, -0.695648193359375, -0.6305084228515625, -0.56536865234375, -0.5002288818359375, -0.435089111328125, -0.3699493408203125, -0.3048095703125, -0.2396697998046875, -0.174530029296875, -0.1093902587890625, -0.04425048828125, 0.0208892822265625, 0.086029052734375, 0.1511688232421875, 0.21630859375, 0.2814483642578125, 0.346588134765625, 0.4117279052734375, 0.47686767578125, 0.5420074462890625, 0.607147216796875, 0.6722869873046875, 0.7374267578125, 0.8025665283203125, 0.867706298828125, 0.9328460693359375, 0.99798583984375, 1.0631256103515625, 1.128265380859375, 1.1934051513671875, 1.258544921875, 1.3236846923828125, 1.388824462890625, 1.4539642333984375, 1.51910400390625, 1.5842437744140625, 1.649383544921875, 1.7145233154296875, 1.7796630859375, 1.8448028564453125, 1.909942626953125, 1.9750823974609375, 2.04022216796875, 2.1053619384765625, 2.170501708984375, 2.2356414794921875, 2.30078125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 4.0, 8.0, 10.0, 30.0, 24.0, 66.0, 107.0, 158.0, 182.0, 167.0, 110.0, 68.0, 26.0, 18.0, 10.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003380775451660156, -0.00033030658960342407, -0.0003225356340408325, -0.00031476467847824097, -0.0003069937229156494, -0.00029922276735305786, -0.0002914518117904663, -0.00028368085622787476, -0.0002759099006652832, -0.00026813894510269165, -0.0002603679895401001, -0.00025259703397750854, -0.000244826078414917, -0.00023705512285232544, -0.0002292841672897339, -0.00022151321172714233, -0.00021374225616455078, -0.00020597130060195923, -0.00019820034503936768, -0.00019042938947677612, -0.00018265843391418457, -0.00017488747835159302, -0.00016711652278900146, -0.0001593455672264099, -0.00015157461166381836, -0.0001438036561012268, -0.00013603270053863525, -0.0001282617449760437, -0.00012049078941345215, -0.0001127198338508606, -0.00010494887828826904, -9.717792272567749e-05, -8.940696716308594e-05, -8.163601160049438e-05, -7.386505603790283e-05, -6.609410047531128e-05, -5.8323144912719727e-05, -5.0552189350128174e-05, -4.278123378753662e-05, -3.501027822494507e-05, -2.7239322662353516e-05, -1.9468367099761963e-05, -1.169741153717041e-05, -3.926455974578857e-06, 3.844499588012695e-06, 1.1615455150604248e-05, 1.93864107131958e-05, 2.7157366275787354e-05, 3.4928321838378906e-05, 4.269927740097046e-05, 5.047023296356201e-05, 5.8241188526153564e-05, 6.601214408874512e-05, 7.378309965133667e-05, 8.155405521392822e-05, 8.932501077651978e-05, 9.709596633911133e-05, 0.00010486692190170288, 0.00011263787746429443, 0.00012040883302688599, 0.00012817978858947754, 0.0001359507441520691, 0.00014372169971466064, 0.0001514926552772522, 0.00015926361083984375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 8.0, 10.0, 6.0, 12.0, 18.0, 20.0, 34.0, 57.0, 58.0, 117.0, 199.0, 447.0, 1229.0, 4327.0, 23546.0, 599909.0, 394944.0, 18061.0, 3575.0, 1099.0, 398.0, 161.0, 98.0, 90.0, 46.0, 23.0, 16.0, 13.0, 11.0, 10.0, 6.0, 4.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.15625, -2.10357666015625, -2.0509033203125, -1.99822998046875, -1.945556640625, -1.89288330078125, -1.8402099609375, -1.78753662109375, -1.73486328125, -1.68218994140625, -1.6295166015625, -1.57684326171875, -1.524169921875, -1.47149658203125, -1.4188232421875, -1.36614990234375, -1.3134765625, -1.26080322265625, -1.2081298828125, -1.15545654296875, -1.102783203125, -1.05010986328125, -0.9974365234375, -0.94476318359375, -0.89208984375, -0.83941650390625, -0.7867431640625, -0.73406982421875, -0.681396484375, -0.62872314453125, -0.5760498046875, -0.52337646484375, -0.470703125, -0.41802978515625, -0.3653564453125, -0.31268310546875, -0.260009765625, -0.20733642578125, -0.1546630859375, -0.10198974609375, -0.04931640625, 0.00335693359375, 0.0560302734375, 0.10870361328125, 0.161376953125, 0.21405029296875, 0.2667236328125, 0.31939697265625, 0.3720703125, 0.42474365234375, 0.4774169921875, 0.53009033203125, 0.582763671875, 0.63543701171875, 0.6881103515625, 0.74078369140625, 0.79345703125, 0.84613037109375, 0.8988037109375, 0.95147705078125, 1.004150390625, 1.05682373046875, 1.1094970703125, 1.16217041015625, 1.21484375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 8.0, 9.0, 6.0, 15.0, 27.0, 83.0, 142.0, 191.0, 177.0, 136.0, 89.0, 49.0, 30.0, 12.0, 10.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-3.337890625, -3.266998291015625, -3.19610595703125, -3.125213623046875, -3.0543212890625, -2.983428955078125, -2.91253662109375, -2.841644287109375, -2.770751953125, -2.699859619140625, -2.62896728515625, -2.558074951171875, -2.4871826171875, -2.416290283203125, -2.34539794921875, -2.274505615234375, -2.20361328125, -2.132720947265625, -2.06182861328125, -1.990936279296875, -1.9200439453125, -1.849151611328125, -1.77825927734375, -1.707366943359375, -1.636474609375, -1.565582275390625, -1.49468994140625, -1.423797607421875, -1.3529052734375, -1.282012939453125, -1.21112060546875, -1.140228271484375, -1.0693359375, -0.998443603515625, -0.92755126953125, -0.856658935546875, -0.7857666015625, -0.714874267578125, -0.64398193359375, -0.573089599609375, -0.502197265625, -0.431304931640625, -0.36041259765625, -0.289520263671875, -0.2186279296875, -0.147735595703125, -0.07684326171875, -0.005950927734375, 0.06494140625, 0.135833740234375, 0.20672607421875, 0.277618408203125, 0.3485107421875, 0.419403076171875, 0.49029541015625, 0.561187744140625, 0.632080078125, 0.702972412109375, 0.77386474609375, 0.844757080078125, 0.9156494140625, 0.986541748046875, 1.05743408203125, 1.128326416015625, 1.19921875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 2.0, 9.0, 14.0, 38.0, 87.0, 169.0, 237.0, 192.0, 149.0, 55.0, 26.0, 16.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.055191040039062, -18.141637802124023, -17.228084564208984, -16.314531326293945, -15.400978088378906, -14.487424850463867, -13.573872566223145, -12.660319328308105, -11.746766090393066, -10.833212852478027, -9.919659614562988, -9.006107330322266, -8.092554092407227, -7.179000377655029, -6.265447616577148, -5.351894378662109, -4.43834114074707, -3.5247879028320312, -2.6112349033355713, -1.6976819038391113, -0.7841286659240723, 0.1294245719909668, 1.0429773330688477, 1.9565305709838867, 2.870083808898926, 3.783637046813965, 4.697190284729004, 5.610743045806885, 6.524296283721924, 7.437849521636963, 8.351402282714844, 9.264955520629883, 10.178508758544922, 11.092061996459961, 12.005615234375, 12.919168472290039, 13.832721710205078, 14.746274948120117, 15.65982723236084, 16.573379516601562, 17.486934661865234, 18.400487899780273, 19.314041137695312, 20.22759437561035, 21.14114761352539, 22.05470085144043, 22.96825408935547, 23.881805419921875, 24.795358657836914, 25.708911895751953, 26.622465133666992, 27.53601837158203, 28.44957160949707, 29.36312484741211, 30.276676177978516, 31.190231323242188, 32.103782653808594, 33.017333984375, 33.93088912963867, 34.84444046020508, 35.75799560546875, 36.671546936035156, 37.58510208129883, 38.498653411865234, 39.412208557128906]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 3.0, 5.0, 2.0, 5.0, 14.0, 11.0, 11.0, 9.0, 21.0, 16.0, 30.0, 39.0, 30.0, 34.0, 38.0, 54.0, 59.0, 43.0, 51.0, 57.0, 50.0, 42.0, 53.0, 33.0, 41.0, 41.0, 23.0, 28.0, 24.0, 33.0, 24.0, 19.0, 14.0, 15.0, 5.0, 7.0, 6.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.899551391601562, -11.535235404968262, -11.170919418334961, -10.806602478027344, -10.442286491394043, -10.077970504760742, -9.713654518127441, -9.34933853149414, -8.985021591186523, -8.620705604553223, -8.256389617919922, -7.892073154449463, -7.527756690979004, -7.163440704345703, -6.799124717712402, -6.434808731079102, -6.070492744445801, -5.7061767578125, -5.341860294342041, -4.97754430770874, -4.613227844238281, -4.2489118576049805, -3.8845958709716797, -3.5202796459198, -3.15596342086792, -2.79164719581604, -2.42733097076416, -2.0630149841308594, -1.6986987590789795, -1.3343825340270996, -0.9700665473937988, -0.605750322341919, -0.24143505096435547, 0.12288111448287964, 0.48719727993011475, 0.8515133857727051, 1.215829610824585, 1.5801458358764648, 1.9444618225097656, 2.3087780475616455, 2.6730942726135254, 3.0374104976654053, 3.401726722717285, 3.766042709350586, 4.130358695983887, 4.494675159454346, 4.8589911460876465, 5.2233076095581055, 5.587623596191406, 5.951939582824707, 6.316256046295166, 6.680572032928467, 7.044888496398926, 7.409204483032227, 7.773520469665527, 8.137836456298828, 8.502153396606445, 8.866469383239746, 9.230785369873047, 9.595102310180664, 9.959418296813965, 10.323734283447266, 10.688050270080566, 11.052366256713867, 11.416682243347168]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 9.0, 11.0, 17.0, 25.0, 47.0, 43.0, 74.0, 142.0, 196.0, 400.0, 759.0, 1438.0, 3298.0, 9382.0, 54131.0, 4095279.0, 19096.0, 5416.0, 2199.0, 1022.0, 500.0, 298.0, 172.0, 114.0, 74.0, 45.0, 32.0, 16.0, 19.0, 14.0, 1.0, 5.0, 4.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.248046875, -2.168487548828125, -2.08892822265625, -2.009368896484375, -1.9298095703125, -1.850250244140625, -1.77069091796875, -1.691131591796875, -1.611572265625, -1.532012939453125, -1.45245361328125, -1.372894287109375, -1.2933349609375, -1.213775634765625, -1.13421630859375, -1.054656982421875, -0.97509765625, -0.895538330078125, -0.81597900390625, -0.736419677734375, -0.6568603515625, -0.577301025390625, -0.49774169921875, -0.418182373046875, -0.338623046875, -0.259063720703125, -0.17950439453125, -0.099945068359375, -0.0203857421875, 0.059173583984375, 0.13873291015625, 0.218292236328125, 0.2978515625, 0.377410888671875, 0.45697021484375, 0.536529541015625, 0.6160888671875, 0.695648193359375, 0.77520751953125, 0.854766845703125, 0.934326171875, 1.013885498046875, 1.09344482421875, 1.173004150390625, 1.2525634765625, 1.332122802734375, 1.41168212890625, 1.491241455078125, 1.57080078125, 1.650360107421875, 1.72991943359375, 1.809478759765625, 1.8890380859375, 1.968597412109375, 2.04815673828125, 2.127716064453125, 2.207275390625, 2.286834716796875, 2.36639404296875, 2.445953369140625, 2.5255126953125, 2.605072021484375, 2.68463134765625, 2.764190673828125, 2.84375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 7.0, 7.0, 10.0, 17.0, 24.0, 35.0, 34.0, 50.0, 80.0, 79.0, 108.0, 108.0, 98.0, 81.0, 73.0, 59.0, 45.0, 33.0, 22.0, 17.0, 5.0, 3.0, 3.0, 9.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0107421875, -0.9796981811523438, -0.9486541748046875, -0.9176101684570312, -0.886566162109375, -0.8555221557617188, -0.8244781494140625, -0.7934341430664062, -0.76239013671875, -0.7313461303710938, -0.7003021240234375, -0.6692581176757812, -0.638214111328125, -0.6071701049804688, -0.5761260986328125, -0.5450820922851562, -0.5140380859375, -0.48299407958984375, -0.4519500732421875, -0.42090606689453125, -0.389862060546875, -0.35881805419921875, -0.3277740478515625, -0.29673004150390625, -0.26568603515625, -0.23464202880859375, -0.2035980224609375, -0.17255401611328125, -0.141510009765625, -0.11046600341796875, -0.0794219970703125, -0.04837799072265625, -0.017333984375, 0.01371002197265625, 0.0447540283203125, 0.07579803466796875, 0.106842041015625, 0.13788604736328125, 0.1689300537109375, 0.19997406005859375, 0.23101806640625, 0.26206207275390625, 0.2931060791015625, 0.32415008544921875, 0.355194091796875, 0.38623809814453125, 0.4172821044921875, 0.44832611083984375, 0.4793701171875, 0.5104141235351562, 0.5414581298828125, 0.5725021362304688, 0.603546142578125, 0.6345901489257812, 0.6656341552734375, 0.6966781616210938, 0.72772216796875, 0.7587661743164062, 0.7898101806640625, 0.8208541870117188, 0.851898193359375, 0.8829421997070312, 0.9139862060546875, 0.9450302124023438, 0.97607421875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 7.0, 7.0, 10.0, 9.0, 11.0, 33.0, 35.0, 71.0, 74.0, 104.0, 177.0, 252.0, 471.0, 1065.0, 2525.0, 7156.0, 29387.0, 4053305.0, 79791.0, 12600.0, 3941.0, 1520.0, 723.0, 340.0, 203.0, 133.0, 100.0, 68.0, 50.0, 42.0, 29.0, 17.0, 8.0, 9.0, 4.0, 5.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.984375, -2.9052734375, -2.826171875, -2.7470703125, -2.66796875, -2.5888671875, -2.509765625, -2.4306640625, -2.3515625, -2.2724609375, -2.193359375, -2.1142578125, -2.03515625, -1.9560546875, -1.876953125, -1.7978515625, -1.71875, -1.6396484375, -1.560546875, -1.4814453125, -1.40234375, -1.3232421875, -1.244140625, -1.1650390625, -1.0859375, -1.0068359375, -0.927734375, -0.8486328125, -0.76953125, -0.6904296875, -0.611328125, -0.5322265625, -0.453125, -0.3740234375, -0.294921875, -0.2158203125, -0.13671875, -0.0576171875, 0.021484375, 0.1005859375, 0.1796875, 0.2587890625, 0.337890625, 0.4169921875, 0.49609375, 0.5751953125, 0.654296875, 0.7333984375, 0.8125, 0.8916015625, 0.970703125, 1.0498046875, 1.12890625, 1.2080078125, 1.287109375, 1.3662109375, 1.4453125, 1.5244140625, 1.603515625, 1.6826171875, 1.76171875, 1.8408203125, 1.919921875, 1.9990234375, 2.078125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 8.0, 13.0, 15.0, 30.0, 66.0, 3743.0, 104.0, 42.0, 22.0, 14.0, 8.0, 5.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.393310546875, -0.3697242736816406, -0.34613800048828125, -0.3225517272949219, -0.2989654541015625, -0.2753791809082031, -0.25179290771484375, -0.22820663452148438, -0.204620361328125, -0.18103408813476562, -0.15744781494140625, -0.13386154174804688, -0.1102752685546875, -0.08668899536132812, -0.06310272216796875, -0.039516448974609375, -0.01593017578125, 0.007656097412109375, 0.03124237060546875, 0.054828643798828125, 0.0784149169921875, 0.10200119018554688, 0.12558746337890625, 0.14917373657226562, 0.172760009765625, 0.19634628295898438, 0.21993255615234375, 0.24351882934570312, 0.2671051025390625, 0.2906913757324219, 0.31427764892578125, 0.3378639221191406, 0.3614501953125, 0.3850364685058594, 0.40862274169921875, 0.4322090148925781, 0.4557952880859375, 0.4793815612792969, 0.5029678344726562, 0.5265541076660156, 0.550140380859375, 0.5737266540527344, 0.5973129272460938, 0.6208992004394531, 0.6444854736328125, 0.6680717468261719, 0.6916580200195312, 0.7152442932128906, 0.73883056640625, 0.7624168395996094, 0.7860031127929688, 0.8095893859863281, 0.8331756591796875, 0.8567619323730469, 0.8803482055664062, 0.9039344787597656, 0.927520751953125, 0.9511070251464844, 0.9746932983398438, 0.9982795715332031, 1.0218658447265625, 1.0454521179199219, 1.0690383911132812, 1.0926246643066406, 1.1162109375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 13.0, 37.0, 140.0, 343.0, 275.0, 138.0, 43.0, 20.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.988763332366943, -5.83800745010376, -5.687251567840576, -5.536495685577393, -5.385740280151367, -5.234984397888184, -5.084228515625, -4.933472633361816, -4.782716751098633, -4.631960868835449, -4.481204986572266, -4.330449104309082, -4.179693222045898, -4.028937816619873, -3.8781819343566895, -3.727426052093506, -3.5766701698303223, -3.4259142875671387, -3.275158405303955, -3.1244027614593506, -2.973646879196167, -2.8228909969329834, -2.672135353088379, -2.5213794708251953, -2.3706235885620117, -2.219867706298828, -2.0691118240356445, -1.91835618019104, -1.7676002979278564, -1.6168444156646729, -1.4660886526107788, -1.3153328895568848, -1.164576530456543, -1.0138206481933594, -0.8630648851394653, -0.7123090624809265, -0.5615532398223877, -0.4107974171638489, -0.26004159450531006, -0.10928583145141602, 0.04147005081176758, 0.1922258734703064, 0.3429816961288452, 0.49373751878738403, 0.6444933414459229, 0.7952491641044617, 0.9460049867630005, 1.0967607498168945, 1.2475166320800781, 1.3982725143432617, 1.5490282773971558, 1.6997840404510498, 1.8505399227142334, 2.001295804977417, 2.1520514488220215, 2.302807331085205, 2.4535632133483887, 2.6043190956115723, 2.755074977874756, 2.9058306217193604, 3.056586503982544, 3.2073423862457275, 3.358098030090332, 3.5088539123535156, 3.659609794616699]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 5.0, 4.0, 2.0, 4.0, 8.0, 6.0, 14.0, 6.0, 11.0, 23.0, 21.0, 27.0, 29.0, 17.0, 45.0, 43.0, 40.0, 39.0, 41.0, 38.0, 44.0, 42.0, 34.0, 39.0, 33.0, 46.0, 33.0, 41.0, 40.0, 27.0, 25.0, 27.0, 26.0, 20.0, 25.0, 17.0, 11.0, 12.0, 6.0, 11.0, 7.0, 8.0, 2.0, 2.0, 0.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.998574435710907, -0.9680328369140625, -0.9374912977218628, -0.9069497585296631, -0.8764081597328186, -0.8458665609359741, -0.8153250217437744, -0.7847834825515747, -0.7542418837547302, -0.7237002849578857, -0.693158745765686, -0.6626172065734863, -0.6320756077766418, -0.6015340089797974, -0.5709924697875977, -0.540450930595398, -0.5099093317985535, -0.47936776280403137, -0.4488261938095093, -0.4182846248149872, -0.3877430558204651, -0.357201486825943, -0.3266599178314209, -0.2961183488368988, -0.2655767798423767, -0.23503521084785461, -0.20449364185333252, -0.17395207285881042, -0.14341050386428833, -0.11286893486976624, -0.08232736587524414, -0.051785796880722046, -0.02124422788619995, 0.009297341108322144, 0.03983891010284424, 0.07038047909736633, 0.10092204809188843, 0.13146361708641052, 0.16200518608093262, 0.1925467550754547, 0.2230883240699768, 0.2536298930644989, 0.284171462059021, 0.3147130310535431, 0.3452546000480652, 0.3757961690425873, 0.4063377380371094, 0.43687930703163147, 0.46742087602615356, 0.49796244502067566, 0.5285040140151978, 0.5590455532073975, 0.5895871520042419, 0.6201287508010864, 0.6506702899932861, 0.6812118291854858, 0.7117534279823303, 0.7422950267791748, 0.7728365659713745, 0.8033781051635742, 0.8339197039604187, 0.8644613027572632, 0.8950028419494629, 0.9255443811416626, 0.9560859799385071]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 6.0, 6.0, 11.0, 9.0, 33.0, 35.0, 53.0, 91.0, 193.0, 352.0, 746.0, 1516.0, 3649.0, 10522.0, 37583.0, 176774.0, 519201.0, 229328.0, 47665.0, 12790.0, 4449.0, 1823.0, 815.0, 410.0, 195.0, 132.0, 65.0, 36.0, 17.0, 22.0, 10.0, 10.0, 7.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.1640625, -2.0996246337890625, -2.035186767578125, -1.9707489013671875, -1.90631103515625, -1.8418731689453125, -1.777435302734375, -1.7129974365234375, -1.6485595703125, -1.5841217041015625, -1.519683837890625, -1.4552459716796875, -1.39080810546875, -1.3263702392578125, -1.261932373046875, -1.1974945068359375, -1.133056640625, -1.0686187744140625, -1.004180908203125, -0.9397430419921875, -0.87530517578125, -0.8108673095703125, -0.746429443359375, -0.6819915771484375, -0.6175537109375, -0.5531158447265625, -0.488677978515625, -0.4242401123046875, -0.35980224609375, -0.2953643798828125, -0.230926513671875, -0.1664886474609375, -0.10205078125, -0.0376129150390625, 0.026824951171875, 0.0912628173828125, 0.15570068359375, 0.2201385498046875, 0.284576416015625, 0.3490142822265625, 0.4134521484375, 0.4778900146484375, 0.542327880859375, 0.6067657470703125, 0.67120361328125, 0.7356414794921875, 0.800079345703125, 0.8645172119140625, 0.928955078125, 0.9933929443359375, 1.057830810546875, 1.1222686767578125, 1.18670654296875, 1.2511444091796875, 1.315582275390625, 1.3800201416015625, 1.4444580078125, 1.5088958740234375, 1.573333740234375, 1.6377716064453125, 1.70220947265625, 1.7666473388671875, 1.831085205078125, 1.8955230712890625, 1.9599609375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 11.0, 13.0, 6.0, 18.0, 25.0, 39.0, 45.0, 62.0, 75.0, 89.0, 92.0, 104.0, 94.0, 70.0, 69.0, 62.0, 37.0, 29.0, 25.0, 14.0, 10.0, 8.0, 5.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1259765625, -1.0931854248046875, -1.060394287109375, -1.0276031494140625, -0.99481201171875, -0.9620208740234375, -0.929229736328125, -0.8964385986328125, -0.8636474609375, -0.8308563232421875, -0.798065185546875, -0.7652740478515625, -0.73248291015625, -0.6996917724609375, -0.666900634765625, -0.6341094970703125, -0.601318359375, -0.5685272216796875, -0.535736083984375, -0.5029449462890625, -0.47015380859375, -0.4373626708984375, -0.404571533203125, -0.3717803955078125, -0.3389892578125, -0.3061981201171875, -0.273406982421875, -0.2406158447265625, -0.20782470703125, -0.1750335693359375, -0.142242431640625, -0.1094512939453125, -0.07666015625, -0.0438690185546875, -0.011077880859375, 0.0217132568359375, 0.05450439453125, 0.0872955322265625, 0.120086669921875, 0.1528778076171875, 0.1856689453125, 0.2184600830078125, 0.251251220703125, 0.2840423583984375, 0.31683349609375, 0.3496246337890625, 0.382415771484375, 0.4152069091796875, 0.447998046875, 0.4807891845703125, 0.513580322265625, 0.5463714599609375, 0.57916259765625, 0.6119537353515625, 0.644744873046875, 0.6775360107421875, 0.7103271484375, 0.7431182861328125, 0.775909423828125, 0.8087005615234375, 0.84149169921875, 0.8742828369140625, 0.907073974609375, 0.9398651123046875, 0.97265625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 5.0, 11.0, 21.0, 23.0, 53.0, 85.0, 169.0, 262.0, 532.0, 1233.0, 3648.0, 18914.0, 259042.0, 701770.0, 52358.0, 6961.0, 1917.0, 739.0, 335.0, 214.0, 108.0, 54.0, 39.0, 27.0, 17.0, 7.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.296875, -3.1976318359375, -3.098388671875, -2.9991455078125, -2.89990234375, -2.8006591796875, -2.701416015625, -2.6021728515625, -2.5029296875, -2.4036865234375, -2.304443359375, -2.2052001953125, -2.10595703125, -2.0067138671875, -1.907470703125, -1.8082275390625, -1.708984375, -1.6097412109375, -1.510498046875, -1.4112548828125, -1.31201171875, -1.2127685546875, -1.113525390625, -1.0142822265625, -0.9150390625, -0.8157958984375, -0.716552734375, -0.6173095703125, -0.51806640625, -0.4188232421875, -0.319580078125, -0.2203369140625, -0.12109375, -0.0218505859375, 0.077392578125, 0.1766357421875, 0.27587890625, 0.3751220703125, 0.474365234375, 0.5736083984375, 0.6728515625, 0.7720947265625, 0.871337890625, 0.9705810546875, 1.06982421875, 1.1690673828125, 1.268310546875, 1.3675537109375, 1.466796875, 1.5660400390625, 1.665283203125, 1.7645263671875, 1.86376953125, 1.9630126953125, 2.062255859375, 2.1614990234375, 2.2607421875, 2.3599853515625, 2.459228515625, 2.5584716796875, 2.65771484375, 2.7569580078125, 2.856201171875, 2.9554443359375, 3.0546875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 8.0, 8.0, 3.0, 12.0, 13.0, 13.0, 21.0, 23.0, 26.0, 26.0, 44.0, 47.0, 51.0, 55.0, 56.0, 50.0, 44.0, 68.0, 63.0, 50.0, 55.0, 38.0, 46.0, 30.0, 35.0, 27.0, 15.0, 18.0, 10.0, 16.0, 11.0, 6.0, 6.0, 5.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.703125, -2.607452392578125, -2.51177978515625, -2.416107177734375, -2.3204345703125, -2.224761962890625, -2.12908935546875, -2.033416748046875, -1.937744140625, -1.842071533203125, -1.74639892578125, -1.650726318359375, -1.5550537109375, -1.459381103515625, -1.36370849609375, -1.268035888671875, -1.17236328125, -1.076690673828125, -0.98101806640625, -0.885345458984375, -0.7896728515625, -0.694000244140625, -0.59832763671875, -0.502655029296875, -0.406982421875, -0.311309814453125, -0.21563720703125, -0.119964599609375, -0.0242919921875, 0.071380615234375, 0.16705322265625, 0.262725830078125, 0.3583984375, 0.454071044921875, 0.54974365234375, 0.645416259765625, 0.7410888671875, 0.836761474609375, 0.93243408203125, 1.028106689453125, 1.123779296875, 1.219451904296875, 1.31512451171875, 1.410797119140625, 1.5064697265625, 1.602142333984375, 1.69781494140625, 1.793487548828125, 1.88916015625, 1.984832763671875, 2.08050537109375, 2.176177978515625, 2.2718505859375, 2.367523193359375, 2.46319580078125, 2.558868408203125, 2.654541015625, 2.750213623046875, 2.84588623046875, 2.941558837890625, 3.0372314453125, 3.132904052734375, 3.22857666015625, 3.324249267578125, 3.419921875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 2.0, 1.0, 4.0, 5.0, 10.0, 15.0, 21.0, 51.0, 82.0, 176.0, 428.0, 1141.0, 4139.0, 35126.0, 930754.0, 68601.0, 5718.0, 1398.0, 468.0, 193.0, 99.0, 50.0, 23.0, 15.0, 16.0, 5.0, 7.0, 2.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.255859375, -3.1756591796875, -3.095458984375, -3.0152587890625, -2.93505859375, -2.8548583984375, -2.774658203125, -2.6944580078125, -2.6142578125, -2.5340576171875, -2.453857421875, -2.3736572265625, -2.29345703125, -2.2132568359375, -2.133056640625, -2.0528564453125, -1.97265625, -1.8924560546875, -1.812255859375, -1.7320556640625, -1.65185546875, -1.5716552734375, -1.491455078125, -1.4112548828125, -1.3310546875, -1.2508544921875, -1.170654296875, -1.0904541015625, -1.01025390625, -0.9300537109375, -0.849853515625, -0.7696533203125, -0.689453125, -0.6092529296875, -0.529052734375, -0.4488525390625, -0.36865234375, -0.2884521484375, -0.208251953125, -0.1280517578125, -0.0478515625, 0.0323486328125, 0.112548828125, 0.1927490234375, 0.27294921875, 0.3531494140625, 0.433349609375, 0.5135498046875, 0.59375, 0.6739501953125, 0.754150390625, 0.8343505859375, 0.91455078125, 0.9947509765625, 1.074951171875, 1.1551513671875, 1.2353515625, 1.3155517578125, 1.395751953125, 1.4759521484375, 1.55615234375, 1.6363525390625, 1.716552734375, 1.7967529296875, 1.876953125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 8.0, 9.0, 7.0, 24.0, 43.0, 70.0, 137.0, 204.0, 207.0, 135.0, 84.0, 36.0, 16.0, 7.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000324249267578125, -0.00031340867280960083, -0.00030256807804107666, -0.0002917274832725525, -0.0002808868885040283, -0.00027004629373550415, -0.00025920569896698, -0.0002483651041984558, -0.00023752450942993164, -0.00022668391466140747, -0.0002158433198928833, -0.00020500272512435913, -0.00019416213035583496, -0.0001833215355873108, -0.00017248094081878662, -0.00016164034605026245, -0.00015079975128173828, -0.0001399591565132141, -0.00012911856174468994, -0.00011827796697616577, -0.0001074373722076416, -9.659677743911743e-05, -8.575618267059326e-05, -7.491558790206909e-05, -6.407499313354492e-05, -5.323439836502075e-05, -4.239380359649658e-05, -3.155320882797241e-05, -2.0712614059448242e-05, -9.872019290924072e-06, 9.685754776000977e-07, 1.1809170246124268e-05, 2.2649765014648438e-05, 3.349035978317261e-05, 4.433095455169678e-05, 5.517154932022095e-05, 6.601214408874512e-05, 7.685273885726929e-05, 8.769333362579346e-05, 9.853392839431763e-05, 0.0001093745231628418, 0.00012021511793136597, 0.00013105571269989014, 0.0001418963074684143, 0.00015273690223693848, 0.00016357749700546265, 0.00017441809177398682, 0.00018525868654251099, 0.00019609928131103516, 0.00020693987607955933, 0.0002177804708480835, 0.00022862106561660767, 0.00023946166038513184, 0.000250302255153656, 0.0002611428499221802, 0.00027198344469070435, 0.0002828240394592285, 0.0002936646342277527, 0.00030450522899627686, 0.000315345823764801, 0.0003261864185333252, 0.00033702701330184937, 0.00034786760807037354, 0.0003587082028388977, 0.0003695487976074219]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 5.0, 4.0, 11.0, 14.0, 18.0, 14.0, 30.0, 39.0, 83.0, 107.0, 176.0, 288.0, 488.0, 924.0, 1735.0, 3686.0, 9150.0, 35437.0, 422761.0, 515914.0, 39976.0, 9954.0, 3828.0, 1683.0, 935.0, 491.0, 269.0, 184.0, 113.0, 75.0, 42.0, 41.0, 25.0, 12.0, 8.0, 11.0, 6.0, 6.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-1.515625, -1.474700927734375, -1.43377685546875, -1.392852783203125, -1.3519287109375, -1.311004638671875, -1.27008056640625, -1.229156494140625, -1.188232421875, -1.147308349609375, -1.10638427734375, -1.065460205078125, -1.0245361328125, -0.983612060546875, -0.94268798828125, -0.901763916015625, -0.86083984375, -0.819915771484375, -0.77899169921875, -0.738067626953125, -0.6971435546875, -0.656219482421875, -0.61529541015625, -0.574371337890625, -0.533447265625, -0.492523193359375, -0.45159912109375, -0.410675048828125, -0.3697509765625, -0.328826904296875, -0.28790283203125, -0.246978759765625, -0.2060546875, -0.165130615234375, -0.12420654296875, -0.083282470703125, -0.0423583984375, -0.001434326171875, 0.03948974609375, 0.080413818359375, 0.121337890625, 0.162261962890625, 0.20318603515625, 0.244110107421875, 0.2850341796875, 0.325958251953125, 0.36688232421875, 0.407806396484375, 0.44873046875, 0.489654541015625, 0.53057861328125, 0.571502685546875, 0.6124267578125, 0.653350830078125, 0.69427490234375, 0.735198974609375, 0.776123046875, 0.817047119140625, 0.85797119140625, 0.898895263671875, 0.9398193359375, 0.980743408203125, 1.02166748046875, 1.062591552734375, 1.103515625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 7.0, 4.0, 4.0, 6.0, 11.0, 14.0, 36.0, 65.0, 137.0, 171.0, 203.0, 142.0, 77.0, 47.0, 15.0, 6.0, 14.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 3.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.37109375, -2.28717041015625, -2.2032470703125, -2.11932373046875, -2.035400390625, -1.95147705078125, -1.8675537109375, -1.78363037109375, -1.69970703125, -1.61578369140625, -1.5318603515625, -1.44793701171875, -1.364013671875, -1.28009033203125, -1.1961669921875, -1.11224365234375, -1.0283203125, -0.94439697265625, -0.8604736328125, -0.77655029296875, -0.692626953125, -0.60870361328125, -0.5247802734375, -0.44085693359375, -0.35693359375, -0.27301025390625, -0.1890869140625, -0.10516357421875, -0.021240234375, 0.06268310546875, 0.1466064453125, 0.23052978515625, 0.314453125, 0.39837646484375, 0.4822998046875, 0.56622314453125, 0.650146484375, 0.73406982421875, 0.8179931640625, 0.90191650390625, 0.98583984375, 1.06976318359375, 1.1536865234375, 1.23760986328125, 1.321533203125, 1.40545654296875, 1.4893798828125, 1.57330322265625, 1.6572265625, 1.74114990234375, 1.8250732421875, 1.90899658203125, 1.992919921875, 2.07684326171875, 2.1607666015625, 2.24468994140625, 2.32861328125, 2.41253662109375, 2.4964599609375, 2.58038330078125, 2.664306640625, 2.74822998046875, 2.8321533203125, 2.91607666015625, 3.0]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 11.0, 20.0, 28.0, 64.0, 106.0, 138.0, 144.0, 143.0, 118.0, 78.0, 63.0, 36.0, 32.0, 11.0, 8.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.128128051757812, -23.487226486206055, -22.846324920654297, -22.20542335510254, -21.56452178955078, -20.923620223999023, -20.282718658447266, -19.641815185546875, -19.00091552734375, -18.360013961791992, -17.719112396240234, -17.078210830688477, -16.43730926513672, -15.796407699584961, -15.155505180358887, -14.514603614807129, -13.873701095581055, -13.232799530029297, -12.591897964477539, -11.950996398925781, -11.310094833374023, -10.669193267822266, -10.028290748596191, -9.387389183044434, -8.746487617492676, -8.105586051940918, -7.46468448638916, -6.823782444000244, -6.182880878448486, -5.5419793128967285, -4.9010772705078125, -4.260175704956055, -3.619274139404297, -2.978372573852539, -2.337470769882202, -1.6965690851211548, -1.0556674003601074, -0.4147658348083496, 0.2261359691619873, 0.8670377731323242, 1.507939338684082, 2.14884090423584, 2.7897427082061768, 3.4306445121765137, 4.0715460777282715, 4.712447643280029, 5.353349685668945, 5.994251251220703, 6.635152816772461, 7.276054382324219, 7.916955947875977, 8.557857513427734, 9.198759078979492, 9.83966064453125, 10.480563163757324, 11.121464729309082, 11.76236629486084, 12.403267860412598, 13.044169425964355, 13.685070991516113, 14.325973510742188, 14.966875076293945, 15.607776641845703, 16.24867820739746, 16.88957977294922]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 5.0, 1.0, 4.0, 5.0, 3.0, 7.0, 9.0, 10.0, 14.0, 13.0, 18.0, 15.0, 21.0, 32.0, 36.0, 31.0, 19.0, 34.0, 23.0, 53.0, 36.0, 43.0, 39.0, 51.0, 43.0, 31.0, 34.0, 37.0, 43.0, 31.0, 32.0, 29.0, 19.0, 16.0, 27.0, 27.0, 14.0, 13.0, 19.0, 12.0, 13.0, 14.0, 8.0, 4.0, 7.0, 6.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.500033378601074, -12.127107620239258, -11.754181861877441, -11.381256103515625, -11.008330345153809, -10.635404586791992, -10.26247787475586, -9.88955307006836, -9.516626358032227, -9.14370059967041, -8.770774841308594, -8.397849082946777, -8.024923324584961, -7.6519975662231445, -7.27907133102417, -6.9061455726623535, -6.533220291137695, -6.160294532775879, -5.7873687744140625, -5.414443016052246, -5.04151725769043, -4.668591499328613, -4.295665264129639, -3.9227395057678223, -3.549813747406006, -3.1768879890441895, -2.803962230682373, -2.4310362339019775, -2.058110475540161, -1.6851847171783447, -1.3122587203979492, -0.9393329620361328, -0.5664081573486328, -0.19348233938217163, 0.17944347858428955, 0.5523693561553955, 0.9252951145172119, 1.2982208728790283, 1.6711468696594238, 2.0440726280212402, 2.4169983863830566, 2.789924144744873, 3.1628499031066895, 3.535775899887085, 3.9087016582489014, 4.281627655029297, 4.654553413391113, 5.02747917175293, 5.400404930114746, 5.7733306884765625, 6.146256446838379, 6.519182205200195, 6.892107963562012, 7.265033721923828, 7.637959957122803, 8.010885238647461, 8.383811950683594, 8.75673770904541, 9.129663467407227, 9.502589225769043, 9.87551498413086, 10.248440742492676, 10.621366500854492, 10.994293212890625, 11.367218017578125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 1.0, 9.0, 3.0, 3.0, 3.0, 8.0, 7.0, 17.0, 27.0, 24.0, 33.0, 53.0, 78.0, 130.0, 244.0, 352.0, 753.0, 1698.0, 4619.0, 16677.0, 115503.0, 3993591.0, 45691.0, 9351.0, 2974.0, 1166.0, 521.0, 252.0, 152.0, 101.0, 68.0, 43.0, 33.0, 27.0, 18.0, 12.0, 10.0, 3.0, 6.0, 5.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-2.68359375, -2.6053466796875, -2.527099609375, -2.4488525390625, -2.37060546875, -2.2923583984375, -2.214111328125, -2.1358642578125, -2.0576171875, -1.9793701171875, -1.901123046875, -1.8228759765625, -1.74462890625, -1.6663818359375, -1.588134765625, -1.5098876953125, -1.431640625, -1.3533935546875, -1.275146484375, -1.1968994140625, -1.11865234375, -1.0404052734375, -0.962158203125, -0.8839111328125, -0.8056640625, -0.7274169921875, -0.649169921875, -0.5709228515625, -0.49267578125, -0.4144287109375, -0.336181640625, -0.2579345703125, -0.1796875, -0.1014404296875, -0.023193359375, 0.0550537109375, 0.13330078125, 0.2115478515625, 0.289794921875, 0.3680419921875, 0.4462890625, 0.5245361328125, 0.602783203125, 0.6810302734375, 0.75927734375, 0.8375244140625, 0.915771484375, 0.9940185546875, 1.072265625, 1.1505126953125, 1.228759765625, 1.3070068359375, 1.38525390625, 1.4635009765625, 1.541748046875, 1.6199951171875, 1.6982421875, 1.7764892578125, 1.854736328125, 1.9329833984375, 2.01123046875, 2.0894775390625, 2.167724609375, 2.2459716796875, 2.32421875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 6.0, 10.0, 6.0, 17.0, 19.0, 25.0, 29.0, 35.0, 48.0, 48.0, 47.0, 47.0, 47.0, 65.0, 59.0, 49.0, 62.0, 53.0, 46.0, 45.0, 41.0, 24.0, 27.0, 22.0, 22.0, 20.0, 10.0, 11.0, 11.0, 6.0, 8.0, 8.0, 3.0, 6.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.701171875, -0.6803817749023438, -0.6595916748046875, -0.6388015747070312, -0.618011474609375, -0.5972213745117188, -0.5764312744140625, -0.5556411743164062, -0.53485107421875, -0.5140609741210938, -0.4932708740234375, -0.47248077392578125, -0.451690673828125, -0.43090057373046875, -0.4101104736328125, -0.38932037353515625, -0.3685302734375, -0.34774017333984375, -0.3269500732421875, -0.30615997314453125, -0.285369873046875, -0.26457977294921875, -0.2437896728515625, -0.22299957275390625, -0.20220947265625, -0.18141937255859375, -0.1606292724609375, -0.13983917236328125, -0.119049072265625, -0.09825897216796875, -0.0774688720703125, -0.05667877197265625, -0.035888671875, -0.01509857177734375, 0.0056915283203125, 0.02648162841796875, 0.047271728515625, 0.06806182861328125, 0.0888519287109375, 0.10964202880859375, 0.13043212890625, 0.15122222900390625, 0.1720123291015625, 0.19280242919921875, 0.213592529296875, 0.23438262939453125, 0.2551727294921875, 0.27596282958984375, 0.2967529296875, 0.31754302978515625, 0.3383331298828125, 0.35912322998046875, 0.379913330078125, 0.40070343017578125, 0.4214935302734375, 0.44228363037109375, 0.46307373046875, 0.48386383056640625, 0.5046539306640625, 0.5254440307617188, 0.546234130859375, 0.5670242309570312, 0.5878143310546875, 0.6086044311523438, 0.62939453125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 7.0, 4.0, 4.0, 7.0, 6.0, 9.0, 11.0, 19.0, 33.0, 32.0, 37.0, 42.0, 64.0, 86.0, 99.0, 156.0, 208.0, 271.0, 530.0, 2414.0, 56787.0, 4120617.0, 10352.0, 1153.0, 383.0, 226.0, 164.0, 133.0, 108.0, 86.0, 62.0, 36.0, 29.0, 26.0, 23.0, 19.0, 12.0, 14.0, 4.0, 6.0, 2.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.625, -8.3734130859375, -8.121826171875, -7.8702392578125, -7.61865234375, -7.3670654296875, -7.115478515625, -6.8638916015625, -6.6123046875, -6.3607177734375, -6.109130859375, -5.8575439453125, -5.60595703125, -5.3543701171875, -5.102783203125, -4.8511962890625, -4.599609375, -4.3480224609375, -4.096435546875, -3.8448486328125, -3.59326171875, -3.3416748046875, -3.090087890625, -2.8385009765625, -2.5869140625, -2.3353271484375, -2.083740234375, -1.8321533203125, -1.58056640625, -1.3289794921875, -1.077392578125, -0.8258056640625, -0.57421875, -0.3226318359375, -0.071044921875, 0.1805419921875, 0.43212890625, 0.6837158203125, 0.935302734375, 1.1868896484375, 1.4384765625, 1.6900634765625, 1.941650390625, 2.1932373046875, 2.44482421875, 2.6964111328125, 2.947998046875, 3.1995849609375, 3.451171875, 3.7027587890625, 3.954345703125, 4.2059326171875, 4.45751953125, 4.7091064453125, 4.960693359375, 5.2122802734375, 5.4638671875, 5.7154541015625, 5.967041015625, 6.2186279296875, 6.47021484375, 6.7218017578125, 6.973388671875, 7.2249755859375, 7.4765625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 18.0, 28.0, 114.0, 3492.0, 300.0, 81.0, 25.0, 8.0, 3.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0], "bins": [-4.86328125, -4.7711181640625, -4.678955078125, -4.5867919921875, -4.49462890625, -4.4024658203125, -4.310302734375, -4.2181396484375, -4.1259765625, -4.0338134765625, -3.941650390625, -3.8494873046875, -3.75732421875, -3.6651611328125, -3.572998046875, -3.4808349609375, -3.388671875, -3.2965087890625, -3.204345703125, -3.1121826171875, -3.02001953125, -2.9278564453125, -2.835693359375, -2.7435302734375, -2.6513671875, -2.5592041015625, -2.467041015625, -2.3748779296875, -2.28271484375, -2.1905517578125, -2.098388671875, -2.0062255859375, -1.9140625, -1.8218994140625, -1.729736328125, -1.6375732421875, -1.54541015625, -1.4532470703125, -1.361083984375, -1.2689208984375, -1.1767578125, -1.0845947265625, -0.992431640625, -0.9002685546875, -0.80810546875, -0.7159423828125, -0.623779296875, -0.5316162109375, -0.439453125, -0.3472900390625, -0.255126953125, -0.1629638671875, -0.07080078125, 0.0213623046875, 0.113525390625, 0.2056884765625, 0.2978515625, 0.3900146484375, 0.482177734375, 0.5743408203125, 0.66650390625, 0.7586669921875, 0.850830078125, 0.9429931640625, 1.03515625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 8.0, 5.0, 15.0, 20.0, 37.0, 42.0, 89.0, 138.0, 157.0, 159.0, 129.0, 82.0, 57.0, 22.0, 19.0, 8.0, 6.0, 6.0, 1.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.920400619506836, -8.658134460449219, -8.395867347717285, -8.133601188659668, -7.871334552764893, -7.609067916870117, -7.3468017578125, -7.084535121917725, -6.822268486022949, -6.560001850128174, -6.297735214233398, -6.035469055175781, -5.773202419281006, -5.5109357833862305, -5.248669624328613, -4.986402988433838, -4.7241363525390625, -4.461869716644287, -4.199603080749512, -3.9373369216918945, -3.675070285797119, -3.4128036499023438, -3.1505372524261475, -2.888270854949951, -2.626004219055176, -2.3637375831604004, -2.101471185684204, -1.8392046689987183, -1.5769381523132324, -1.3146716356277466, -1.0524051189422607, -0.7901386022567749, -0.5278730392456055, -0.26560652256011963, -0.003340005874633789, 0.25892651081085205, 0.5211930274963379, 0.7834595441818237, 1.0457260608673096, 1.3079925775527954, 1.5702590942382812, 1.832525610923767, 2.094792127609253, 2.357058525085449, 2.6193251609802246, 2.881591796875, 3.1438581943511963, 3.4061245918273926, 3.668391227722168, 3.9306578636169434, 4.192924499511719, 4.455190658569336, 4.717457294464111, 4.979723930358887, 5.241990089416504, 5.504256725311279, 5.766523361206055, 6.02878999710083, 6.2910566329956055, 6.553322792053223, 6.815589427947998, 7.077856063842773, 7.340122222900391, 7.602388858795166, 7.864655494689941]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 5.0, 11.0, 7.0, 22.0, 52.0, 46.0, 60.0, 84.0, 86.0, 99.0, 110.0, 107.0, 84.0, 58.0, 54.0, 35.0, 24.0, 16.0, 17.0, 12.0, 3.0, 7.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.068631172180176, -6.798524856567383, -6.528418064117432, -6.2583112716674805, -5.9882049560546875, -5.7180986404418945, -5.447991847991943, -5.177885055541992, -4.907778739929199, -4.637672424316406, -4.367565631866455, -4.097458839416504, -3.827352523803711, -3.557245969772339, -3.287139415740967, -3.0170328617095947, -2.7469263076782227, -2.4768197536468506, -2.2067131996154785, -1.9366066455841064, -1.6665000915527344, -1.3963935375213623, -1.1262869834899902, -0.8561804294586182, -0.5860738754272461, -0.315967321395874, -0.04586076736450195, 0.22424578666687012, 0.4943523406982422, 0.7644588947296143, 1.0345654487609863, 1.3046720027923584, 1.574777603149414, 1.8448841571807861, 2.114990711212158, 2.3850972652435303, 2.6552038192749023, 2.9253103733062744, 3.1954169273376465, 3.4655234813690186, 3.7356300354003906, 4.005736351013184, 4.275843143463135, 4.545949935913086, 4.816056251525879, 5.086162567138672, 5.356269359588623, 5.626376152038574, 5.896482467651367, 6.16658878326416, 6.436695575714111, 6.7068023681640625, 6.9769086837768555, 7.247014999389648, 7.5171217918396, 7.787228584289551, 8.057334899902344, 8.327441215515137, 8.59754753112793, 8.867654800415039, 9.137761116027832, 9.407867431640625, 9.677974700927734, 9.948081016540527, 10.21818733215332]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 3.0, 2.0, 8.0, 13.0, 7.0, 13.0, 28.0, 42.0, 36.0, 51.0, 106.0, 130.0, 201.0, 326.0, 531.0, 942.0, 1697.0, 3225.0, 6500.0, 14332.0, 34550.0, 88887.0, 224228.0, 344565.0, 196975.0, 76066.0, 29661.0, 12738.0, 5896.0, 2945.0, 1594.0, 904.0, 484.0, 315.0, 175.0, 125.0, 73.0, 63.0, 41.0, 24.0, 20.0, 11.0, 9.0, 8.0, 4.0, 7.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1494140625, -1.1074981689453125, -1.065582275390625, -1.0236663818359375, -0.98175048828125, -0.9398345947265625, -0.897918701171875, -0.8560028076171875, -0.8140869140625, -0.7721710205078125, -0.730255126953125, -0.6883392333984375, -0.64642333984375, -0.6045074462890625, -0.562591552734375, -0.5206756591796875, -0.478759765625, -0.4368438720703125, -0.394927978515625, -0.3530120849609375, -0.31109619140625, -0.2691802978515625, -0.227264404296875, -0.1853485107421875, -0.1434326171875, -0.1015167236328125, -0.059600830078125, -0.0176849365234375, 0.02423095703125, 0.0661468505859375, 0.108062744140625, 0.1499786376953125, 0.19189453125, 0.2338104248046875, 0.275726318359375, 0.3176422119140625, 0.35955810546875, 0.4014739990234375, 0.443389892578125, 0.4853057861328125, 0.5272216796875, 0.5691375732421875, 0.611053466796875, 0.6529693603515625, 0.69488525390625, 0.7368011474609375, 0.778717041015625, 0.8206329345703125, 0.862548828125, 0.9044647216796875, 0.946380615234375, 0.9882965087890625, 1.03021240234375, 1.0721282958984375, 1.114044189453125, 1.1559600830078125, 1.1978759765625, 1.2397918701171875, 1.281707763671875, 1.3236236572265625, 1.36553955078125, 1.4074554443359375, 1.449371337890625, 1.4912872314453125, 1.533203125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 6.0, 2.0, 6.0, 10.0, 12.0, 15.0, 13.0, 25.0, 25.0, 30.0, 37.0, 31.0, 45.0, 40.0, 50.0, 71.0, 56.0, 62.0, 71.0, 64.0, 60.0, 39.0, 51.0, 32.0, 31.0, 26.0, 20.0, 14.0, 12.0, 9.0, 7.0, 8.0, 4.0, 6.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.65673828125, -0.6317977905273438, -0.6068572998046875, -0.5819168090820312, -0.556976318359375, -0.5320358276367188, -0.5070953369140625, -0.48215484619140625, -0.45721435546875, -0.43227386474609375, -0.4073333740234375, -0.38239288330078125, -0.357452392578125, -0.33251190185546875, -0.3075714111328125, -0.28263092041015625, -0.2576904296875, -0.23274993896484375, -0.2078094482421875, -0.18286895751953125, -0.157928466796875, -0.13298797607421875, -0.1080474853515625, -0.08310699462890625, -0.05816650390625, -0.03322601318359375, -0.0082855224609375, 0.01665496826171875, 0.041595458984375, 0.06653594970703125, 0.0914764404296875, 0.11641693115234375, 0.141357421875, 0.16629791259765625, 0.1912384033203125, 0.21617889404296875, 0.241119384765625, 0.26605987548828125, 0.2910003662109375, 0.31594085693359375, 0.34088134765625, 0.36582183837890625, 0.3907623291015625, 0.41570281982421875, 0.440643310546875, 0.46558380126953125, 0.4905242919921875, 0.5154647827148438, 0.5404052734375, 0.5653457641601562, 0.5902862548828125, 0.6152267456054688, 0.640167236328125, 0.6651077270507812, 0.6900482177734375, 0.7149887084960938, 0.73992919921875, 0.7648696899414062, 0.7898101806640625, 0.8147506713867188, 0.839691162109375, 0.8646316528320312, 0.8895721435546875, 0.9145126342773438, 0.939453125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 5.0, 3.0, 6.0, 9.0, 13.0, 38.0, 40.0, 87.0, 124.0, 183.0, 386.0, 911.0, 3824.0, 67998.0, 935323.0, 35122.0, 2889.0, 763.0, 338.0, 174.0, 119.0, 69.0, 49.0, 26.0, 20.0, 9.0, 9.0, 4.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.8125, -5.61492919921875, -5.4173583984375, -5.21978759765625, -5.022216796875, -4.82464599609375, -4.6270751953125, -4.42950439453125, -4.23193359375, -4.03436279296875, -3.8367919921875, -3.63922119140625, -3.441650390625, -3.24407958984375, -3.0465087890625, -2.84893798828125, -2.6513671875, -2.45379638671875, -2.2562255859375, -2.05865478515625, -1.861083984375, -1.66351318359375, -1.4659423828125, -1.26837158203125, -1.07080078125, -0.87322998046875, -0.6756591796875, -0.47808837890625, -0.280517578125, -0.08294677734375, 0.1146240234375, 0.31219482421875, 0.509765625, 0.70733642578125, 0.9049072265625, 1.10247802734375, 1.300048828125, 1.49761962890625, 1.6951904296875, 1.89276123046875, 2.09033203125, 2.28790283203125, 2.4854736328125, 2.68304443359375, 2.880615234375, 3.07818603515625, 3.2757568359375, 3.47332763671875, 3.6708984375, 3.86846923828125, 4.0660400390625, 4.26361083984375, 4.461181640625, 4.65875244140625, 4.8563232421875, 5.05389404296875, 5.25146484375, 5.44903564453125, 5.6466064453125, 5.84417724609375, 6.041748046875, 6.23931884765625, 6.4368896484375, 6.63446044921875, 6.83203125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 9.0, 12.0, 12.0, 13.0, 27.0, 27.0, 40.0, 43.0, 58.0, 52.0, 71.0, 97.0, 74.0, 84.0, 61.0, 73.0, 63.0, 52.0, 36.0, 29.0, 21.0, 16.0, 13.0, 5.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.015625, -4.86053466796875, -4.7054443359375, -4.55035400390625, -4.395263671875, -4.24017333984375, -4.0850830078125, -3.92999267578125, -3.77490234375, -3.61981201171875, -3.4647216796875, -3.30963134765625, -3.154541015625, -2.99945068359375, -2.8443603515625, -2.68927001953125, -2.5341796875, -2.37908935546875, -2.2239990234375, -2.06890869140625, -1.913818359375, -1.75872802734375, -1.6036376953125, -1.44854736328125, -1.29345703125, -1.13836669921875, -0.9832763671875, -0.82818603515625, -0.673095703125, -0.51800537109375, -0.3629150390625, -0.20782470703125, -0.052734375, 0.10235595703125, 0.2574462890625, 0.41253662109375, 0.567626953125, 0.72271728515625, 0.8778076171875, 1.03289794921875, 1.18798828125, 1.34307861328125, 1.4981689453125, 1.65325927734375, 1.808349609375, 1.96343994140625, 2.1185302734375, 2.27362060546875, 2.4287109375, 2.58380126953125, 2.7388916015625, 2.89398193359375, 3.049072265625, 3.20416259765625, 3.3592529296875, 3.51434326171875, 3.66943359375, 3.82452392578125, 3.9796142578125, 4.13470458984375, 4.289794921875, 4.44488525390625, 4.5999755859375, 4.75506591796875, 4.91015625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 4.0, 5.0, 10.0, 9.0, 15.0, 17.0, 44.0, 77.0, 136.0, 344.0, 1018.0, 4556.0, 63919.0, 922021.0, 50840.0, 3932.0, 915.0, 352.0, 150.0, 86.0, 34.0, 16.0, 17.0, 15.0, 9.0, 8.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.14453125, -2.0872955322265625, -2.030059814453125, -1.9728240966796875, -1.91558837890625, -1.8583526611328125, -1.801116943359375, -1.7438812255859375, -1.6866455078125, -1.6294097900390625, -1.572174072265625, -1.5149383544921875, -1.45770263671875, -1.4004669189453125, -1.343231201171875, -1.2859954833984375, -1.228759765625, -1.1715240478515625, -1.114288330078125, -1.0570526123046875, -0.99981689453125, -0.9425811767578125, -0.885345458984375, -0.8281097412109375, -0.7708740234375, -0.7136383056640625, -0.656402587890625, -0.5991668701171875, -0.54193115234375, -0.4846954345703125, -0.427459716796875, -0.3702239990234375, -0.31298828125, -0.2557525634765625, -0.198516845703125, -0.1412811279296875, -0.08404541015625, -0.0268096923828125, 0.030426025390625, 0.0876617431640625, 0.1448974609375, 0.2021331787109375, 0.259368896484375, 0.3166046142578125, 0.37384033203125, 0.4310760498046875, 0.488311767578125, 0.5455474853515625, 0.602783203125, 0.6600189208984375, 0.717254638671875, 0.7744903564453125, 0.83172607421875, 0.8889617919921875, 0.946197509765625, 1.0034332275390625, 1.0606689453125, 1.1179046630859375, 1.175140380859375, 1.2323760986328125, 1.28961181640625, 1.3468475341796875, 1.404083251953125, 1.4613189697265625, 1.5185546875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 0.0, 2.0, 5.0, 4.0, 9.0, 10.0, 10.0, 19.0, 24.0, 34.0, 42.0, 71.0, 92.0, 119.0, 112.0, 109.0, 103.0, 77.0, 39.0, 32.0, 21.0, 22.0, 7.0, 6.0, 11.0, 10.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00023245811462402344, -0.00022589415311813354, -0.00021933019161224365, -0.00021276623010635376, -0.00020620226860046387, -0.00019963830709457397, -0.00019307434558868408, -0.0001865103840827942, -0.0001799464225769043, -0.0001733824610710144, -0.0001668184995651245, -0.00016025453805923462, -0.00015369057655334473, -0.00014712661504745483, -0.00014056265354156494, -0.00013399869203567505, -0.00012743473052978516, -0.00012087076902389526, -0.00011430680751800537, -0.00010774284601211548, -0.00010117888450622559, -9.46149230003357e-05, -8.80509614944458e-05, -8.148699998855591e-05, -7.492303848266602e-05, -6.835907697677612e-05, -6.179511547088623e-05, -5.523115396499634e-05, -4.8667192459106445e-05, -4.210323095321655e-05, -3.553926944732666e-05, -2.8975307941436768e-05, -2.2411346435546875e-05, -1.5847384929656982e-05, -9.28342342376709e-06, -2.7194619178771973e-06, 3.844499588012695e-06, 1.0408461093902588e-05, 1.697242259979248e-05, 2.3536384105682373e-05, 3.0100345611572266e-05, 3.666430711746216e-05, 4.322826862335205e-05, 4.979223012924194e-05, 5.6356191635131836e-05, 6.292015314102173e-05, 6.948411464691162e-05, 7.604807615280151e-05, 8.26120376586914e-05, 8.91759991645813e-05, 9.573996067047119e-05, 0.00010230392217636108, 0.00010886788368225098, 0.00011543184518814087, 0.00012199580669403076, 0.00012855976819992065, 0.00013512372970581055, 0.00014168769121170044, 0.00014825165271759033, 0.00015481561422348022, 0.00016137957572937012, 0.00016794353723526, 0.0001745074987411499, 0.0001810714602470398, 0.0001876354217529297]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 9.0, 7.0, 2.0, 9.0, 14.0, 29.0, 40.0, 58.0, 84.0, 182.0, 390.0, 820.0, 2496.0, 12710.0, 210623.0, 773386.0, 40026.0, 5149.0, 1377.0, 564.0, 247.0, 112.0, 82.0, 54.0, 29.0, 20.0, 13.0, 4.0, 5.0, 1.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4130859375, -1.3692626953125, -1.325439453125, -1.2816162109375, -1.23779296875, -1.1939697265625, -1.150146484375, -1.1063232421875, -1.0625, -1.0186767578125, -0.974853515625, -0.9310302734375, -0.88720703125, -0.8433837890625, -0.799560546875, -0.7557373046875, -0.7119140625, -0.6680908203125, -0.624267578125, -0.5804443359375, -0.53662109375, -0.4927978515625, -0.448974609375, -0.4051513671875, -0.361328125, -0.3175048828125, -0.273681640625, -0.2298583984375, -0.18603515625, -0.1422119140625, -0.098388671875, -0.0545654296875, -0.0107421875, 0.0330810546875, 0.076904296875, 0.1207275390625, 0.16455078125, 0.2083740234375, 0.252197265625, 0.2960205078125, 0.33984375, 0.3836669921875, 0.427490234375, 0.4713134765625, 0.51513671875, 0.5589599609375, 0.602783203125, 0.6466064453125, 0.6904296875, 0.7342529296875, 0.778076171875, 0.8218994140625, 0.86572265625, 0.9095458984375, 0.953369140625, 0.9971923828125, 1.041015625, 1.0848388671875, 1.128662109375, 1.1724853515625, 1.21630859375, 1.2601318359375, 1.303955078125, 1.3477783203125, 1.3916015625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 10.0, 9.0, 11.0, 17.0, 35.0, 24.0, 58.0, 70.0, 86.0, 110.0, 118.0, 113.0, 93.0, 72.0, 60.0, 40.0, 21.0, 17.0, 11.0, 3.0, 2.0, 3.0, 3.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.990234375, -0.952606201171875, -0.91497802734375, -0.877349853515625, -0.8397216796875, -0.802093505859375, -0.76446533203125, -0.726837158203125, -0.689208984375, -0.651580810546875, -0.61395263671875, -0.576324462890625, -0.5386962890625, -0.501068115234375, -0.46343994140625, -0.425811767578125, -0.38818359375, -0.350555419921875, -0.31292724609375, -0.275299072265625, -0.2376708984375, -0.200042724609375, -0.16241455078125, -0.124786376953125, -0.087158203125, -0.049530029296875, -0.01190185546875, 0.025726318359375, 0.0633544921875, 0.100982666015625, 0.13861083984375, 0.176239013671875, 0.2138671875, 0.251495361328125, 0.28912353515625, 0.326751708984375, 0.3643798828125, 0.402008056640625, 0.43963623046875, 0.477264404296875, 0.514892578125, 0.552520751953125, 0.59014892578125, 0.627777099609375, 0.6654052734375, 0.703033447265625, 0.74066162109375, 0.778289794921875, 0.81591796875, 0.853546142578125, 0.89117431640625, 0.928802490234375, 0.9664306640625, 1.004058837890625, 1.04168701171875, 1.079315185546875, 1.116943359375, 1.154571533203125, 1.19219970703125, 1.229827880859375, 1.2674560546875, 1.305084228515625, 1.34271240234375, 1.380340576171875, 1.41796875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 15.0, 17.0, 48.0, 104.0, 207.0, 276.0, 188.0, 76.0, 42.0, 24.0, 6.0, 7.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.46487808227539, -16.038665771484375, -14.612455368041992, -13.186243057250977, -11.760031700134277, -10.333820343017578, -8.907608032226562, -7.481396675109863, -6.055185317993164, -4.628973960876465, -3.2027621269226074, -1.77655029296875, -0.3503389358520508, 1.0758724212646484, 2.502084732055664, 3.9282960891723633, 5.3545074462890625, 6.780718803405762, 8.206930160522461, 9.633142471313477, 11.059353828430176, 12.485565185546875, 13.91177749633789, 15.33798885345459, 16.76420021057129, 18.190412521362305, 19.616622924804688, 21.042835235595703, 22.46904754638672, 23.8952579498291, 25.321470260620117, 26.7476806640625, 28.17389678955078, 29.600109100341797, 31.02631950378418, 32.45252990722656, 33.87874221801758, 35.304954528808594, 36.73116683959961, 38.157379150390625, 39.583587646484375, 41.00979995727539, 42.436012268066406, 43.862220764160156, 45.28843307495117, 46.71464538574219, 48.1408576965332, 49.56707000732422, 50.993282318115234, 52.41949462890625, 53.845706939697266, 55.27191925048828, 56.69812774658203, 58.12434005737305, 59.55055236816406, 60.97676467895508, 62.402976989746094, 63.82918930053711, 65.25540161132812, 66.68161010742188, 68.10782623291016, 69.5340347290039, 70.96025085449219, 72.38645935058594, 73.81266784667969]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 1.0, 4.0, 5.0, 8.0, 10.0, 16.0, 18.0, 21.0, 20.0, 30.0, 37.0, 42.0, 59.0, 63.0, 61.0, 61.0, 51.0, 75.0, 64.0, 47.0, 51.0, 48.0, 51.0, 36.0, 23.0, 26.0, 14.0, 15.0, 9.0, 9.0, 9.0, 4.0, 7.0, 5.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.036518096923828, -20.397083282470703, -19.757646560668945, -19.11821174621582, -18.478775024414062, -17.839340209960938, -17.199905395507812, -16.560470581054688, -15.92103385925293, -15.281598091125488, -14.642162322998047, -14.002727508544922, -13.36329174041748, -12.723855972290039, -12.084421157836914, -11.444985389709473, -10.805549621582031, -10.16611385345459, -9.526678085327148, -8.887243270874023, -8.247807502746582, -7.608371734619141, -6.968936443328857, -6.329501152038574, -5.690065383911133, -5.050629615783691, -4.411194324493408, -3.771758794784546, -3.1323232650756836, -2.4928877353668213, -1.853452205657959, -1.2140169143676758, -0.5745811462402344, 0.06485438346862793, 0.7042899131774902, 1.3437254428863525, 1.9831609725952148, 2.622596502304077, 3.2620320320129395, 3.9014673233032227, 4.540903091430664, 5.1803388595581055, 5.819774150848389, 6.459209442138672, 7.098645210266113, 7.738080978393555, 8.37751579284668, 9.016951560974121, 9.656387329101562, 10.295823097229004, 10.935258865356445, 11.57469367980957, 12.214129447937012, 12.853565216064453, 13.493000030517578, 14.13243579864502, 14.771871566772461, 15.411307334899902, 16.050743103027344, 16.69017791748047, 17.329612731933594, 17.96904945373535, 18.608484268188477, 19.247920989990234, 19.88735580444336]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 7.0, 1.0, 2.0, 7.0, 6.0, 9.0, 9.0, 7.0, 11.0, 13.0, 19.0, 24.0, 33.0, 34.0, 41.0, 65.0, 110.0, 127.0, 223.0, 365.0, 682.0, 1260.0, 3059.0, 7999.0, 27231.0, 142278.0, 3218992.0, 697350.0, 66861.0, 17249.0, 5733.0, 2310.0, 1062.0, 495.0, 232.0, 144.0, 87.0, 53.0, 28.0, 20.0, 12.0, 12.0, 12.0, 4.0, 7.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.08203125, -2.030975341796875, -1.97991943359375, -1.928863525390625, -1.8778076171875, -1.826751708984375, -1.77569580078125, -1.724639892578125, -1.673583984375, -1.622528076171875, -1.57147216796875, -1.520416259765625, -1.4693603515625, -1.418304443359375, -1.36724853515625, -1.316192626953125, -1.26513671875, -1.214080810546875, -1.16302490234375, -1.111968994140625, -1.0609130859375, -1.009857177734375, -0.95880126953125, -0.907745361328125, -0.856689453125, -0.805633544921875, -0.75457763671875, -0.703521728515625, -0.6524658203125, -0.601409912109375, -0.55035400390625, -0.499298095703125, -0.4482421875, -0.397186279296875, -0.34613037109375, -0.295074462890625, -0.2440185546875, -0.192962646484375, -0.14190673828125, -0.090850830078125, -0.039794921875, 0.011260986328125, 0.06231689453125, 0.113372802734375, 0.1644287109375, 0.215484619140625, 0.26654052734375, 0.317596435546875, 0.36865234375, 0.419708251953125, 0.47076416015625, 0.521820068359375, 0.5728759765625, 0.623931884765625, 0.67498779296875, 0.726043701171875, 0.777099609375, 0.828155517578125, 0.87921142578125, 0.930267333984375, 0.9813232421875, 1.032379150390625, 1.08343505859375, 1.134490966796875, 1.185546875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 9.0, 20.0, 34.0, 61.0, 89.0, 103.0, 145.0, 142.0, 107.0, 115.0, 57.0, 53.0, 32.0, 11.0, 8.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.15625, -2.1038665771484375, -2.051483154296875, -1.9990997314453125, -1.94671630859375, -1.8943328857421875, -1.841949462890625, -1.7895660400390625, -1.7371826171875, -1.6847991943359375, -1.632415771484375, -1.5800323486328125, -1.52764892578125, -1.4752655029296875, -1.422882080078125, -1.3704986572265625, -1.318115234375, -1.2657318115234375, -1.213348388671875, -1.1609649658203125, -1.10858154296875, -1.0561981201171875, -1.003814697265625, -0.9514312744140625, -0.8990478515625, -0.8466644287109375, -0.794281005859375, -0.7418975830078125, -0.68951416015625, -0.6371307373046875, -0.584747314453125, -0.5323638916015625, -0.47998046875, -0.4275970458984375, -0.375213623046875, -0.3228302001953125, -0.27044677734375, -0.2180633544921875, -0.165679931640625, -0.1132965087890625, -0.0609130859375, -0.0085296630859375, 0.043853759765625, 0.0962371826171875, 0.14862060546875, 0.2010040283203125, 0.253387451171875, 0.3057708740234375, 0.358154296875, 0.4105377197265625, 0.462921142578125, 0.5153045654296875, 0.56768798828125, 0.6200714111328125, 0.672454833984375, 0.7248382568359375, 0.7772216796875, 0.8296051025390625, 0.881988525390625, 0.9343719482421875, 0.98675537109375, 1.0391387939453125, 1.091522216796875, 1.1439056396484375, 1.1962890625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 4.0, 6.0, 7.0, 10.0, 14.0, 20.0, 23.0, 50.0, 73.0, 110.0, 232.0, 518.0, 1252.0, 3844.0, 15148.0, 104116.0, 3659443.0, 368966.0, 30547.0, 6449.0, 1981.0, 780.0, 301.0, 156.0, 85.0, 44.0, 21.0, 14.0, 13.0, 10.0, 6.0, 10.0, 6.0, 4.0, 5.0, 1.0, 1.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-2.833984375, -2.749908447265625, -2.66583251953125, -2.581756591796875, -2.4976806640625, -2.413604736328125, -2.32952880859375, -2.245452880859375, -2.161376953125, -2.077301025390625, -1.99322509765625, -1.909149169921875, -1.8250732421875, -1.740997314453125, -1.65692138671875, -1.572845458984375, -1.48876953125, -1.404693603515625, -1.32061767578125, -1.236541748046875, -1.1524658203125, -1.068389892578125, -0.98431396484375, -0.900238037109375, -0.816162109375, -0.732086181640625, -0.64801025390625, -0.563934326171875, -0.4798583984375, -0.395782470703125, -0.31170654296875, -0.227630615234375, -0.1435546875, -0.059478759765625, 0.02459716796875, 0.108673095703125, 0.1927490234375, 0.276824951171875, 0.36090087890625, 0.444976806640625, 0.529052734375, 0.613128662109375, 0.69720458984375, 0.781280517578125, 0.8653564453125, 0.949432373046875, 1.03350830078125, 1.117584228515625, 1.20166015625, 1.285736083984375, 1.36981201171875, 1.453887939453125, 1.5379638671875, 1.622039794921875, 1.70611572265625, 1.790191650390625, 1.874267578125, 1.958343505859375, 2.04241943359375, 2.126495361328125, 2.2105712890625, 2.294647216796875, 2.37872314453125, 2.462799072265625, 2.546875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 5.0, 2.0, 7.0, 8.0, 14.0, 15.0, 16.0, 20.0, 37.0, 63.0, 75.0, 147.0, 322.0, 856.0, 1215.0, 645.0, 257.0, 136.0, 66.0, 52.0, 29.0, 17.0, 21.0, 9.0, 7.0, 10.0, 4.0, 7.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.41796875, -2.34332275390625, -2.2686767578125, -2.19403076171875, -2.119384765625, -2.04473876953125, -1.9700927734375, -1.89544677734375, -1.82080078125, -1.74615478515625, -1.6715087890625, -1.59686279296875, -1.522216796875, -1.44757080078125, -1.3729248046875, -1.29827880859375, -1.2236328125, -1.14898681640625, -1.0743408203125, -0.99969482421875, -0.925048828125, -0.85040283203125, -0.7757568359375, -0.70111083984375, -0.62646484375, -0.55181884765625, -0.4771728515625, -0.40252685546875, -0.327880859375, -0.25323486328125, -0.1785888671875, -0.10394287109375, -0.029296875, 0.04534912109375, 0.1199951171875, 0.19464111328125, 0.269287109375, 0.34393310546875, 0.4185791015625, 0.49322509765625, 0.56787109375, 0.64251708984375, 0.7171630859375, 0.79180908203125, 0.866455078125, 0.94110107421875, 1.0157470703125, 1.09039306640625, 1.1650390625, 1.23968505859375, 1.3143310546875, 1.38897705078125, 1.463623046875, 1.53826904296875, 1.6129150390625, 1.68756103515625, 1.76220703125, 1.83685302734375, 1.9114990234375, 1.98614501953125, 2.060791015625, 2.13543701171875, 2.2100830078125, 2.28472900390625, 2.359375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 8.0, 14.0, 31.0, 94.0, 215.0, 285.0, 194.0, 99.0, 31.0, 9.0, 7.0, 6.0, 2.0, 5.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.81629180908203, -35.92899703979492, -35.04170227050781, -34.1544075012207, -33.267112731933594, -32.379817962646484, -31.492525100708008, -30.6052303314209, -29.71793556213379, -28.83064079284668, -27.94334602355957, -27.05605125427246, -26.168758392333984, -25.281463623046875, -24.394168853759766, -23.506874084472656, -22.619579315185547, -21.732284545898438, -20.844989776611328, -19.95769500732422, -19.07040023803711, -18.18310546875, -17.295812606811523, -16.408517837524414, -15.521223068237305, -14.633928298950195, -13.746633529663086, -12.859339714050293, -11.972044944763184, -11.084750175476074, -10.197456359863281, -9.310161590576172, -8.422868728637695, -7.535573959350586, -6.648279666900635, -5.760985374450684, -4.873690605163574, -3.986395835876465, -3.0991015434265137, -2.2118072509765625, -1.3245124816894531, -0.43721795082092285, 0.4500765800476074, 1.3373711109161377, 2.224665641784668, 3.1119604110717773, 3.9992547035217285, 4.88654899597168, 5.773843765258789, 6.661138534545898, 7.54843282699585, 8.4357271194458, 9.32302188873291, 10.21031665802002, 11.097610473632812, 11.984905242919922, 12.872200012207031, 13.75949478149414, 14.64678955078125, 15.534083366394043, 16.42137908935547, 17.308673858642578, 18.195966720581055, 19.083261489868164, 19.970556259155273]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 7.0, 7.0, 9.0, 13.0, 18.0, 21.0, 19.0, 22.0, 36.0, 28.0, 45.0, 43.0, 48.0, 66.0, 54.0, 60.0, 62.0, 56.0, 52.0, 52.0, 40.0, 40.0, 39.0, 42.0, 21.0, 23.0, 23.0, 13.0, 12.0, 8.0, 7.0, 3.0, 1.0, 4.0, 2.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.543047904968262, -9.176339149475098, -8.809630393981934, -8.44292163848877, -8.076212882995605, -7.709504127502441, -7.342795372009277, -6.976086616516113, -6.609377861022949, -6.242669105529785, -5.875960350036621, -5.509251594543457, -5.142542839050293, -4.775834083557129, -4.409125328063965, -4.042416572570801, -3.6757073402404785, -3.3089985847473145, -2.9422898292541504, -2.5755810737609863, -2.2088723182678223, -1.8421634435653687, -1.475454568862915, -1.108745813369751, -0.7420370578765869, -0.37532827258110046, -0.008619487285614014, 0.3580893278121948, 0.7247980833053589, 1.091506838798523, 1.4582157135009766, 1.8249244689941406, 2.1916332244873047, 2.5583419799804688, 2.925050735473633, 3.291759490966797, 3.658468246459961, 4.025177001953125, 4.391885757446289, 4.758594512939453, 5.125303268432617, 5.492012023925781, 5.858720779418945, 6.225429534912109, 6.592138290405273, 6.9588470458984375, 7.325555801391602, 7.692264556884766, 8.05897331237793, 8.425682067871094, 8.792390823364258, 9.159099578857422, 9.525808334350586, 9.89251708984375, 10.259225845336914, 10.625934600830078, 10.992644309997559, 11.359353065490723, 11.726061820983887, 12.09277057647705, 12.459479331970215, 12.826188087463379, 13.192896842956543, 13.559605598449707, 13.926314353942871]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 9.0, 5.0, 8.0, 8.0, 18.0, 35.0, 35.0, 70.0, 96.0, 178.0, 266.0, 411.0, 826.0, 1382.0, 2527.0, 5060.0, 10587.0, 23187.0, 53036.0, 118712.0, 230494.0, 278968.0, 173788.0, 81420.0, 35885.0, 16066.0, 7405.0, 3692.0, 1902.0, 989.0, 562.0, 343.0, 191.0, 141.0, 93.0, 48.0, 39.0, 29.0, 12.0, 9.0, 8.0, 6.0, 4.0, 1.0, 1.0, 5.0, 1.0, 1.0, 0.0, 3.0, 2.0], "bins": [-1.09765625, -1.0656204223632812, -1.0335845947265625, -1.0015487670898438, -0.969512939453125, -0.9374771118164062, -0.9054412841796875, -0.8734054565429688, -0.84136962890625, -0.8093338012695312, -0.7772979736328125, -0.7452621459960938, -0.713226318359375, -0.6811904907226562, -0.6491546630859375, -0.6171188354492188, -0.5850830078125, -0.5530471801757812, -0.5210113525390625, -0.48897552490234375, -0.456939697265625, -0.42490386962890625, -0.3928680419921875, -0.36083221435546875, -0.32879638671875, -0.29676055908203125, -0.2647247314453125, -0.23268890380859375, -0.200653076171875, -0.16861724853515625, -0.1365814208984375, -0.10454559326171875, -0.072509765625, -0.04047393798828125, -0.0084381103515625, 0.02359771728515625, 0.055633544921875, 0.08766937255859375, 0.1197052001953125, 0.15174102783203125, 0.18377685546875, 0.21581268310546875, 0.2478485107421875, 0.27988433837890625, 0.311920166015625, 0.34395599365234375, 0.3759918212890625, 0.40802764892578125, 0.4400634765625, 0.47209930419921875, 0.5041351318359375, 0.5361709594726562, 0.568206787109375, 0.6002426147460938, 0.6322784423828125, 0.6643142700195312, 0.69635009765625, 0.7283859252929688, 0.7604217529296875, 0.7924575805664062, 0.824493408203125, 0.8565292358398438, 0.8885650634765625, 0.9206008911132812, 0.95263671875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 12.0, 7.0, 15.0, 21.0, 18.0, 39.0, 61.0, 83.0, 81.0, 100.0, 115.0, 97.0, 86.0, 71.0, 65.0, 45.0, 29.0, 22.0, 13.0, 10.0, 10.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3935546875, -1.35540771484375, -1.3172607421875, -1.27911376953125, -1.240966796875, -1.20281982421875, -1.1646728515625, -1.12652587890625, -1.08837890625, -1.05023193359375, -1.0120849609375, -0.97393798828125, -0.935791015625, -0.89764404296875, -0.8594970703125, -0.82135009765625, -0.783203125, -0.74505615234375, -0.7069091796875, -0.66876220703125, -0.630615234375, -0.59246826171875, -0.5543212890625, -0.51617431640625, -0.47802734375, -0.43988037109375, -0.4017333984375, -0.36358642578125, -0.325439453125, -0.28729248046875, -0.2491455078125, -0.21099853515625, -0.1728515625, -0.13470458984375, -0.0965576171875, -0.05841064453125, -0.020263671875, 0.01788330078125, 0.0560302734375, 0.09417724609375, 0.13232421875, 0.17047119140625, 0.2086181640625, 0.24676513671875, 0.284912109375, 0.32305908203125, 0.3612060546875, 0.39935302734375, 0.4375, 0.47564697265625, 0.5137939453125, 0.55194091796875, 0.590087890625, 0.62823486328125, 0.6663818359375, 0.70452880859375, 0.74267578125, 0.78082275390625, 0.8189697265625, 0.85711669921875, 0.895263671875, 0.93341064453125, 0.9715576171875, 1.00970458984375, 1.0478515625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 5.0, 6.0, 9.0, 4.0, 17.0, 14.0, 24.0, 40.0, 44.0, 80.0, 122.0, 171.0, 280.0, 453.0, 743.0, 1439.0, 3079.0, 8967.0, 35384.0, 203057.0, 603385.0, 151022.0, 27166.0, 7176.0, 2705.0, 1258.0, 681.0, 423.0, 267.0, 157.0, 118.0, 69.0, 45.0, 43.0, 34.0, 23.0, 14.0, 8.0, 6.0, 6.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.71875, -1.6536865234375, -1.588623046875, -1.5235595703125, -1.45849609375, -1.3934326171875, -1.328369140625, -1.2633056640625, -1.1982421875, -1.1331787109375, -1.068115234375, -1.0030517578125, -0.93798828125, -0.8729248046875, -0.807861328125, -0.7427978515625, -0.677734375, -0.6126708984375, -0.547607421875, -0.4825439453125, -0.41748046875, -0.3524169921875, -0.287353515625, -0.2222900390625, -0.1572265625, -0.0921630859375, -0.027099609375, 0.0379638671875, 0.10302734375, 0.1680908203125, 0.233154296875, 0.2982177734375, 0.36328125, 0.4283447265625, 0.493408203125, 0.5584716796875, 0.62353515625, 0.6885986328125, 0.753662109375, 0.8187255859375, 0.8837890625, 0.9488525390625, 1.013916015625, 1.0789794921875, 1.14404296875, 1.2091064453125, 1.274169921875, 1.3392333984375, 1.404296875, 1.4693603515625, 1.534423828125, 1.5994873046875, 1.66455078125, 1.7296142578125, 1.794677734375, 1.8597412109375, 1.9248046875, 1.9898681640625, 2.054931640625, 2.1199951171875, 2.18505859375, 2.2501220703125, 2.315185546875, 2.3802490234375, 2.4453125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 1.0, 3.0, 1.0, 4.0, 7.0, 14.0, 12.0, 14.0, 17.0, 25.0, 17.0, 26.0, 28.0, 48.0, 46.0, 43.0, 46.0, 56.0, 52.0, 48.0, 42.0, 55.0, 42.0, 46.0, 43.0, 34.0, 43.0, 30.0, 27.0, 25.0, 13.0, 20.0, 18.0, 10.0, 12.0, 5.0, 5.0, 5.0, 3.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9765625, -2.883453369140625, -2.79034423828125, -2.697235107421875, -2.6041259765625, -2.511016845703125, -2.41790771484375, -2.324798583984375, -2.231689453125, -2.138580322265625, -2.04547119140625, -1.952362060546875, -1.8592529296875, -1.766143798828125, -1.67303466796875, -1.579925537109375, -1.48681640625, -1.393707275390625, -1.30059814453125, -1.207489013671875, -1.1143798828125, -1.021270751953125, -0.92816162109375, -0.835052490234375, -0.741943359375, -0.648834228515625, -0.55572509765625, -0.462615966796875, -0.3695068359375, -0.276397705078125, -0.18328857421875, -0.090179443359375, 0.0029296875, 0.096038818359375, 0.18914794921875, 0.282257080078125, 0.3753662109375, 0.468475341796875, 0.56158447265625, 0.654693603515625, 0.747802734375, 0.840911865234375, 0.93402099609375, 1.027130126953125, 1.1202392578125, 1.213348388671875, 1.30645751953125, 1.399566650390625, 1.49267578125, 1.585784912109375, 1.67889404296875, 1.772003173828125, 1.8651123046875, 1.958221435546875, 2.05133056640625, 2.144439697265625, 2.237548828125, 2.330657958984375, 2.42376708984375, 2.516876220703125, 2.6099853515625, 2.703094482421875, 2.79620361328125, 2.889312744140625, 2.982421875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 1.0, 10.0, 24.0, 16.0, 25.0, 57.0, 61.0, 125.0, 234.0, 514.0, 1217.0, 4067.0, 21468.0, 300791.0, 670013.0, 40820.0, 6090.0, 1674.0, 624.0, 300.0, 169.0, 87.0, 54.0, 21.0, 28.0, 18.0, 6.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2216796875, -1.1858978271484375, -1.150115966796875, -1.1143341064453125, -1.07855224609375, -1.0427703857421875, -1.006988525390625, -0.9712066650390625, -0.9354248046875, -0.8996429443359375, -0.863861083984375, -0.8280792236328125, -0.79229736328125, -0.7565155029296875, -0.720733642578125, -0.6849517822265625, -0.649169921875, -0.6133880615234375, -0.577606201171875, -0.5418243408203125, -0.50604248046875, -0.4702606201171875, -0.434478759765625, -0.3986968994140625, -0.3629150390625, -0.3271331787109375, -0.291351318359375, -0.2555694580078125, -0.21978759765625, -0.1840057373046875, -0.148223876953125, -0.1124420166015625, -0.07666015625, -0.0408782958984375, -0.005096435546875, 0.0306854248046875, 0.06646728515625, 0.1022491455078125, 0.138031005859375, 0.1738128662109375, 0.2095947265625, 0.2453765869140625, 0.281158447265625, 0.3169403076171875, 0.35272216796875, 0.3885040283203125, 0.424285888671875, 0.4600677490234375, 0.495849609375, 0.5316314697265625, 0.567413330078125, 0.6031951904296875, 0.63897705078125, 0.6747589111328125, 0.710540771484375, 0.7463226318359375, 0.7821044921875, 0.8178863525390625, 0.853668212890625, 0.8894500732421875, 0.92523193359375, 0.9610137939453125, 0.996795654296875, 1.0325775146484375, 1.068359375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 0.0, 2.0, 4.0, 3.0, 3.0, 9.0, 7.0, 15.0, 20.0, 31.0, 40.0, 54.0, 74.0, 78.0, 126.0, 124.0, 109.0, 66.0, 63.0, 52.0, 28.0, 25.0, 19.0, 16.0, 9.0, 4.0, 4.0, 3.0, 2.0, 6.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019669532775878906, -0.00019000470638275146, -0.00018331408500671387, -0.00017662346363067627, -0.00016993284225463867, -0.00016324222087860107, -0.00015655159950256348, -0.00014986097812652588, -0.00014317035675048828, -0.00013647973537445068, -0.00012978911399841309, -0.0001230984926223755, -0.00011640787124633789, -0.00010971724987030029, -0.0001030266284942627, -9.63360071182251e-05, -8.96453857421875e-05, -8.29547643661499e-05, -7.62641429901123e-05, -6.957352161407471e-05, -6.288290023803711e-05, -5.619227886199951e-05, -4.9501657485961914e-05, -4.2811036109924316e-05, -3.612041473388672e-05, -2.942979335784912e-05, -2.2739171981811523e-05, -1.6048550605773926e-05, -9.357929229736328e-06, -2.6673078536987305e-06, 4.023313522338867e-06, 1.0713934898376465e-05, 1.7404556274414062e-05, 2.409517765045166e-05, 3.078579902648926e-05, 3.7476420402526855e-05, 4.416704177856445e-05, 5.085766315460205e-05, 5.754828453063965e-05, 6.423890590667725e-05, 7.092952728271484e-05, 7.762014865875244e-05, 8.431077003479004e-05, 9.100139141082764e-05, 9.769201278686523e-05, 0.00010438263416290283, 0.00011107325553894043, 0.00011776387691497803, 0.00012445449829101562, 0.00013114511966705322, 0.00013783574104309082, 0.00014452636241912842, 0.00015121698379516602, 0.0001579076051712036, 0.0001645982265472412, 0.0001712888479232788, 0.0001779794692993164, 0.000184670090675354, 0.0001913607120513916, 0.0001980513334274292, 0.0002047419548034668, 0.0002114325761795044, 0.000218123197555542, 0.0002248138189315796, 0.0002315044403076172]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 7.0, 3.0, 4.0, 6.0, 12.0, 22.0, 24.0, 54.0, 86.0, 162.0, 279.0, 508.0, 1155.0, 3233.0, 11184.0, 80193.0, 722084.0, 200764.0, 20936.0, 4688.0, 1668.0, 705.0, 326.0, 163.0, 104.0, 68.0, 37.0, 25.0, 17.0, 14.0, 8.0, 2.0, 3.0, 4.0, 2.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9033203125, -0.8738784790039062, -0.8444366455078125, -0.8149948120117188, -0.785552978515625, -0.7561111450195312, -0.7266693115234375, -0.6972274780273438, -0.66778564453125, -0.6383438110351562, -0.6089019775390625, -0.5794601440429688, -0.550018310546875, -0.5205764770507812, -0.4911346435546875, -0.46169281005859375, -0.4322509765625, -0.40280914306640625, -0.3733673095703125, -0.34392547607421875, -0.314483642578125, -0.28504180908203125, -0.2555999755859375, -0.22615814208984375, -0.19671630859375, -0.16727447509765625, -0.1378326416015625, -0.10839080810546875, -0.078948974609375, -0.04950714111328125, -0.0200653076171875, 0.00937652587890625, 0.038818359375, 0.06826019287109375, 0.0977020263671875, 0.12714385986328125, 0.156585693359375, 0.18602752685546875, 0.2154693603515625, 0.24491119384765625, 0.27435302734375, 0.30379486083984375, 0.3332366943359375, 0.36267852783203125, 0.392120361328125, 0.42156219482421875, 0.4510040283203125, 0.48044586181640625, 0.5098876953125, 0.5393295288085938, 0.5687713623046875, 0.5982131958007812, 0.627655029296875, 0.6570968627929688, 0.6865386962890625, 0.7159805297851562, 0.74542236328125, 0.7748641967773438, 0.8043060302734375, 0.8337478637695312, 0.863189697265625, 0.8926315307617188, 0.9220733642578125, 0.9515151977539062, 0.98095703125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 8.0, 5.0, 8.0, 6.0, 13.0, 15.0, 21.0, 23.0, 33.0, 35.0, 50.0, 53.0, 66.0, 86.0, 80.0, 82.0, 71.0, 69.0, 77.0, 59.0, 30.0, 26.0, 29.0, 14.0, 10.0, 13.0, 9.0, 7.0, 4.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.66455078125, -0.6380538940429688, -0.6115570068359375, -0.5850601196289062, -0.558563232421875, -0.5320663452148438, -0.5055694580078125, -0.47907257080078125, -0.45257568359375, -0.42607879638671875, -0.3995819091796875, -0.37308502197265625, -0.346588134765625, -0.32009124755859375, -0.2935943603515625, -0.26709747314453125, -0.2406005859375, -0.21410369873046875, -0.1876068115234375, -0.16110992431640625, -0.134613037109375, -0.10811614990234375, -0.0816192626953125, -0.05512237548828125, -0.02862548828125, -0.00212860107421875, 0.0243682861328125, 0.05086517333984375, 0.077362060546875, 0.10385894775390625, 0.1303558349609375, 0.15685272216796875, 0.183349609375, 0.20984649658203125, 0.2363433837890625, 0.26284027099609375, 0.289337158203125, 0.31583404541015625, 0.3423309326171875, 0.36882781982421875, 0.39532470703125, 0.42182159423828125, 0.4483184814453125, 0.47481536865234375, 0.501312255859375, 0.5278091430664062, 0.5543060302734375, 0.5808029174804688, 0.6072998046875, 0.6337966918945312, 0.6602935791015625, 0.6867904663085938, 0.713287353515625, 0.7397842407226562, 0.7662811279296875, 0.7927780151367188, 0.81927490234375, 0.8457717895507812, 0.8722686767578125, 0.8987655639648438, 0.925262451171875, 0.9517593383789062, 0.9782562255859375, 1.0047531127929688, 1.03125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 52.0, 240.0, 532.0, 164.0, 18.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.50355529785156, -74.56202697753906, -72.6205062866211, -70.6789779663086, -68.7374496459961, -66.79592895507812, -64.85440063476562, -62.91287612915039, -60.971351623535156, -59.02982711791992, -57.08829879760742, -55.14677429199219, -53.20524978637695, -51.26372528076172, -49.32219696044922, -47.380672454833984, -45.439144134521484, -43.49761962890625, -41.55609130859375, -39.614566802978516, -37.67304229736328, -35.73151397705078, -33.78998947143555, -31.848464965820312, -29.906938552856445, -27.965412139892578, -26.023887634277344, -24.082361221313477, -22.14083480834961, -20.199310302734375, -18.257783889770508, -16.31625747680664, -14.374736785888672, -12.433211326599121, -10.49168586730957, -8.550159454345703, -6.608633995056152, -4.667108535766602, -2.7255821228027344, -0.7840566635131836, 1.1574687957763672, 3.098994493484497, 5.040520191192627, 6.982046127319336, 8.923571586608887, 10.865097045898438, 12.806623458862305, 14.748148918151855, 16.689674377441406, 18.631200790405273, 20.572725296020508, 22.514251708984375, 24.45577621459961, 26.397302627563477, 28.338829040527344, 30.280353546142578, 32.22187805175781, 34.16340255737305, 36.10493087768555, 38.04645538330078, 39.987979888916016, 41.92950439453125, 43.87103271484375, 45.812557220458984, 47.754085540771484]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 6.0, 2.0, 6.0, 11.0, 15.0, 25.0, 38.0, 40.0, 29.0, 57.0, 76.0, 74.0, 82.0, 96.0, 80.0, 75.0, 63.0, 53.0, 35.0, 27.0, 38.0, 27.0, 21.0, 10.0, 4.0, 8.0, 6.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.208656311035156, -11.64046573638916, -11.072275161743164, -10.504084587097168, -9.935894012451172, -9.36770248413086, -8.799511909484863, -8.231321334838867, -7.663130760192871, -7.094940185546875, -6.526749610900879, -5.958558559417725, -5.3903679847717285, -4.822177410125732, -4.253986358642578, -3.685795783996582, -3.117605209350586, -2.54941463470459, -1.9812238216400146, -1.413033127784729, -0.8448424339294434, -0.27665185928344727, 0.29153895378112793, 0.8597297668457031, 1.4279203414916992, 1.9961110353469849, 2.5643017292022705, 3.1324925422668457, 3.700683116912842, 4.268873691558838, 4.837064743041992, 5.405255317687988, 5.973445892333984, 6.5416364669799805, 7.109827041625977, 7.678018093109131, 8.246208190917969, 8.814399719238281, 9.382590293884277, 9.950780868530273, 10.51897144317627, 11.087162017822266, 11.655352592468262, 12.223543167114258, 12.79173469543457, 13.35992431640625, 13.928115844726562, 14.496306419372559, 15.064496994018555, 15.63268756866455, 16.200878143310547, 16.76906967163086, 17.33725929260254, 17.90545082092285, 18.47364044189453, 19.041831970214844, 19.610023498535156, 20.17821502685547, 20.74640464782715, 21.31459617614746, 21.88278579711914, 22.450977325439453, 23.019166946411133, 23.587358474731445, 24.155548095703125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 7.0, 2.0, 3.0, 5.0, 6.0, 13.0, 19.0, 28.0, 49.0, 86.0, 187.0, 374.0, 1018.0, 3378.0, 14450.0, 105262.0, 3593194.0, 439311.0, 27866.0, 5924.0, 1758.0, 675.0, 274.0, 155.0, 72.0, 55.0, 37.0, 26.0, 17.0, 10.0, 10.0, 6.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.033203125, -1.9746246337890625, -1.916046142578125, -1.8574676513671875, -1.79888916015625, -1.7403106689453125, -1.681732177734375, -1.6231536865234375, -1.5645751953125, -1.5059967041015625, -1.447418212890625, -1.3888397216796875, -1.33026123046875, -1.2716827392578125, -1.213104248046875, -1.1545257568359375, -1.095947265625, -1.0373687744140625, -0.978790283203125, -0.9202117919921875, -0.86163330078125, -0.8030548095703125, -0.744476318359375, -0.6858978271484375, -0.6273193359375, -0.5687408447265625, -0.510162353515625, -0.4515838623046875, -0.39300537109375, -0.3344268798828125, -0.275848388671875, -0.2172698974609375, -0.15869140625, -0.1001129150390625, -0.041534423828125, 0.0170440673828125, 0.07562255859375, 0.1342010498046875, 0.192779541015625, 0.2513580322265625, 0.3099365234375, 0.3685150146484375, 0.427093505859375, 0.4856719970703125, 0.54425048828125, 0.6028289794921875, 0.661407470703125, 0.7199859619140625, 0.778564453125, 0.8371429443359375, 0.895721435546875, 0.9542999267578125, 1.01287841796875, 1.0714569091796875, 1.130035400390625, 1.1886138916015625, 1.2471923828125, 1.3057708740234375, 1.364349365234375, 1.4229278564453125, 1.48150634765625, 1.5400848388671875, 1.598663330078125, 1.6572418212890625, 1.7158203125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 9.0, 20.0, 21.0, 32.0, 44.0, 62.0, 94.0, 100.0, 118.0, 114.0, 93.0, 83.0, 68.0, 55.0, 30.0, 18.0, 21.0, 15.0, 4.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67529296875, -0.6360549926757812, -0.5968170166015625, -0.5575790405273438, -0.518341064453125, -0.47910308837890625, -0.4398651123046875, -0.40062713623046875, -0.36138916015625, -0.32215118408203125, -0.2829132080078125, -0.24367523193359375, -0.204437255859375, -0.16519927978515625, -0.1259613037109375, -0.08672332763671875, -0.0474853515625, -0.00824737548828125, 0.0309906005859375, 0.07022857666015625, 0.109466552734375, 0.14870452880859375, 0.1879425048828125, 0.22718048095703125, 0.26641845703125, 0.30565643310546875, 0.3448944091796875, 0.38413238525390625, 0.423370361328125, 0.46260833740234375, 0.5018463134765625, 0.5410842895507812, 0.580322265625, 0.6195602416992188, 0.6587982177734375, 0.6980361938476562, 0.737274169921875, 0.7765121459960938, 0.8157501220703125, 0.8549880981445312, 0.89422607421875, 0.9334640502929688, 0.9727020263671875, 1.0119400024414062, 1.051177978515625, 1.0904159545898438, 1.1296539306640625, 1.1688919067382812, 1.2081298828125, 1.2473678588867188, 1.2866058349609375, 1.3258438110351562, 1.365081787109375, 1.4043197631835938, 1.4435577392578125, 1.4827957153320312, 1.52203369140625, 1.5612716674804688, 1.6005096435546875, 1.6397476196289062, 1.678985595703125, 1.7182235717773438, 1.7574615478515625, 1.7966995239257812, 1.8359375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 7.0, 2.0, 1.0, 1.0, 12.0, 7.0, 17.0, 31.0, 35.0, 55.0, 108.0, 178.0, 311.0, 703.0, 1453.0, 3292.0, 7941.0, 21684.0, 82117.0, 899304.0, 2946036.0, 175515.0, 36060.0, 11405.0, 4438.0, 1889.0, 810.0, 391.0, 203.0, 108.0, 69.0, 38.0, 19.0, 18.0, 6.0, 9.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.5166015625, -1.472259521484375, -1.42791748046875, -1.383575439453125, -1.3392333984375, -1.294891357421875, -1.25054931640625, -1.206207275390625, -1.161865234375, -1.117523193359375, -1.07318115234375, -1.028839111328125, -0.9844970703125, -0.940155029296875, -0.89581298828125, -0.851470947265625, -0.80712890625, -0.762786865234375, -0.71844482421875, -0.674102783203125, -0.6297607421875, -0.585418701171875, -0.54107666015625, -0.496734619140625, -0.452392578125, -0.408050537109375, -0.36370849609375, -0.319366455078125, -0.2750244140625, -0.230682373046875, -0.18634033203125, -0.141998291015625, -0.09765625, -0.053314208984375, -0.00897216796875, 0.035369873046875, 0.0797119140625, 0.124053955078125, 0.16839599609375, 0.212738037109375, 0.257080078125, 0.301422119140625, 0.34576416015625, 0.390106201171875, 0.4344482421875, 0.478790283203125, 0.52313232421875, 0.567474365234375, 0.61181640625, 0.656158447265625, 0.70050048828125, 0.744842529296875, 0.7891845703125, 0.833526611328125, 0.87786865234375, 0.922210693359375, 0.966552734375, 1.010894775390625, 1.05523681640625, 1.099578857421875, 1.1439208984375, 1.188262939453125, 1.23260498046875, 1.276947021484375, 1.3212890625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 5.0, 7.0, 5.0, 8.0, 8.0, 16.0, 19.0, 23.0, 43.0, 43.0, 84.0, 144.0, 289.0, 648.0, 1122.0, 743.0, 334.0, 172.0, 121.0, 75.0, 43.0, 30.0, 20.0, 21.0, 12.0, 11.0, 6.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.958984375, -1.9055633544921875, -1.852142333984375, -1.7987213134765625, -1.74530029296875, -1.6918792724609375, -1.638458251953125, -1.5850372314453125, -1.5316162109375, -1.4781951904296875, -1.424774169921875, -1.3713531494140625, -1.31793212890625, -1.2645111083984375, -1.211090087890625, -1.1576690673828125, -1.104248046875, -1.0508270263671875, -0.997406005859375, -0.9439849853515625, -0.89056396484375, -0.8371429443359375, -0.783721923828125, -0.7303009033203125, -0.6768798828125, -0.6234588623046875, -0.570037841796875, -0.5166168212890625, -0.46319580078125, -0.4097747802734375, -0.356353759765625, -0.3029327392578125, -0.24951171875, -0.1960906982421875, -0.142669677734375, -0.0892486572265625, -0.03582763671875, 0.0175933837890625, 0.071014404296875, 0.1244354248046875, 0.1778564453125, 0.2312774658203125, 0.284698486328125, 0.3381195068359375, 0.39154052734375, 0.4449615478515625, 0.498382568359375, 0.5518035888671875, 0.605224609375, 0.6586456298828125, 0.712066650390625, 0.7654876708984375, 0.81890869140625, 0.8723297119140625, 0.925750732421875, 0.9791717529296875, 1.0325927734375, 1.0860137939453125, 1.139434814453125, 1.1928558349609375, 1.24627685546875, 1.2996978759765625, 1.353118896484375, 1.4065399169921875, 1.4599609375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 8.0, 20.0, 33.0, 106.0, 206.0, 255.0, 187.0, 93.0, 37.0, 22.0, 5.0, 8.0, 4.0, 9.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.511463165283203, -19.945589065551758, -19.379714965820312, -18.8138427734375, -18.247968673706055, -17.68209457397461, -17.116220474243164, -16.55034637451172, -15.984474182128906, -15.418600082397461, -14.852726936340332, -14.286852836608887, -13.720979690551758, -13.155105590820312, -12.589231491088867, -12.023358345031738, -11.457484245300293, -10.891610145568848, -10.325736999511719, -9.759862899780273, -9.193989753723145, -8.6281156539917, -8.06224250793457, -7.496368408203125, -6.930494785308838, -6.364621162414551, -5.798747539520264, -5.232873916625977, -4.666999816894531, -4.101126670837402, -3.535252571105957, -2.96937894821167, -2.403505325317383, -1.8376317024230957, -1.271757960319519, -0.7058842182159424, -0.14001059532165527, 0.42586302757263184, 0.991736888885498, 1.5576105117797852, 2.1234841346740723, 2.6893577575683594, 3.2552313804626465, 3.8211052417755127, 4.386979103088379, 4.952852249145508, 5.518726348876953, 6.08459997177124, 6.650473594665527, 7.2163472175598145, 7.782220840454102, 8.348094940185547, 8.913968086242676, 9.479842185974121, 10.04571533203125, 10.611589431762695, 11.17746353149414, 11.743337631225586, 12.309210777282715, 12.87508487701416, 13.440958023071289, 14.006832122802734, 14.57270622253418, 15.138579368591309, 15.704452514648438]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 5.0, 7.0, 7.0, 9.0, 13.0, 17.0, 25.0, 26.0, 29.0, 43.0, 49.0, 54.0, 58.0, 68.0, 73.0, 44.0, 65.0, 57.0, 61.0, 49.0, 55.0, 41.0, 33.0, 27.0, 33.0, 13.0, 16.0, 5.0, 9.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-10.97507095336914, -10.702346801757812, -10.4296236038208, -10.156900405883789, -9.884176254272461, -9.611452102661133, -9.338728904724121, -9.06600570678711, -8.793281555175781, -8.520557403564453, -8.247834205627441, -7.9751105308532715, -7.702386856079102, -7.429663181304932, -7.156939506530762, -6.884215831756592, -6.611492156982422, -6.338768482208252, -6.066044807434082, -5.793321132659912, -5.520597457885742, -5.247873783111572, -4.975150108337402, -4.702426433563232, -4.4297027587890625, -4.156979084014893, -3.8842554092407227, -3.6115317344665527, -3.338808059692383, -3.066084384918213, -2.793360710144043, -2.520637035369873, -2.2479124069213867, -1.9751887321472168, -1.7024650573730469, -1.429741382598877, -1.157017707824707, -0.8842940330505371, -0.6115703582763672, -0.33884668350219727, -0.06612300872802734, 0.20660066604614258, 0.4793243408203125, 0.7520480155944824, 1.0247716903686523, 1.2974953651428223, 1.5702190399169922, 1.842942714691162, 2.115666389465332, 2.388390064239502, 2.661113739013672, 2.933837413787842, 3.2065610885620117, 3.4792847633361816, 3.7520084381103516, 4.0247321128845215, 4.297455787658691, 4.570179462432861, 4.842903137207031, 5.115626811981201, 5.388350486755371, 5.661074161529541, 5.933797836303711, 6.206521511077881, 6.479245185852051]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 15.0, 10.0, 18.0, 16.0, 37.0, 72.0, 102.0, 179.0, 282.0, 548.0, 972.0, 1831.0, 3556.0, 7507.0, 16546.0, 39832.0, 97100.0, 224158.0, 319042.0, 194028.0, 81706.0, 33418.0, 14379.0, 6529.0, 3095.0, 1550.0, 895.0, 474.0, 277.0, 150.0, 91.0, 48.0, 26.0, 19.0, 15.0, 11.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.0791015625, -1.04473876953125, -1.0103759765625, -0.97601318359375, -0.941650390625, -0.90728759765625, -0.8729248046875, -0.83856201171875, -0.80419921875, -0.76983642578125, -0.7354736328125, -0.70111083984375, -0.666748046875, -0.63238525390625, -0.5980224609375, -0.56365966796875, -0.529296875, -0.49493408203125, -0.4605712890625, -0.42620849609375, -0.391845703125, -0.35748291015625, -0.3231201171875, -0.28875732421875, -0.25439453125, -0.22003173828125, -0.1856689453125, -0.15130615234375, -0.116943359375, -0.08258056640625, -0.0482177734375, -0.01385498046875, 0.0205078125, 0.05487060546875, 0.0892333984375, 0.12359619140625, 0.157958984375, 0.19232177734375, 0.2266845703125, 0.26104736328125, 0.29541015625, 0.32977294921875, 0.3641357421875, 0.39849853515625, 0.432861328125, 0.46722412109375, 0.5015869140625, 0.53594970703125, 0.5703125, 0.60467529296875, 0.6390380859375, 0.67340087890625, 0.707763671875, 0.74212646484375, 0.7764892578125, 0.81085205078125, 0.84521484375, 0.87957763671875, 0.9139404296875, 0.94830322265625, 0.982666015625, 1.01702880859375, 1.0513916015625, 1.08575439453125, 1.1201171875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 2.0, 9.0, 8.0, 10.0, 22.0, 19.0, 20.0, 23.0, 30.0, 31.0, 43.0, 45.0, 29.0, 41.0, 64.0, 44.0, 67.0, 46.0, 61.0, 43.0, 42.0, 37.0, 50.0, 43.0, 34.0, 20.0, 32.0, 15.0, 11.0, 12.0, 10.0, 13.0, 7.0, 3.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5615234375, -0.5419845581054688, -0.5224456787109375, -0.5029067993164062, -0.483367919921875, -0.46382904052734375, -0.4442901611328125, -0.42475128173828125, -0.40521240234375, -0.38567352294921875, -0.3661346435546875, -0.34659576416015625, -0.327056884765625, -0.30751800537109375, -0.2879791259765625, -0.26844024658203125, -0.2489013671875, -0.22936248779296875, -0.2098236083984375, -0.19028472900390625, -0.170745849609375, -0.15120697021484375, -0.1316680908203125, -0.11212921142578125, -0.09259033203125, -0.07305145263671875, -0.0535125732421875, -0.03397369384765625, -0.014434814453125, 0.00510406494140625, 0.0246429443359375, 0.04418182373046875, 0.063720703125, 0.08325958251953125, 0.1027984619140625, 0.12233734130859375, 0.141876220703125, 0.16141510009765625, 0.1809539794921875, 0.20049285888671875, 0.22003173828125, 0.23957061767578125, 0.2591094970703125, 0.27864837646484375, 0.298187255859375, 0.31772613525390625, 0.3372650146484375, 0.35680389404296875, 0.3763427734375, 0.39588165283203125, 0.4154205322265625, 0.43495941162109375, 0.454498291015625, 0.47403717041015625, 0.4935760498046875, 0.5131149291992188, 0.53265380859375, 0.5521926879882812, 0.5717315673828125, 0.5912704467773438, 0.610809326171875, 0.6303482055664062, 0.6498870849609375, 0.6694259643554688, 0.68896484375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 0.0, 7.0, 6.0, 11.0, 11.0, 23.0, 25.0, 34.0, 47.0, 87.0, 130.0, 231.0, 330.0, 692.0, 1330.0, 3303.0, 11159.0, 56850.0, 386073.0, 500787.0, 67930.0, 12789.0, 3620.0, 1365.0, 713.0, 381.0, 224.0, 132.0, 70.0, 57.0, 30.0, 35.0, 25.0, 18.0, 9.0, 6.0, 2.0, 2.0, 5.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.3125, -2.242523193359375, -2.17254638671875, -2.102569580078125, -2.0325927734375, -1.962615966796875, -1.89263916015625, -1.822662353515625, -1.752685546875, -1.682708740234375, -1.61273193359375, -1.542755126953125, -1.4727783203125, -1.402801513671875, -1.33282470703125, -1.262847900390625, -1.19287109375, -1.122894287109375, -1.05291748046875, -0.982940673828125, -0.9129638671875, -0.842987060546875, -0.77301025390625, -0.703033447265625, -0.633056640625, -0.563079833984375, -0.49310302734375, -0.423126220703125, -0.3531494140625, -0.283172607421875, -0.21319580078125, -0.143218994140625, -0.0732421875, -0.003265380859375, 0.06671142578125, 0.136688232421875, 0.2066650390625, 0.276641845703125, 0.34661865234375, 0.416595458984375, 0.486572265625, 0.556549072265625, 0.62652587890625, 0.696502685546875, 0.7664794921875, 0.836456298828125, 0.90643310546875, 0.976409912109375, 1.04638671875, 1.116363525390625, 1.18634033203125, 1.256317138671875, 1.3262939453125, 1.396270751953125, 1.46624755859375, 1.536224365234375, 1.606201171875, 1.676177978515625, 1.74615478515625, 1.816131591796875, 1.8861083984375, 1.956085205078125, 2.02606201171875, 2.096038818359375, 2.166015625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 2.0, 6.0, 5.0, 8.0, 11.0, 10.0, 15.0, 18.0, 14.0, 18.0, 30.0, 20.0, 36.0, 26.0, 34.0, 40.0, 49.0, 47.0, 59.0, 46.0, 57.0, 52.0, 52.0, 52.0, 49.0, 46.0, 29.0, 32.0, 24.0, 19.0, 23.0, 20.0, 10.0, 13.0, 7.0, 8.0, 9.0, 1.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.162109375, -2.086944580078125, -2.01177978515625, -1.936614990234375, -1.8614501953125, -1.786285400390625, -1.71112060546875, -1.635955810546875, -1.560791015625, -1.485626220703125, -1.41046142578125, -1.335296630859375, -1.2601318359375, -1.184967041015625, -1.10980224609375, -1.034637451171875, -0.95947265625, -0.884307861328125, -0.80914306640625, -0.733978271484375, -0.6588134765625, -0.583648681640625, -0.50848388671875, -0.433319091796875, -0.358154296875, -0.282989501953125, -0.20782470703125, -0.132659912109375, -0.0574951171875, 0.017669677734375, 0.09283447265625, 0.167999267578125, 0.2431640625, 0.318328857421875, 0.39349365234375, 0.468658447265625, 0.5438232421875, 0.618988037109375, 0.69415283203125, 0.769317626953125, 0.844482421875, 0.919647216796875, 0.99481201171875, 1.069976806640625, 1.1451416015625, 1.220306396484375, 1.29547119140625, 1.370635986328125, 1.44580078125, 1.520965576171875, 1.59613037109375, 1.671295166015625, 1.7464599609375, 1.821624755859375, 1.89678955078125, 1.971954345703125, 2.047119140625, 2.122283935546875, 2.19744873046875, 2.272613525390625, 2.3477783203125, 2.422943115234375, 2.49810791015625, 2.573272705078125, 2.6484375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 11.0, 6.0, 4.0, 9.0, 22.0, 33.0, 54.0, 84.0, 195.0, 392.0, 1119.0, 4001.0, 26140.0, 404726.0, 572790.0, 32325.0, 4476.0, 1196.0, 481.0, 206.0, 112.0, 60.0, 38.0, 27.0, 14.0, 14.0, 8.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.423828125, -1.3853912353515625, -1.346954345703125, -1.3085174560546875, -1.27008056640625, -1.2316436767578125, -1.193206787109375, -1.1547698974609375, -1.1163330078125, -1.0778961181640625, -1.039459228515625, -1.0010223388671875, -0.96258544921875, -0.9241485595703125, -0.885711669921875, -0.8472747802734375, -0.808837890625, -0.7704010009765625, -0.731964111328125, -0.6935272216796875, -0.65509033203125, -0.6166534423828125, -0.578216552734375, -0.5397796630859375, -0.5013427734375, -0.4629058837890625, -0.424468994140625, -0.3860321044921875, -0.34759521484375, -0.3091583251953125, -0.270721435546875, -0.2322845458984375, -0.19384765625, -0.1554107666015625, -0.116973876953125, -0.0785369873046875, -0.04010009765625, -0.0016632080078125, 0.036773681640625, 0.0752105712890625, 0.1136474609375, 0.1520843505859375, 0.190521240234375, 0.2289581298828125, 0.26739501953125, 0.3058319091796875, 0.344268798828125, 0.3827056884765625, 0.421142578125, 0.4595794677734375, 0.498016357421875, 0.5364532470703125, 0.57489013671875, 0.6133270263671875, 0.651763916015625, 0.6902008056640625, 0.7286376953125, 0.7670745849609375, 0.805511474609375, 0.8439483642578125, 0.88238525390625, 0.9208221435546875, 0.959259033203125, 0.9976959228515625, 1.0361328125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 3.0, 2.0, 6.0, 5.0, 3.0, 10.0, 11.0, 22.0, 20.0, 30.0, 38.0, 55.0, 74.0, 107.0, 147.0, 121.0, 99.0, 90.0, 49.0, 32.0, 23.0, 17.0, 11.0, 12.0, 7.0, 6.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00024509429931640625, -0.00023714080452919006, -0.00022918730974197388, -0.0002212338149547577, -0.0002132803201675415, -0.00020532682538032532, -0.00019737333059310913, -0.00018941983580589294, -0.00018146634101867676, -0.00017351284623146057, -0.00016555935144424438, -0.0001576058566570282, -0.000149652361869812, -0.00014169886708259583, -0.00013374537229537964, -0.00012579187750816345, -0.00011783838272094727, -0.00010988488793373108, -0.00010193139314651489, -9.39778983592987e-05, -8.602440357208252e-05, -7.807090878486633e-05, -7.011741399765015e-05, -6.216391921043396e-05, -5.4210424423217773e-05, -4.625692963600159e-05, -3.83034348487854e-05, -3.0349940061569214e-05, -2.2396445274353027e-05, -1.444295048713684e-05, -6.489455699920654e-06, 1.4640390872955322e-06, 9.417533874511719e-06, 1.7371028661727905e-05, 2.5324523448944092e-05, 3.327801823616028e-05, 4.1231513023376465e-05, 4.918500781059265e-05, 5.713850259780884e-05, 6.509199738502502e-05, 7.304549217224121e-05, 8.09989869594574e-05, 8.895248174667358e-05, 9.690597653388977e-05, 0.00010485947132110596, 0.00011281296610832214, 0.00012076646089553833, 0.00012871995568275452, 0.0001366734504699707, 0.0001446269452571869, 0.00015258044004440308, 0.00016053393483161926, 0.00016848742961883545, 0.00017644092440605164, 0.00018439441919326782, 0.000192347913980484, 0.0002003014087677002, 0.00020825490355491638, 0.00021620839834213257, 0.00022416189312934875, 0.00023211538791656494, 0.00024006888270378113, 0.0002480223774909973, 0.0002559758722782135, 0.0002639293670654297]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 2.0, 1.0, 8.0, 8.0, 10.0, 11.0, 11.0, 26.0, 26.0, 43.0, 56.0, 105.0, 145.0, 225.0, 362.0, 857.0, 1769.0, 4940.0, 17177.0, 89947.0, 563272.0, 304078.0, 48503.0, 10607.0, 3419.0, 1382.0, 615.0, 383.0, 223.0, 123.0, 63.0, 59.0, 28.0, 26.0, 17.0, 12.0, 5.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.76513671875, -0.7418289184570312, -0.7185211181640625, -0.6952133178710938, -0.671905517578125, -0.6485977172851562, -0.6252899169921875, -0.6019821166992188, -0.57867431640625, -0.5553665161132812, -0.5320587158203125, -0.5087509155273438, -0.485443115234375, -0.46213531494140625, -0.4388275146484375, -0.41551971435546875, -0.3922119140625, -0.36890411376953125, -0.3455963134765625, -0.32228851318359375, -0.298980712890625, -0.27567291259765625, -0.2523651123046875, -0.22905731201171875, -0.20574951171875, -0.18244171142578125, -0.1591339111328125, -0.13582611083984375, -0.112518310546875, -0.08921051025390625, -0.0659027099609375, -0.04259490966796875, -0.019287109375, 0.00402069091796875, 0.0273284912109375, 0.05063629150390625, 0.073944091796875, 0.09725189208984375, 0.1205596923828125, 0.14386749267578125, 0.16717529296875, 0.19048309326171875, 0.2137908935546875, 0.23709869384765625, 0.260406494140625, 0.28371429443359375, 0.3070220947265625, 0.33032989501953125, 0.3536376953125, 0.37694549560546875, 0.4002532958984375, 0.42356109619140625, 0.446868896484375, 0.47017669677734375, 0.4934844970703125, 0.5167922973632812, 0.54010009765625, 0.5634078979492188, 0.5867156982421875, 0.6100234985351562, 0.633331298828125, 0.6566390991210938, 0.6799468994140625, 0.7032546997070312, 0.7265625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 8.0, 9.0, 8.0, 5.0, 10.0, 22.0, 20.0, 29.0, 33.0, 42.0, 42.0, 61.0, 63.0, 64.0, 81.0, 82.0, 75.0, 59.0, 62.0, 57.0, 51.0, 33.0, 18.0, 15.0, 14.0, 7.0, 11.0, 5.0, 2.0, 4.0, 3.0, 0.0, 4.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.90380859375, -0.8791961669921875, -0.854583740234375, -0.8299713134765625, -0.80535888671875, -0.7807464599609375, -0.756134033203125, -0.7315216064453125, -0.7069091796875, -0.6822967529296875, -0.657684326171875, -0.6330718994140625, -0.60845947265625, -0.5838470458984375, -0.559234619140625, -0.5346221923828125, -0.510009765625, -0.4853973388671875, -0.460784912109375, -0.4361724853515625, -0.41156005859375, -0.3869476318359375, -0.362335205078125, -0.3377227783203125, -0.3131103515625, -0.2884979248046875, -0.263885498046875, -0.2392730712890625, -0.21466064453125, -0.1900482177734375, -0.165435791015625, -0.1408233642578125, -0.1162109375, -0.0915985107421875, -0.066986083984375, -0.0423736572265625, -0.01776123046875, 0.0068511962890625, 0.031463623046875, 0.0560760498046875, 0.0806884765625, 0.1053009033203125, 0.129913330078125, 0.1545257568359375, 0.17913818359375, 0.2037506103515625, 0.228363037109375, 0.2529754638671875, 0.277587890625, 0.3022003173828125, 0.326812744140625, 0.3514251708984375, 0.37603759765625, 0.4006500244140625, 0.425262451171875, 0.4498748779296875, 0.4744873046875, 0.4990997314453125, 0.523712158203125, 0.5483245849609375, 0.57293701171875, 0.5975494384765625, 0.622161865234375, 0.6467742919921875, 0.67138671875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 11.0, 20.0, 28.0, 68.0, 89.0, 136.0, 210.0, 173.0, 121.0, 70.0, 35.0, 19.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.06265640258789, -23.512418746948242, -22.962181091308594, -22.411943435668945, -21.861705780029297, -21.311466217041016, -20.76123046875, -20.21099090576172, -19.66075325012207, -19.110515594482422, -18.560277938842773, -18.010040283203125, -17.459802627563477, -16.909564971923828, -16.359325408935547, -15.809088706970215, -15.258851051330566, -14.708613395690918, -14.15837574005127, -13.608137130737305, -13.057899475097656, -12.507661819458008, -11.95742416381836, -11.407186508178711, -10.856948852539062, -10.306711196899414, -9.756473541259766, -9.206235885620117, -8.655997276306152, -8.105759620666504, -7.5555219650268555, -7.005284309387207, -6.455045700073242, -5.904808044433594, -5.354569911956787, -4.804332256317139, -4.254094123840332, -3.7038564682006836, -3.153618812561035, -2.6033809185028076, -2.05314302444458, -1.5029051303863525, -0.9526673555374146, -0.40242958068847656, 0.14780831336975098, 0.6980462074279785, 1.248283863067627, 1.7985217571258545, 2.348759651184082, 2.8989975452423096, 3.449235439300537, 3.9994730949401855, 4.549711227416992, 5.099948883056641, 5.650186538696289, 6.2004241943359375, 6.750662326812744, 7.300899982452393, 7.851138114929199, 8.401375770568848, 8.951613426208496, 9.501852035522461, 10.05208969116211, 10.602327346801758, 11.152565002441406]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 1.0, 5.0, 11.0, 8.0, 11.0, 9.0, 19.0, 18.0, 21.0, 20.0, 26.0, 33.0, 30.0, 28.0, 44.0, 49.0, 47.0, 60.0, 74.0, 71.0, 53.0, 49.0, 44.0, 31.0, 37.0, 29.0, 27.0, 24.0, 23.0, 18.0, 19.0, 16.0, 16.0, 3.0, 9.0, 9.0, 0.0, 5.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.196157455444336, -8.872919082641602, -8.549680709838867, -8.226442337036133, -7.90320348739624, -7.579965114593506, -7.256726264953613, -6.933487892150879, -6.6102495193481445, -6.28701114654541, -5.963772773742676, -5.640533924102783, -5.317295551300049, -4.9940571784973145, -4.670818328857422, -4.3475799560546875, -4.024341583251953, -3.7011032104492188, -3.3778645992279053, -3.054625988006592, -2.7313876152038574, -2.408149242401123, -2.0849106311798096, -1.761672019958496, -1.4384336471557617, -1.1151951551437378, -0.7919566631317139, -0.46871817111968994, -0.14547967910766602, 0.1777588129043579, 0.5009973049163818, 0.8242359161376953, 1.1474733352661133, 1.4707118272781372, 1.7939503192901611, 2.1171889305114746, 2.440427303314209, 2.7636656761169434, 3.086904287338257, 3.4101428985595703, 3.7333812713623047, 4.056619644165039, 4.379858016967773, 4.703096866607666, 5.0263352394104, 5.349573612213135, 5.672812461853027, 5.996050834655762, 6.319289207458496, 6.6425275802612305, 6.965765953063965, 7.289004802703857, 7.612243175506592, 7.935481548309326, 8.258720397949219, 8.581958770751953, 8.905197143554688, 9.228435516357422, 9.551673889160156, 9.87491226196289, 10.198150634765625, 10.521389961242676, 10.84462833404541, 11.167866706848145, 11.491105079650879]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 5.0, 10.0, 5.0, 8.0, 26.0, 20.0, 55.0, 67.0, 118.0, 207.0, 378.0, 685.0, 1303.0, 2768.0, 6139.0, 15233.0, 44501.0, 174596.0, 1136800.0, 2258958.0, 428667.0, 81422.0, 24579.0, 9544.0, 3986.0, 1906.0, 963.0, 517.0, 291.0, 177.0, 100.0, 80.0, 55.0, 25.0, 23.0, 15.0, 15.0, 9.0, 8.0, 8.0, 4.0, 6.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64990234375, -0.6260528564453125, -0.602203369140625, -0.5783538818359375, -0.55450439453125, -0.5306549072265625, -0.506805419921875, -0.4829559326171875, -0.4591064453125, -0.4352569580078125, -0.411407470703125, -0.3875579833984375, -0.36370849609375, -0.3398590087890625, -0.316009521484375, -0.2921600341796875, -0.268310546875, -0.2444610595703125, -0.220611572265625, -0.1967620849609375, -0.17291259765625, -0.1490631103515625, -0.125213623046875, -0.1013641357421875, -0.0775146484375, -0.0536651611328125, -0.029815673828125, -0.0059661865234375, 0.01788330078125, 0.0417327880859375, 0.065582275390625, 0.0894317626953125, 0.11328125, 0.1371307373046875, 0.160980224609375, 0.1848297119140625, 0.20867919921875, 0.2325286865234375, 0.256378173828125, 0.2802276611328125, 0.3040771484375, 0.3279266357421875, 0.351776123046875, 0.3756256103515625, 0.39947509765625, 0.4233245849609375, 0.447174072265625, 0.4710235595703125, 0.494873046875, 0.5187225341796875, 0.542572021484375, 0.5664215087890625, 0.59027099609375, 0.6141204833984375, 0.637969970703125, 0.6618194580078125, 0.6856689453125, 0.7095184326171875, 0.733367919921875, 0.7572174072265625, 0.78106689453125, 0.8049163818359375, 0.828765869140625, 0.8526153564453125, 0.87646484375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 5.0, 7.0, 6.0, 10.0, 13.0, 9.0, 14.0, 15.0, 31.0, 21.0, 34.0, 51.0, 57.0, 40.0, 44.0, 48.0, 59.0, 53.0, 56.0, 44.0, 44.0, 43.0, 43.0, 46.0, 35.0, 32.0, 29.0, 22.0, 30.0, 17.0, 8.0, 12.0, 10.0, 7.0, 2.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45458984375, -0.43566131591796875, -0.4167327880859375, -0.39780426025390625, -0.378875732421875, -0.35994720458984375, -0.3410186767578125, -0.32209014892578125, -0.30316162109375, -0.28423309326171875, -0.2653045654296875, -0.24637603759765625, -0.227447509765625, -0.20851898193359375, -0.1895904541015625, -0.17066192626953125, -0.1517333984375, -0.13280487060546875, -0.1138763427734375, -0.09494781494140625, -0.076019287109375, -0.05709075927734375, -0.0381622314453125, -0.01923370361328125, -0.00030517578125, 0.01862335205078125, 0.0375518798828125, 0.05648040771484375, 0.075408935546875, 0.09433746337890625, 0.1132659912109375, 0.13219451904296875, 0.151123046875, 0.17005157470703125, 0.1889801025390625, 0.20790863037109375, 0.226837158203125, 0.24576568603515625, 0.2646942138671875, 0.28362274169921875, 0.30255126953125, 0.32147979736328125, 0.3404083251953125, 0.35933685302734375, 0.378265380859375, 0.39719390869140625, 0.4161224365234375, 0.43505096435546875, 0.4539794921875, 0.47290802001953125, 0.4918365478515625, 0.5107650756835938, 0.529693603515625, 0.5486221313476562, 0.5675506591796875, 0.5864791870117188, 0.60540771484375, 0.6243362426757812, 0.6432647705078125, 0.6621932983398438, 0.681121826171875, 0.7000503540039062, 0.7189788818359375, 0.7379074096679688, 0.7568359375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 5.0, 9.0, 8.0, 16.0, 18.0, 27.0, 37.0, 47.0, 80.0, 80.0, 141.0, 227.0, 442.0, 815.0, 1861.0, 4743.0, 14322.0, 56069.0, 385028.0, 3277127.0, 375236.0, 55818.0, 14281.0, 4440.0, 1652.0, 722.0, 369.0, 217.0, 132.0, 87.0, 78.0, 39.0, 36.0, 19.0, 24.0, 9.0, 6.0, 3.0, 5.0, 8.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2880859375, -1.244415283203125, -1.20074462890625, -1.157073974609375, -1.1134033203125, -1.069732666015625, -1.02606201171875, -0.982391357421875, -0.938720703125, -0.895050048828125, -0.85137939453125, -0.807708740234375, -0.7640380859375, -0.720367431640625, -0.67669677734375, -0.633026123046875, -0.58935546875, -0.545684814453125, -0.50201416015625, -0.458343505859375, -0.4146728515625, -0.371002197265625, -0.32733154296875, -0.283660888671875, -0.239990234375, -0.196319580078125, -0.15264892578125, -0.108978271484375, -0.0653076171875, -0.021636962890625, 0.02203369140625, 0.065704345703125, 0.109375, 0.153045654296875, 0.19671630859375, 0.240386962890625, 0.2840576171875, 0.327728271484375, 0.37139892578125, 0.415069580078125, 0.458740234375, 0.502410888671875, 0.54608154296875, 0.589752197265625, 0.6334228515625, 0.677093505859375, 0.72076416015625, 0.764434814453125, 0.80810546875, 0.851776123046875, 0.89544677734375, 0.939117431640625, 0.9827880859375, 1.026458740234375, 1.07012939453125, 1.113800048828125, 1.157470703125, 1.201141357421875, 1.24481201171875, 1.288482666015625, 1.3321533203125, 1.375823974609375, 1.41949462890625, 1.463165283203125, 1.5068359375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 4.0, 8.0, 3.0, 5.0, 4.0, 15.0, 12.0, 14.0, 24.0, 21.0, 29.0, 41.0, 68.0, 96.0, 155.0, 213.0, 409.0, 624.0, 750.0, 538.0, 377.0, 201.0, 119.0, 82.0, 58.0, 47.0, 43.0, 23.0, 16.0, 16.0, 11.0, 14.0, 7.0, 11.0, 4.0, 6.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.689453125, -1.64306640625, -1.5966796875, -1.55029296875, -1.50390625, -1.45751953125, -1.4111328125, -1.36474609375, -1.318359375, -1.27197265625, -1.2255859375, -1.17919921875, -1.1328125, -1.08642578125, -1.0400390625, -0.99365234375, -0.947265625, -0.90087890625, -0.8544921875, -0.80810546875, -0.76171875, -0.71533203125, -0.6689453125, -0.62255859375, -0.576171875, -0.52978515625, -0.4833984375, -0.43701171875, -0.390625, -0.34423828125, -0.2978515625, -0.25146484375, -0.205078125, -0.15869140625, -0.1123046875, -0.06591796875, -0.01953125, 0.02685546875, 0.0732421875, 0.11962890625, 0.166015625, 0.21240234375, 0.2587890625, 0.30517578125, 0.3515625, 0.39794921875, 0.4443359375, 0.49072265625, 0.537109375, 0.58349609375, 0.6298828125, 0.67626953125, 0.72265625, 0.76904296875, 0.8154296875, 0.86181640625, 0.908203125, 0.95458984375, 1.0009765625, 1.04736328125, 1.09375, 1.14013671875, 1.1865234375, 1.23291015625, 1.279296875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 1.0, 5.0, 12.0, 21.0, 28.0, 54.0, 100.0, 130.0, 182.0, 158.0, 113.0, 84.0, 41.0, 19.0, 15.0, 8.0, 5.0, 5.0, 6.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.191397666931152, -12.758180618286133, -12.324963569641113, -11.891746520996094, -11.458529472351074, -11.025312423706055, -10.592095375061035, -10.158878326416016, -9.725661277770996, -9.292444229125977, -8.859227180480957, -8.426010131835938, -7.992793083190918, -7.559576034545898, -7.126358985900879, -6.693141937255859, -6.25992488861084, -5.82670783996582, -5.393490791320801, -4.960273742675781, -4.527056694030762, -4.093839645385742, -3.6606225967407227, -3.227405548095703, -2.7941884994506836, -2.360971450805664, -1.9277544021606445, -1.494537353515625, -1.0613203048706055, -0.6281032562255859, -0.1948862075805664, 0.23833084106445312, 0.6715478897094727, 1.1047649383544922, 1.5379819869995117, 1.9711990356445312, 2.404416084289551, 2.8376331329345703, 3.27085018157959, 3.7040672302246094, 4.137284278869629, 4.570501327514648, 5.003718376159668, 5.4369354248046875, 5.870152473449707, 6.303369522094727, 6.736586570739746, 7.169803619384766, 7.603020668029785, 8.036237716674805, 8.469454765319824, 8.902671813964844, 9.335888862609863, 9.769105911254883, 10.202322959899902, 10.635540008544922, 11.068757057189941, 11.501974105834961, 11.93519115447998, 12.368408203125, 12.80162525177002, 13.234842300415039, 13.668059349060059, 14.101276397705078, 14.534493446350098]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 3.0, 6.0, 2.0, 13.0, 8.0, 7.0, 12.0, 10.0, 21.0, 17.0, 24.0, 28.0, 39.0, 38.0, 38.0, 38.0, 46.0, 38.0, 71.0, 58.0, 66.0, 47.0, 46.0, 44.0, 38.0, 35.0, 39.0, 30.0, 24.0, 24.0, 20.0, 15.0, 18.0, 15.0, 10.0, 3.0, 3.0, 2.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.024250030517578, -8.745893478393555, -8.467537879943848, -8.189181327819824, -7.910825252532959, -7.632469177246094, -7.3541131019592285, -7.075757026672363, -6.79740047454834, -6.519044399261475, -6.240688323974609, -5.962331771850586, -5.683975696563721, -5.4056196212768555, -5.12726354598999, -4.848907470703125, -4.57055139541626, -4.2921953201293945, -4.013839244842529, -3.735482931137085, -3.4571266174316406, -3.1787705421447754, -2.90041446685791, -2.622058391571045, -2.3437020778656006, -2.0653460025787354, -1.786989688873291, -1.5086336135864258, -1.230277419090271, -0.9519212245941162, -0.673565149307251, -0.3952089548110962, -0.1168527603149414, 0.161503404378891, 0.4398595690727234, 0.7182157039642334, 0.9965718984603882, 1.274928092956543, 1.5532841682434082, 1.831640362739563, 2.1099965572357178, 2.388352632522583, 2.6667089462280273, 2.9450650215148926, 3.223421096801758, 3.501777410507202, 3.7801334857940674, 4.058489799499512, 4.336845874786377, 4.615201950073242, 4.893558025360107, 5.171914100646973, 5.450270652770996, 5.728626728057861, 6.006982803344727, 6.285338878631592, 6.563694953918457, 6.842051029205322, 7.1204071044921875, 7.398763656616211, 7.677119731903076, 7.955475807189941, 8.233831405639648, 8.512187957763672, 8.790544509887695]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 5.0, 4.0, 4.0, 11.0, 8.0, 25.0, 37.0, 44.0, 62.0, 100.0, 163.0, 267.0, 453.0, 824.0, 1639.0, 3148.0, 6639.0, 13501.0, 28535.0, 59200.0, 115867.0, 198792.0, 242167.0, 179416.0, 100163.0, 50216.0, 24290.0, 11616.0, 5507.0, 2657.0, 1410.0, 731.0, 422.0, 222.0, 131.0, 92.0, 55.0, 45.0, 32.0, 19.0, 12.0, 7.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6943359375, -0.6698760986328125, -0.645416259765625, -0.6209564208984375, -0.59649658203125, -0.5720367431640625, -0.547576904296875, -0.5231170654296875, -0.4986572265625, -0.4741973876953125, -0.449737548828125, -0.4252777099609375, -0.40081787109375, -0.3763580322265625, -0.351898193359375, -0.3274383544921875, -0.302978515625, -0.2785186767578125, -0.254058837890625, -0.2295989990234375, -0.20513916015625, -0.1806793212890625, -0.156219482421875, -0.1317596435546875, -0.1072998046875, -0.0828399658203125, -0.058380126953125, -0.0339202880859375, -0.00946044921875, 0.0149993896484375, 0.039459228515625, 0.0639190673828125, 0.08837890625, 0.1128387451171875, 0.137298583984375, 0.1617584228515625, 0.18621826171875, 0.2106781005859375, 0.235137939453125, 0.2595977783203125, 0.2840576171875, 0.3085174560546875, 0.332977294921875, 0.3574371337890625, 0.38189697265625, 0.4063568115234375, 0.430816650390625, 0.4552764892578125, 0.479736328125, 0.5041961669921875, 0.528656005859375, 0.5531158447265625, 0.57757568359375, 0.6020355224609375, 0.626495361328125, 0.6509552001953125, 0.6754150390625, 0.6998748779296875, 0.724334716796875, 0.7487945556640625, 0.77325439453125, 0.7977142333984375, 0.822174072265625, 0.8466339111328125, 0.87109375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 7.0, 6.0, 7.0, 5.0, 15.0, 10.0, 19.0, 18.0, 27.0, 32.0, 19.0, 51.0, 49.0, 41.0, 50.0, 47.0, 51.0, 50.0, 63.0, 45.0, 38.0, 48.0, 43.0, 37.0, 26.0, 36.0, 39.0, 18.0, 28.0, 11.0, 12.0, 6.0, 15.0, 10.0, 8.0, 12.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5419921875, -0.524017333984375, -0.50604248046875, -0.488067626953125, -0.4700927734375, -0.452117919921875, -0.43414306640625, -0.416168212890625, -0.398193359375, -0.380218505859375, -0.36224365234375, -0.344268798828125, -0.3262939453125, -0.308319091796875, -0.29034423828125, -0.272369384765625, -0.25439453125, -0.236419677734375, -0.21844482421875, -0.200469970703125, -0.1824951171875, -0.164520263671875, -0.14654541015625, -0.128570556640625, -0.110595703125, -0.092620849609375, -0.07464599609375, -0.056671142578125, -0.0386962890625, -0.020721435546875, -0.00274658203125, 0.015228271484375, 0.033203125, 0.051177978515625, 0.06915283203125, 0.087127685546875, 0.1051025390625, 0.123077392578125, 0.14105224609375, 0.159027099609375, 0.177001953125, 0.194976806640625, 0.21295166015625, 0.230926513671875, 0.2489013671875, 0.266876220703125, 0.28485107421875, 0.302825927734375, 0.32080078125, 0.338775634765625, 0.35675048828125, 0.374725341796875, 0.3927001953125, 0.410675048828125, 0.42864990234375, 0.446624755859375, 0.464599609375, 0.482574462890625, 0.50054931640625, 0.518524169921875, 0.5364990234375, 0.554473876953125, 0.57244873046875, 0.590423583984375, 0.6083984375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 10.0, 7.0, 5.0, 12.0, 15.0, 22.0, 30.0, 42.0, 52.0, 71.0, 95.0, 160.0, 186.0, 280.0, 420.0, 653.0, 968.0, 1886.0, 4207.0, 13477.0, 69533.0, 512282.0, 364195.0, 59317.0, 12055.0, 3947.0, 1798.0, 955.0, 602.0, 353.0, 236.0, 223.0, 119.0, 100.0, 70.0, 38.0, 32.0, 24.0, 15.0, 13.0, 14.0, 12.0, 13.0, 4.0, 3.0, 6.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.62890625, -1.5684814453125, -1.508056640625, -1.4476318359375, -1.38720703125, -1.3267822265625, -1.266357421875, -1.2059326171875, -1.1455078125, -1.0850830078125, -1.024658203125, -0.9642333984375, -0.90380859375, -0.8433837890625, -0.782958984375, -0.7225341796875, -0.662109375, -0.6016845703125, -0.541259765625, -0.4808349609375, -0.42041015625, -0.3599853515625, -0.299560546875, -0.2391357421875, -0.1787109375, -0.1182861328125, -0.057861328125, 0.0025634765625, 0.06298828125, 0.1234130859375, 0.183837890625, 0.2442626953125, 0.3046875, 0.3651123046875, 0.425537109375, 0.4859619140625, 0.54638671875, 0.6068115234375, 0.667236328125, 0.7276611328125, 0.7880859375, 0.8485107421875, 0.908935546875, 0.9693603515625, 1.02978515625, 1.0902099609375, 1.150634765625, 1.2110595703125, 1.271484375, 1.3319091796875, 1.392333984375, 1.4527587890625, 1.51318359375, 1.5736083984375, 1.634033203125, 1.6944580078125, 1.7548828125, 1.8153076171875, 1.875732421875, 1.9361572265625, 1.99658203125, 2.0570068359375, 2.117431640625, 2.1778564453125, 2.23828125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 3.0, 3.0, 12.0, 11.0, 17.0, 14.0, 23.0, 26.0, 30.0, 29.0, 45.0, 58.0, 40.0, 57.0, 59.0, 51.0, 58.0, 51.0, 47.0, 64.0, 55.0, 47.0, 39.0, 33.0, 27.0, 21.0, 20.0, 18.0, 11.0, 8.0, 2.0, 6.0, 4.0, 4.0, 7.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.060546875, -1.968658447265625, -1.87677001953125, -1.784881591796875, -1.6929931640625, -1.601104736328125, -1.50921630859375, -1.417327880859375, -1.325439453125, -1.233551025390625, -1.14166259765625, -1.049774169921875, -0.9578857421875, -0.865997314453125, -0.77410888671875, -0.682220458984375, -0.59033203125, -0.498443603515625, -0.40655517578125, -0.314666748046875, -0.2227783203125, -0.130889892578125, -0.03900146484375, 0.052886962890625, 0.144775390625, 0.236663818359375, 0.32855224609375, 0.420440673828125, 0.5123291015625, 0.604217529296875, 0.69610595703125, 0.787994384765625, 0.8798828125, 0.971771240234375, 1.06365966796875, 1.155548095703125, 1.2474365234375, 1.339324951171875, 1.43121337890625, 1.523101806640625, 1.614990234375, 1.706878662109375, 1.79876708984375, 1.890655517578125, 1.9825439453125, 2.074432373046875, 2.16632080078125, 2.258209228515625, 2.35009765625, 2.441986083984375, 2.53387451171875, 2.625762939453125, 2.7176513671875, 2.809539794921875, 2.90142822265625, 2.993316650390625, 3.085205078125, 3.177093505859375, 3.26898193359375, 3.360870361328125, 3.4527587890625, 3.544647216796875, 3.63653564453125, 3.728424072265625, 3.8203125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 9.0, 19.0, 35.0, 59.0, 83.0, 141.0, 293.0, 473.0, 1036.0, 2098.0, 4999.0, 15111.0, 139286.0, 840623.0, 30437.0, 7827.0, 3065.0, 1407.0, 717.0, 345.0, 215.0, 117.0, 72.0, 37.0, 24.0, 13.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.81640625, -1.756317138671875, -1.69622802734375, -1.636138916015625, -1.5760498046875, -1.515960693359375, -1.45587158203125, -1.395782470703125, -1.335693359375, -1.275604248046875, -1.21551513671875, -1.155426025390625, -1.0953369140625, -1.035247802734375, -0.97515869140625, -0.915069580078125, -0.85498046875, -0.794891357421875, -0.73480224609375, -0.674713134765625, -0.6146240234375, -0.554534912109375, -0.49444580078125, -0.434356689453125, -0.374267578125, -0.314178466796875, -0.25408935546875, -0.194000244140625, -0.1339111328125, -0.073822021484375, -0.01373291015625, 0.046356201171875, 0.1064453125, 0.166534423828125, 0.22662353515625, 0.286712646484375, 0.3468017578125, 0.406890869140625, 0.46697998046875, 0.527069091796875, 0.587158203125, 0.647247314453125, 0.70733642578125, 0.767425537109375, 0.8275146484375, 0.887603759765625, 0.94769287109375, 1.007781982421875, 1.06787109375, 1.127960205078125, 1.18804931640625, 1.248138427734375, 1.3082275390625, 1.368316650390625, 1.42840576171875, 1.488494873046875, 1.548583984375, 1.608673095703125, 1.66876220703125, 1.728851318359375, 1.7889404296875, 1.849029541015625, 1.90911865234375, 1.969207763671875, 2.029296875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 9.0, 14.0, 22.0, 94.0, 440.0, 325.0, 40.0, 21.0, 15.0, 8.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0014066696166992188, -0.001362532377243042, -0.0013183951377868652, -0.0012742578983306885, -0.0012301206588745117, -0.001185983419418335, -0.0011418461799621582, -0.0010977089405059814, -0.0010535717010498047, -0.001009434461593628, -0.0009652972221374512, -0.0009211599826812744, -0.0008770227432250977, -0.0008328855037689209, -0.0007887482643127441, -0.0007446110248565674, -0.0007004737854003906, -0.0006563365459442139, -0.0006121993064880371, -0.0005680620670318604, -0.0005239248275756836, -0.00047978758811950684, -0.0004356503486633301, -0.0003915131092071533, -0.00034737586975097656, -0.0003032386302947998, -0.00025910139083862305, -0.0002149641513824463, -0.00017082691192626953, -0.00012668967247009277, -8.255243301391602e-05, -3.841519355773926e-05, 5.7220458984375e-06, 4.985928535461426e-05, 9.399652481079102e-05, 0.00013813376426696777, 0.00018227100372314453, 0.0002264082431793213, 0.00027054548263549805, 0.0003146827220916748, 0.00035881996154785156, 0.0004029572010040283, 0.0004470944404602051, 0.0004912316799163818, 0.0005353689193725586, 0.0005795061588287354, 0.0006236433982849121, 0.0006677806377410889, 0.0007119178771972656, 0.0007560551166534424, 0.0008001923561096191, 0.0008443295955657959, 0.0008884668350219727, 0.0009326040744781494, 0.0009767413139343262, 0.001020878553390503, 0.0010650157928466797, 0.0011091530323028564, 0.0011532902717590332, 0.00119742751121521, 0.0012415647506713867, 0.0012857019901275635, 0.0013298392295837402, 0.001373976469039917, 0.0014181137084960938]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 3.0, 2.0, 11.0, 10.0, 13.0, 19.0, 23.0, 36.0, 82.0, 99.0, 166.0, 251.0, 465.0, 856.0, 1601.0, 3260.0, 7605.0, 21834.0, 235502.0, 726519.0, 31927.0, 9853.0, 4098.0, 1870.0, 1001.0, 565.0, 315.0, 177.0, 125.0, 70.0, 68.0, 36.0, 34.0, 13.0, 13.0, 9.0, 7.0, 4.0, 4.0, 0.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.529296875, -1.4844970703125, -1.439697265625, -1.3948974609375, -1.35009765625, -1.3052978515625, -1.260498046875, -1.2156982421875, -1.1708984375, -1.1260986328125, -1.081298828125, -1.0364990234375, -0.99169921875, -0.9468994140625, -0.902099609375, -0.8572998046875, -0.8125, -0.7677001953125, -0.722900390625, -0.6781005859375, -0.63330078125, -0.5885009765625, -0.543701171875, -0.4989013671875, -0.4541015625, -0.4093017578125, -0.364501953125, -0.3197021484375, -0.27490234375, -0.2301025390625, -0.185302734375, -0.1405029296875, -0.095703125, -0.0509033203125, -0.006103515625, 0.0386962890625, 0.08349609375, 0.1282958984375, 0.173095703125, 0.2178955078125, 0.2626953125, 0.3074951171875, 0.352294921875, 0.3970947265625, 0.44189453125, 0.4866943359375, 0.531494140625, 0.5762939453125, 0.62109375, 0.6658935546875, 0.710693359375, 0.7554931640625, 0.80029296875, 0.8450927734375, 0.889892578125, 0.9346923828125, 0.9794921875, 1.0242919921875, 1.069091796875, 1.1138916015625, 1.15869140625, 1.2034912109375, 1.248291015625, 1.2930908203125, 1.337890625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 1.0, 9.0, 6.0, 10.0, 14.0, 20.0, 25.0, 38.0, 35.0, 57.0, 85.0, 100.0, 117.0, 109.0, 101.0, 65.0, 41.0, 37.0, 32.0, 16.0, 17.0, 9.0, 12.0, 4.0, 4.0, 5.0, 7.0, 3.0, 1.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2783203125, -1.2392730712890625, -1.200225830078125, -1.1611785888671875, -1.12213134765625, -1.0830841064453125, -1.044036865234375, -1.0049896240234375, -0.9659423828125, -0.9268951416015625, -0.887847900390625, -0.8488006591796875, -0.80975341796875, -0.7707061767578125, -0.731658935546875, -0.6926116943359375, -0.653564453125, -0.6145172119140625, -0.575469970703125, -0.5364227294921875, -0.49737548828125, -0.4583282470703125, -0.419281005859375, -0.3802337646484375, -0.3411865234375, -0.3021392822265625, -0.263092041015625, -0.2240447998046875, -0.18499755859375, -0.1459503173828125, -0.106903076171875, -0.0678558349609375, -0.02880859375, 0.0102386474609375, 0.049285888671875, 0.0883331298828125, 0.12738037109375, 0.1664276123046875, 0.205474853515625, 0.2445220947265625, 0.2835693359375, 0.3226165771484375, 0.361663818359375, 0.4007110595703125, 0.43975830078125, 0.4788055419921875, 0.517852783203125, 0.5569000244140625, 0.595947265625, 0.6349945068359375, 0.674041748046875, 0.7130889892578125, 0.75213623046875, 0.7911834716796875, 0.830230712890625, 0.8692779541015625, 0.9083251953125, 0.9473724365234375, 0.986419677734375, 1.0254669189453125, 1.06451416015625, 1.1035614013671875, 1.142608642578125, 1.1816558837890625, 1.220703125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 6.0, 9.0, 6.0, 10.0, 19.0, 24.0, 37.0, 44.0, 71.0, 107.0, 223.0, 183.0, 107.0, 72.0, 35.0, 13.0, 14.0, 5.0, 7.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.703315734863281, -14.059226036071777, -13.41513729095459, -12.771047592163086, -12.126957893371582, -11.482868194580078, -10.83877944946289, -10.194689750671387, -9.550600051879883, -8.906510353088379, -8.262421607971191, -7.6183319091796875, -6.974242210388184, -6.330152988433838, -5.686063766479492, -5.041974067687988, -4.397885322570801, -3.753795862197876, -3.109706401824951, -2.4656171798706055, -1.8215277194976807, -1.1774382591247559, -0.5333490371704102, 0.11074066162109375, 0.7548298835754395, 1.3989193439483643, 2.043008804321289, 2.6870980262756348, 3.3311874866485596, 3.9752769470214844, 4.61936616897583, 5.263455867767334, 5.90754508972168, 6.551634311676025, 7.195724010467529, 7.839813232421875, 8.483902931213379, 9.127992630004883, 9.77208137512207, 10.416171073913574, 11.060260772705078, 11.704350471496582, 12.34843921661377, 12.992528915405273, 13.636618614196777, 14.280708312988281, 14.924797058105469, 15.568886756896973, 16.212974548339844, 16.85706329345703, 17.50115394592285, 18.14524269104004, 18.789331436157227, 19.433422088623047, 20.077510833740234, 20.721599578857422, 21.365690231323242, 22.00977897644043, 22.65386962890625, 23.297958374023438, 23.942047119140625, 24.586137771606445, 25.230226516723633, 25.874317169189453, 26.51840591430664]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 2.0, 3.0, 6.0, 3.0, 4.0, 9.0, 17.0, 11.0, 23.0, 20.0, 27.0, 31.0, 35.0, 34.0, 37.0, 50.0, 56.0, 72.0, 79.0, 80.0, 48.0, 52.0, 39.0, 33.0, 33.0, 33.0, 28.0, 27.0, 20.0, 19.0, 9.0, 10.0, 11.0, 12.0, 7.0, 4.0, 3.0, 9.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-14.255025863647461, -13.868809700012207, -13.482592582702637, -13.096376419067383, -12.710159301757812, -12.323943138122559, -11.937726974487305, -11.551509857177734, -11.16529369354248, -10.779077529907227, -10.392860412597656, -10.006644248962402, -9.620427131652832, -9.234210968017578, -8.847993850708008, -8.461777687072754, -8.0755615234375, -7.689344882965088, -7.303128242492676, -6.916912078857422, -6.53069543838501, -6.144478797912598, -5.7582621574401855, -5.372045516967773, -4.985828399658203, -4.599611759185791, -4.213395118713379, -3.827178716659546, -3.440962314605713, -3.054745674133301, -2.6685290336608887, -2.2823126316070557, -1.8960962295532227, -1.5098797082901, -1.1236631870269775, -0.7374465465545654, -0.35123002529144287, 0.03498649597167969, 0.4212031364440918, 0.8074195384979248, 1.193636178970337, 1.5798527002334595, 1.966069221496582, 2.352285861968994, 2.7385025024414062, 3.1247189044952393, 3.5109355449676514, 3.8971519470214844, 4.2833685874938965, 4.669585227966309, 5.055801868438721, 5.442018508911133, 5.828234672546387, 6.214451313018799, 6.600667953491211, 6.986884117126465, 7.373101234436035, 7.759317874908447, 8.14553451538086, 8.531750679016113, 8.917967796325684, 9.304183959960938, 9.690401077270508, 10.076617240905762, 10.462833404541016]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 4.0, 5.0, 7.0, 8.0, 14.0, 11.0, 15.0, 27.0, 39.0, 35.0, 54.0, 86.0, 98.0, 189.0, 452.0, 1372.0, 7601.0, 72853.0, 2176094.0, 1859394.0, 64413.0, 8054.0, 2032.0, 745.0, 273.0, 131.0, 75.0, 56.0, 21.0, 27.0, 20.0, 29.0, 5.0, 11.0, 6.0, 11.0, 5.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.546875, -1.495269775390625, -1.44366455078125, -1.392059326171875, -1.3404541015625, -1.288848876953125, -1.23724365234375, -1.185638427734375, -1.134033203125, -1.082427978515625, -1.03082275390625, -0.979217529296875, -0.9276123046875, -0.876007080078125, -0.82440185546875, -0.772796630859375, -0.72119140625, -0.669586181640625, -0.61798095703125, -0.566375732421875, -0.5147705078125, -0.463165283203125, -0.41156005859375, -0.359954833984375, -0.308349609375, -0.256744384765625, -0.20513916015625, -0.153533935546875, -0.1019287109375, -0.050323486328125, 0.00128173828125, 0.052886962890625, 0.1044921875, 0.156097412109375, 0.20770263671875, 0.259307861328125, 0.3109130859375, 0.362518310546875, 0.41412353515625, 0.465728759765625, 0.517333984375, 0.568939208984375, 0.62054443359375, 0.672149658203125, 0.7237548828125, 0.775360107421875, 0.82696533203125, 0.878570556640625, 0.93017578125, 0.981781005859375, 1.03338623046875, 1.084991455078125, 1.1365966796875, 1.188201904296875, 1.23980712890625, 1.291412353515625, 1.343017578125, 1.394622802734375, 1.44622802734375, 1.497833251953125, 1.5494384765625, 1.601043701171875, 1.65264892578125, 1.704254150390625, 1.755859375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 9.0, 12.0, 22.0, 37.0, 64.0, 74.0, 133.0, 120.0, 140.0, 121.0, 106.0, 63.0, 41.0, 35.0, 17.0, 8.0, 6.0, 4.0, 0.0, 1.0, 1.0], "bins": [-2.376953125, -2.3304977416992188, -2.2840423583984375, -2.2375869750976562, -2.191131591796875, -2.1446762084960938, -2.0982208251953125, -2.0517654418945312, -2.00531005859375, -1.9588546752929688, -1.9123992919921875, -1.8659439086914062, -1.819488525390625, -1.7730331420898438, -1.7265777587890625, -1.6801223754882812, -1.6336669921875, -1.5872116088867188, -1.5407562255859375, -1.4943008422851562, -1.447845458984375, -1.4013900756835938, -1.3549346923828125, -1.3084793090820312, -1.26202392578125, -1.2155685424804688, -1.1691131591796875, -1.1226577758789062, -1.076202392578125, -1.0297470092773438, -0.9832916259765625, -0.9368362426757812, -0.890380859375, -0.8439254760742188, -0.7974700927734375, -0.7510147094726562, -0.704559326171875, -0.6581039428710938, -0.6116485595703125, -0.5651931762695312, -0.51873779296875, -0.47228240966796875, -0.4258270263671875, -0.37937164306640625, -0.332916259765625, -0.28646087646484375, -0.2400054931640625, -0.19355010986328125, -0.1470947265625, -0.10063934326171875, -0.0541839599609375, -0.00772857666015625, 0.038726806640625, 0.08518218994140625, 0.1316375732421875, 0.17809295654296875, 0.22454833984375, 0.27100372314453125, 0.3174591064453125, 0.36391448974609375, 0.410369873046875, 0.45682525634765625, 0.5032806396484375, 0.5497360229492188, 0.59619140625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 7.0, 16.0, 22.0, 33.0, 48.0, 80.0, 124.0, 177.0, 281.0, 636.0, 2786.0, 36136.0, 3736828.0, 403534.0, 11165.0, 1573.0, 450.0, 191.0, 90.0, 42.0, 27.0, 13.0, 6.0, 6.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.205078125, -3.097442626953125, -2.98980712890625, -2.882171630859375, -2.7745361328125, -2.666900634765625, -2.55926513671875, -2.451629638671875, -2.343994140625, -2.236358642578125, -2.12872314453125, -2.021087646484375, -1.9134521484375, -1.805816650390625, -1.69818115234375, -1.590545654296875, -1.48291015625, -1.375274658203125, -1.26763916015625, -1.160003662109375, -1.0523681640625, -0.944732666015625, -0.83709716796875, -0.729461669921875, -0.621826171875, -0.514190673828125, -0.40655517578125, -0.298919677734375, -0.1912841796875, -0.083648681640625, 0.02398681640625, 0.131622314453125, 0.2392578125, 0.346893310546875, 0.45452880859375, 0.562164306640625, 0.6697998046875, 0.777435302734375, 0.88507080078125, 0.992706298828125, 1.100341796875, 1.207977294921875, 1.31561279296875, 1.423248291015625, 1.5308837890625, 1.638519287109375, 1.74615478515625, 1.853790283203125, 1.96142578125, 2.069061279296875, 2.17669677734375, 2.284332275390625, 2.3919677734375, 2.499603271484375, 2.60723876953125, 2.714874267578125, 2.822509765625, 2.930145263671875, 3.03778076171875, 3.145416259765625, 3.2530517578125, 3.360687255859375, 3.46832275390625, 3.575958251953125, 3.68359375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 15.0, 12.0, 12.0, 29.0, 68.0, 134.0, 346.0, 932.0, 1314.0, 693.0, 243.0, 123.0, 74.0, 36.0, 16.0, 10.0, 8.0, 3.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.39453125, -4.2976226806640625, -4.200714111328125, -4.1038055419921875, -4.00689697265625, -3.9099884033203125, -3.813079833984375, -3.7161712646484375, -3.6192626953125, -3.5223541259765625, -3.425445556640625, -3.3285369873046875, -3.23162841796875, -3.1347198486328125, -3.037811279296875, -2.9409027099609375, -2.843994140625, -2.7470855712890625, -2.650177001953125, -2.5532684326171875, -2.45635986328125, -2.3594512939453125, -2.262542724609375, -2.1656341552734375, -2.0687255859375, -1.9718170166015625, -1.874908447265625, -1.7779998779296875, -1.68109130859375, -1.5841827392578125, -1.487274169921875, -1.3903656005859375, -1.29345703125, -1.1965484619140625, -1.099639892578125, -1.0027313232421875, -0.90582275390625, -0.8089141845703125, -0.712005615234375, -0.6150970458984375, -0.5181884765625, -0.4212799072265625, -0.324371337890625, -0.2274627685546875, -0.13055419921875, -0.0336456298828125, 0.063262939453125, 0.1601715087890625, 0.257080078125, 0.3539886474609375, 0.450897216796875, 0.5478057861328125, 0.64471435546875, 0.7416229248046875, 0.838531494140625, 0.9354400634765625, 1.0323486328125, 1.1292572021484375, 1.226165771484375, 1.3230743408203125, 1.41998291015625, 1.5168914794921875, 1.613800048828125, 1.7107086181640625, 1.8076171875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 10.0, 13.0, 18.0, 49.0, 81.0, 131.0, 183.0, 198.0, 146.0, 93.0, 27.0, 15.0, 11.0, 5.0, 6.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.392019271850586, -15.848381042480469, -15.304742813110352, -14.761104583740234, -14.217467308044434, -13.673829078674316, -13.1301908493042, -12.586552619934082, -12.042915344238281, -11.499277114868164, -10.955638885498047, -10.41200065612793, -9.868363380432129, -9.324725151062012, -8.781086921691895, -8.237448692321777, -7.69381046295166, -7.150172233581543, -6.606534481048584, -6.062896251678467, -5.519258499145508, -4.975620269775391, -4.431982040405273, -3.8883440494537354, -3.3447060585021973, -2.801068067550659, -2.257430076599121, -1.713791847229004, -1.1701538562774658, -0.6265158653259277, -0.08287763595581055, 0.46076035499572754, 1.0043983459472656, 1.5480363368988037, 2.091674327850342, 2.635312557220459, 3.178950548171997, 3.722588539123535, 4.266226768493652, 4.8098649978637695, 5.3535027503967285, 5.897140979766846, 6.440778732299805, 6.984416961669922, 7.528055191040039, 8.071693420410156, 8.615331649780273, 9.158968925476074, 9.702607154846191, 10.246245384216309, 10.789883613586426, 11.333520889282227, 11.877159118652344, 12.420797348022461, 12.964435577392578, 13.508073806762695, 14.051712036132812, 14.59535026550293, 15.138988494873047, 15.682626724243164, 16.22626495361328, 16.769901275634766, 17.313541412353516, 17.857177734375, 18.400815963745117]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 7.0, 3.0, 11.0, 15.0, 15.0, 20.0, 27.0, 30.0, 47.0, 52.0, 59.0, 67.0, 70.0, 73.0, 75.0, 72.0, 87.0, 66.0, 49.0, 38.0, 39.0, 27.0, 16.0, 14.0, 6.0, 8.0, 9.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.370281219482422, -9.933174133300781, -9.496066093444824, -9.058959007263184, -8.621851921081543, -8.184743881225586, -7.747636795043945, -7.310529708862305, -6.873422145843506, -6.436314582824707, -5.999207496643066, -5.562099933624268, -5.124992370605469, -4.687885284423828, -4.250777721405029, -3.8136703968048096, -3.37656307220459, -2.93945574760437, -2.5023484230041504, -2.0652408599853516, -1.6281335353851318, -1.191026210784912, -0.7539186477661133, -0.31681132316589355, 0.12029600143432617, 0.5574033856391907, 0.9945107698440552, 1.4316182136535645, 1.8687255382537842, 2.305832862854004, 2.7429404258728027, 3.1800477504730225, 3.617155075073242, 4.054262638092041, 4.491369724273682, 4.9284772872924805, 5.365584373474121, 5.80269193649292, 6.239799499511719, 6.676906585693359, 7.114014148712158, 7.551121711730957, 7.988228797912598, 8.425336837768555, 8.862443923950195, 9.299551010131836, 9.736658096313477, 10.173766136169434, 10.610873222351074, 11.047980308532715, 11.485088348388672, 11.922195434570312, 12.359302520751953, 12.796409606933594, 13.23351764678955, 13.670624732971191, 14.107732772827148, 14.544839859008789, 14.981947898864746, 15.419054985046387, 15.856162071228027, 16.293270111083984, 16.730377197265625, 17.167484283447266, 17.604591369628906]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 7.0, 5.0, 13.0, 17.0, 31.0, 39.0, 73.0, 88.0, 123.0, 212.0, 294.0, 469.0, 761.0, 1185.0, 1915.0, 2948.0, 5029.0, 8687.0, 15109.0, 26355.0, 47191.0, 83182.0, 143071.0, 206311.0, 198500.0, 131061.0, 75399.0, 42442.0, 24242.0, 13709.0, 7799.0, 4687.0, 2801.0, 1755.0, 1121.0, 675.0, 423.0, 279.0, 181.0, 125.0, 76.0, 51.0, 46.0, 26.0, 7.0, 8.0, 8.0, 9.0, 4.0, 6.0, 1.0, 2.0], "bins": [-0.822265625, -0.7993698120117188, -0.7764739990234375, -0.7535781860351562, -0.730682373046875, -0.7077865600585938, -0.6848907470703125, -0.6619949340820312, -0.63909912109375, -0.6162033081054688, -0.5933074951171875, -0.5704116821289062, -0.547515869140625, -0.5246200561523438, -0.5017242431640625, -0.47882843017578125, -0.4559326171875, -0.43303680419921875, -0.4101409912109375, -0.38724517822265625, -0.364349365234375, -0.34145355224609375, -0.3185577392578125, -0.29566192626953125, -0.27276611328125, -0.24987030029296875, -0.2269744873046875, -0.20407867431640625, -0.181182861328125, -0.15828704833984375, -0.1353912353515625, -0.11249542236328125, -0.089599609375, -0.06670379638671875, -0.0438079833984375, -0.02091217041015625, 0.001983642578125, 0.02487945556640625, 0.0477752685546875, 0.07067108154296875, 0.09356689453125, 0.11646270751953125, 0.1393585205078125, 0.16225433349609375, 0.185150146484375, 0.20804595947265625, 0.2309417724609375, 0.25383758544921875, 0.2767333984375, 0.29962921142578125, 0.3225250244140625, 0.34542083740234375, 0.368316650390625, 0.39121246337890625, 0.4141082763671875, 0.43700408935546875, 0.45989990234375, 0.48279571533203125, 0.5056915283203125, 0.5285873413085938, 0.551483154296875, 0.5743789672851562, 0.5972747802734375, 0.6201705932617188, 0.64306640625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 5.0, 2.0, 4.0, 4.0, 6.0, 1.0, 5.0, 8.0, 8.0, 12.0, 12.0, 19.0, 16.0, 17.0, 16.0, 30.0, 26.0, 30.0, 30.0, 30.0, 51.0, 52.0, 56.0, 53.0, 32.0, 53.0, 46.0, 62.0, 36.0, 47.0, 25.0, 35.0, 21.0, 22.0, 25.0, 22.0, 13.0, 13.0, 9.0, 6.0, 9.0, 5.0, 9.0, 10.0, 4.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.6796875, -0.6604156494140625, -0.641143798828125, -0.6218719482421875, -0.60260009765625, -0.5833282470703125, -0.564056396484375, -0.5447845458984375, -0.5255126953125, -0.5062408447265625, -0.486968994140625, -0.4676971435546875, -0.44842529296875, -0.4291534423828125, -0.409881591796875, -0.3906097412109375, -0.371337890625, -0.3520660400390625, -0.332794189453125, -0.3135223388671875, -0.29425048828125, -0.2749786376953125, -0.255706787109375, -0.2364349365234375, -0.2171630859375, -0.1978912353515625, -0.178619384765625, -0.1593475341796875, -0.14007568359375, -0.1208038330078125, -0.101531982421875, -0.0822601318359375, -0.06298828125, -0.0437164306640625, -0.024444580078125, -0.0051727294921875, 0.01409912109375, 0.0333709716796875, 0.052642822265625, 0.0719146728515625, 0.0911865234375, 0.1104583740234375, 0.129730224609375, 0.1490020751953125, 0.16827392578125, 0.1875457763671875, 0.206817626953125, 0.2260894775390625, 0.245361328125, 0.2646331787109375, 0.283905029296875, 0.3031768798828125, 0.32244873046875, 0.3417205810546875, 0.360992431640625, 0.3802642822265625, 0.3995361328125, 0.4188079833984375, 0.438079833984375, 0.4573516845703125, 0.47662353515625, 0.4958953857421875, 0.515167236328125, 0.5344390869140625, 0.5537109375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 3.0, 7.0, 8.0, 9.0, 22.0, 29.0, 36.0, 55.0, 89.0, 141.0, 207.0, 311.0, 541.0, 1067.0, 2110.0, 6461.0, 35481.0, 379485.0, 569003.0, 41540.0, 7012.0, 2282.0, 1072.0, 581.0, 379.0, 196.0, 136.0, 79.0, 65.0, 51.0, 26.0, 21.0, 19.0, 6.0, 9.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.765625, -2.670379638671875, -2.57513427734375, -2.479888916015625, -2.3846435546875, -2.289398193359375, -2.19415283203125, -2.098907470703125, -2.003662109375, -1.908416748046875, -1.81317138671875, -1.717926025390625, -1.6226806640625, -1.527435302734375, -1.43218994140625, -1.336944580078125, -1.24169921875, -1.146453857421875, -1.05120849609375, -0.955963134765625, -0.8607177734375, -0.765472412109375, -0.67022705078125, -0.574981689453125, -0.479736328125, -0.384490966796875, -0.28924560546875, -0.194000244140625, -0.0987548828125, -0.003509521484375, 0.09173583984375, 0.186981201171875, 0.2822265625, 0.377471923828125, 0.47271728515625, 0.567962646484375, 0.6632080078125, 0.758453369140625, 0.85369873046875, 0.948944091796875, 1.044189453125, 1.139434814453125, 1.23468017578125, 1.329925537109375, 1.4251708984375, 1.520416259765625, 1.61566162109375, 1.710906982421875, 1.80615234375, 1.901397705078125, 1.99664306640625, 2.091888427734375, 2.1871337890625, 2.282379150390625, 2.37762451171875, 2.472869873046875, 2.568115234375, 2.663360595703125, 2.75860595703125, 2.853851318359375, 2.9490966796875, 3.044342041015625, 3.13958740234375, 3.234832763671875, 3.330078125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 11.0, 14.0, 13.0, 15.0, 7.0, 14.0, 22.0, 20.0, 28.0, 29.0, 28.0, 34.0, 39.0, 42.0, 60.0, 44.0, 56.0, 63.0, 43.0, 67.0, 57.0, 32.0, 30.0, 43.0, 32.0, 31.0, 22.0, 17.0, 22.0, 18.0, 7.0, 12.0, 9.0, 2.0, 4.0, 3.0, 3.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.673828125, -3.57470703125, -3.4755859375, -3.37646484375, -3.27734375, -3.17822265625, -3.0791015625, -2.97998046875, -2.880859375, -2.78173828125, -2.6826171875, -2.58349609375, -2.484375, -2.38525390625, -2.2861328125, -2.18701171875, -2.087890625, -1.98876953125, -1.8896484375, -1.79052734375, -1.69140625, -1.59228515625, -1.4931640625, -1.39404296875, -1.294921875, -1.19580078125, -1.0966796875, -0.99755859375, -0.8984375, -0.79931640625, -0.7001953125, -0.60107421875, -0.501953125, -0.40283203125, -0.3037109375, -0.20458984375, -0.10546875, -0.00634765625, 0.0927734375, 0.19189453125, 0.291015625, 0.39013671875, 0.4892578125, 0.58837890625, 0.6875, 0.78662109375, 0.8857421875, 0.98486328125, 1.083984375, 1.18310546875, 1.2822265625, 1.38134765625, 1.48046875, 1.57958984375, 1.6787109375, 1.77783203125, 1.876953125, 1.97607421875, 2.0751953125, 2.17431640625, 2.2734375, 2.37255859375, 2.4716796875, 2.57080078125, 2.669921875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 5.0, 5.0, 4.0, 10.0, 12.0, 17.0, 44.0, 50.0, 99.0, 188.0, 440.0, 1219.0, 4560.0, 32037.0, 883045.0, 114669.0, 8966.0, 1982.0, 619.0, 274.0, 120.0, 74.0, 38.0, 29.0, 8.0, 16.0, 8.0, 2.0, 5.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5595703125, -1.4988861083984375, -1.438201904296875, -1.3775177001953125, -1.31683349609375, -1.2561492919921875, -1.195465087890625, -1.1347808837890625, -1.0740966796875, -1.0134124755859375, -0.952728271484375, -0.8920440673828125, -0.83135986328125, -0.7706756591796875, -0.709991455078125, -0.6493072509765625, -0.588623046875, -0.5279388427734375, -0.467254638671875, -0.4065704345703125, -0.34588623046875, -0.2852020263671875, -0.224517822265625, -0.1638336181640625, -0.1031494140625, -0.0424652099609375, 0.018218994140625, 0.0789031982421875, 0.13958740234375, 0.2002716064453125, 0.260955810546875, 0.3216400146484375, 0.38232421875, 0.4430084228515625, 0.503692626953125, 0.5643768310546875, 0.62506103515625, 0.6857452392578125, 0.746429443359375, 0.8071136474609375, 0.8677978515625, 0.9284820556640625, 0.989166259765625, 1.0498504638671875, 1.11053466796875, 1.1712188720703125, 1.231903076171875, 1.2925872802734375, 1.353271484375, 1.4139556884765625, 1.474639892578125, 1.5353240966796875, 1.59600830078125, 1.6566925048828125, 1.717376708984375, 1.7780609130859375, 1.8387451171875, 1.8994293212890625, 1.960113525390625, 2.0207977294921875, 2.08148193359375, 2.1421661376953125, 2.202850341796875, 2.2635345458984375, 2.32421875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 9.0, 7.0, 11.0, 26.0, 41.0, 97.0, 170.0, 260.0, 166.0, 113.0, 47.0, 22.0, 10.0, 8.0, 5.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005397796630859375, -0.0005214959383010864, -0.0005032122135162354, -0.0004849284887313843, -0.0004666447639465332, -0.00044836103916168213, -0.00043007731437683105, -0.00041179358959198, -0.0003935098648071289, -0.00037522614002227783, -0.00035694241523742676, -0.0003386586904525757, -0.0003203749656677246, -0.00030209124088287354, -0.00028380751609802246, -0.0002655237913131714, -0.0002472400665283203, -0.00022895634174346924, -0.00021067261695861816, -0.0001923888921737671, -0.00017410516738891602, -0.00015582144260406494, -0.00013753771781921387, -0.00011925399303436279, -0.00010097026824951172, -8.268654346466064e-05, -6.440281867980957e-05, -4.6119093894958496e-05, -2.7835369110107422e-05, -9.551644325256348e-06, 8.732080459594727e-06, 2.70158052444458e-05, 4.5299530029296875e-05, 6.358325481414795e-05, 8.186697959899902e-05, 0.0001001507043838501, 0.00011843442916870117, 0.00013671815395355225, 0.00015500187873840332, 0.0001732856035232544, 0.00019156932830810547, 0.00020985305309295654, 0.00022813677787780762, 0.0002464205026626587, 0.00026470422744750977, 0.00028298795223236084, 0.0003012716770172119, 0.000319555401802063, 0.00033783912658691406, 0.00035612285137176514, 0.0003744065761566162, 0.0003926903009414673, 0.00041097402572631836, 0.00042925775051116943, 0.0004475414752960205, 0.0004658252000808716, 0.00048410892486572266, 0.0005023926496505737, 0.0005206763744354248, 0.0005389600992202759, 0.000557243824005127, 0.000575527548789978, 0.0005938112735748291, 0.0006120949983596802, 0.0006303787231445312]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 6.0, 8.0, 20.0, 27.0, 43.0, 101.0, 152.0, 380.0, 924.0, 2763.0, 13791.0, 242430.0, 755837.0, 25741.0, 4199.0, 1205.0, 496.0, 201.0, 87.0, 61.0, 23.0, 22.0, 10.0, 10.0, 8.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4609375, -1.4124755859375, -1.364013671875, -1.3155517578125, -1.26708984375, -1.2186279296875, -1.170166015625, -1.1217041015625, -1.0732421875, -1.0247802734375, -0.976318359375, -0.9278564453125, -0.87939453125, -0.8309326171875, -0.782470703125, -0.7340087890625, -0.685546875, -0.6370849609375, -0.588623046875, -0.5401611328125, -0.49169921875, -0.4432373046875, -0.394775390625, -0.3463134765625, -0.2978515625, -0.2493896484375, -0.200927734375, -0.1524658203125, -0.10400390625, -0.0555419921875, -0.007080078125, 0.0413818359375, 0.08984375, 0.1383056640625, 0.186767578125, 0.2352294921875, 0.28369140625, 0.3321533203125, 0.380615234375, 0.4290771484375, 0.4775390625, 0.5260009765625, 0.574462890625, 0.6229248046875, 0.67138671875, 0.7198486328125, 0.768310546875, 0.8167724609375, 0.865234375, 0.9136962890625, 0.962158203125, 1.0106201171875, 1.05908203125, 1.1075439453125, 1.156005859375, 1.2044677734375, 1.2529296875, 1.3013916015625, 1.349853515625, 1.3983154296875, 1.44677734375, 1.4952392578125, 1.543701171875, 1.5921630859375, 1.640625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 4.0, 9.0, 10.0, 10.0, 10.0, 15.0, 19.0, 33.0, 50.0, 56.0, 85.0, 106.0, 121.0, 115.0, 89.0, 79.0, 47.0, 47.0, 24.0, 18.0, 16.0, 6.0, 5.0, 4.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2119140625, -1.1768646240234375, -1.141815185546875, -1.1067657470703125, -1.07171630859375, -1.0366668701171875, -1.001617431640625, -0.9665679931640625, -0.9315185546875, -0.8964691162109375, -0.861419677734375, -0.8263702392578125, -0.79132080078125, -0.7562713623046875, -0.721221923828125, -0.6861724853515625, -0.651123046875, -0.6160736083984375, -0.581024169921875, -0.5459747314453125, -0.51092529296875, -0.4758758544921875, -0.440826416015625, -0.4057769775390625, -0.3707275390625, -0.3356781005859375, -0.300628662109375, -0.2655792236328125, -0.23052978515625, -0.1954803466796875, -0.160430908203125, -0.1253814697265625, -0.09033203125, -0.0552825927734375, -0.020233154296875, 0.0148162841796875, 0.04986572265625, 0.0849151611328125, 0.119964599609375, 0.1550140380859375, 0.1900634765625, 0.2251129150390625, 0.260162353515625, 0.2952117919921875, 0.33026123046875, 0.3653106689453125, 0.400360107421875, 0.4354095458984375, 0.470458984375, 0.5055084228515625, 0.540557861328125, 0.5756072998046875, 0.61065673828125, 0.6457061767578125, 0.680755615234375, 0.7158050537109375, 0.7508544921875, 0.7859039306640625, 0.820953369140625, 0.8560028076171875, 0.89105224609375, 0.9261016845703125, 0.961151123046875, 0.9962005615234375, 1.03125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 15.0, 16.0, 56.0, 146.0, 318.0, 195.0, 134.0, 53.0, 27.0, 16.0, 11.0, 5.0, 6.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.215835571289062, -29.22852897644043, -28.241222381591797, -27.253915786743164, -26.26660919189453, -25.27930450439453, -24.2919979095459, -23.304691314697266, -22.317384719848633, -21.330078125, -20.342771530151367, -19.355464935302734, -18.368160247802734, -17.38085174560547, -16.39354705810547, -15.406240463256836, -14.418933868408203, -13.43162727355957, -12.444320678710938, -11.457015037536621, -10.469708442687988, -9.482401847839355, -8.495096206665039, -7.507789611816406, -6.520483016967773, -5.533176422119141, -4.545870304107666, -3.5585639476776123, -2.5712575912475586, -1.5839509963989258, -0.5966448783874512, 0.39066123962402344, 1.3779678344726562, 2.36527419090271, 3.3525805473327637, 4.339886665344238, 5.327193260192871, 6.314499855041504, 7.3018059730529785, 8.289112091064453, 9.276418685913086, 10.263725280761719, 11.251031875610352, 12.238337516784668, 13.2256441116333, 14.212950706481934, 15.20025634765625, 16.187562942504883, 17.174869537353516, 18.16217613220215, 19.14948272705078, 20.136789321899414, 21.124095916748047, 22.111400604248047, 23.09870719909668, 24.086013793945312, 25.073320388793945, 26.060626983642578, 27.04793357849121, 28.035240173339844, 29.022544860839844, 30.00985336303711, 30.99715805053711, 31.984464645385742, 32.971771240234375]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 7.0, 2.0, 8.0, 6.0, 7.0, 11.0, 17.0, 14.0, 19.0, 21.0, 32.0, 43.0, 38.0, 48.0, 43.0, 60.0, 117.0, 92.0, 78.0, 63.0, 45.0, 40.0, 29.0, 36.0, 22.0, 27.0, 16.0, 18.0, 12.0, 10.0, 4.0, 4.0, 6.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.239904403686523, -14.637977600097656, -14.036050796508789, -13.434123992919922, -12.832198143005371, -12.230271339416504, -11.628344535827637, -11.026418685913086, -10.424491882324219, -9.822565078735352, -9.220638275146484, -8.618711471557617, -8.016785621643066, -7.414858818054199, -6.812932014465332, -6.211005687713623, -5.609078407287598, -5.0071516036987305, -4.4052252769470215, -3.8032984733581543, -3.201371908187866, -2.599445343017578, -1.997518539428711, -1.395592212677002, -0.7936654090881348, -0.1917387843132019, 0.41018784046173096, 1.0121145248413086, 1.6140410900115967, 2.2159676551818848, 2.817894458770752, 3.419820785522461, 4.021747589111328, 4.623674392700195, 5.225600719451904, 5.8275275230407715, 6.4294538497924805, 7.031380653381348, 7.633307456970215, 8.235233306884766, 8.837160110473633, 9.4390869140625, 10.041013717651367, 10.642940521240234, 11.244866371154785, 11.846793174743652, 12.44871997833252, 13.05064582824707, 13.652573585510254, 14.254500389099121, 14.856427192687988, 15.458353042602539, 16.060279846191406, 16.662206649780273, 17.26413345336914, 17.866060256958008, 18.467987060546875, 19.069913864135742, 19.67184066772461, 20.273767471313477, 20.875694274902344, 21.477619171142578, 22.079547882080078, 22.681472778320312, 23.28339958190918]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 8.0, 11.0, 11.0, 24.0, 30.0, 43.0, 80.0, 103.0, 165.0, 271.0, 575.0, 1392.0, 3839.0, 15375.0, 113253.0, 1639912.0, 2225719.0, 165510.0, 20355.0, 4649.0, 1492.0, 630.0, 310.0, 166.0, 138.0, 67.0, 46.0, 34.0, 22.0, 17.0, 6.0, 9.0, 8.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.130859375, -1.09326171875, -1.0556640625, -1.01806640625, -0.98046875, -0.94287109375, -0.9052734375, -0.86767578125, -0.830078125, -0.79248046875, -0.7548828125, -0.71728515625, -0.6796875, -0.64208984375, -0.6044921875, -0.56689453125, -0.529296875, -0.49169921875, -0.4541015625, -0.41650390625, -0.37890625, -0.34130859375, -0.3037109375, -0.26611328125, -0.228515625, -0.19091796875, -0.1533203125, -0.11572265625, -0.078125, -0.04052734375, -0.0029296875, 0.03466796875, 0.072265625, 0.10986328125, 0.1474609375, 0.18505859375, 0.22265625, 0.26025390625, 0.2978515625, 0.33544921875, 0.373046875, 0.41064453125, 0.4482421875, 0.48583984375, 0.5234375, 0.56103515625, 0.5986328125, 0.63623046875, 0.673828125, 0.71142578125, 0.7490234375, 0.78662109375, 0.82421875, 0.86181640625, 0.8994140625, 0.93701171875, 0.974609375, 1.01220703125, 1.0498046875, 1.08740234375, 1.125, 1.16259765625, 1.2001953125, 1.23779296875, 1.275390625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 5.0, 1.0, 3.0, 4.0, 10.0, 13.0, 16.0, 15.0, 31.0, 23.0, 44.0, 37.0, 29.0, 49.0, 50.0, 51.0, 56.0, 73.0, 45.0, 43.0, 59.0, 50.0, 42.0, 42.0, 51.0, 32.0, 23.0, 23.0, 26.0, 13.0, 10.0, 7.0, 7.0, 10.0, 3.0, 1.0, 2.0, 4.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.759765625, -0.7361373901367188, -0.7125091552734375, -0.6888809204101562, -0.665252685546875, -0.6416244506835938, -0.6179962158203125, -0.5943679809570312, -0.57073974609375, -0.5471115112304688, -0.5234832763671875, -0.49985504150390625, -0.476226806640625, -0.45259857177734375, -0.4289703369140625, -0.40534210205078125, -0.3817138671875, -0.35808563232421875, -0.3344573974609375, -0.31082916259765625, -0.287200927734375, -0.26357269287109375, -0.2399444580078125, -0.21631622314453125, -0.19268798828125, -0.16905975341796875, -0.1454315185546875, -0.12180328369140625, -0.098175048828125, -0.07454681396484375, -0.0509185791015625, -0.02729034423828125, -0.003662109375, 0.01996612548828125, 0.0435943603515625, 0.06722259521484375, 0.090850830078125, 0.11447906494140625, 0.1381072998046875, 0.16173553466796875, 0.18536376953125, 0.20899200439453125, 0.2326202392578125, 0.25624847412109375, 0.279876708984375, 0.30350494384765625, 0.3271331787109375, 0.35076141357421875, 0.3743896484375, 0.39801788330078125, 0.4216461181640625, 0.44527435302734375, 0.468902587890625, 0.49253082275390625, 0.5161590576171875, 0.5397872924804688, 0.56341552734375, 0.5870437622070312, 0.6106719970703125, 0.6343002319335938, 0.657928466796875, 0.6815567016601562, 0.7051849365234375, 0.7288131713867188, 0.75244140625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 8.0, 7.0, 7.0, 15.0, 25.0, 43.0, 81.0, 123.0, 203.0, 357.0, 694.0, 2163.0, 22211.0, 3815071.0, 343682.0, 6976.0, 1379.0, 501.0, 304.0, 143.0, 96.0, 61.0, 37.0, 25.0, 15.0, 17.0, 8.0, 7.0, 7.0, 6.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.603515625, -3.482574462890625, -3.36163330078125, -3.240692138671875, -3.1197509765625, -2.998809814453125, -2.87786865234375, -2.756927490234375, -2.635986328125, -2.515045166015625, -2.39410400390625, -2.273162841796875, -2.1522216796875, -2.031280517578125, -1.91033935546875, -1.789398193359375, -1.66845703125, -1.547515869140625, -1.42657470703125, -1.305633544921875, -1.1846923828125, -1.063751220703125, -0.94281005859375, -0.821868896484375, -0.700927734375, -0.579986572265625, -0.45904541015625, -0.338104248046875, -0.2171630859375, -0.096221923828125, 0.02471923828125, 0.145660400390625, 0.2666015625, 0.387542724609375, 0.50848388671875, 0.629425048828125, 0.7503662109375, 0.871307373046875, 0.99224853515625, 1.113189697265625, 1.234130859375, 1.355072021484375, 1.47601318359375, 1.596954345703125, 1.7178955078125, 1.838836669921875, 1.95977783203125, 2.080718994140625, 2.20166015625, 2.322601318359375, 2.44354248046875, 2.564483642578125, 2.6854248046875, 2.806365966796875, 2.92730712890625, 3.048248291015625, 3.169189453125, 3.290130615234375, 3.41107177734375, 3.532012939453125, 3.6529541015625, 3.773895263671875, 3.89483642578125, 4.015777587890625, 4.13671875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 14.0, 30.0, 69.0, 154.0, 534.0, 1596.0, 1183.0, 316.0, 97.0, 52.0, 20.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.95703125, -3.832794189453125, -3.70855712890625, -3.584320068359375, -3.4600830078125, -3.335845947265625, -3.21160888671875, -3.087371826171875, -2.963134765625, -2.838897705078125, -2.71466064453125, -2.590423583984375, -2.4661865234375, -2.341949462890625, -2.21771240234375, -2.093475341796875, -1.96923828125, -1.845001220703125, -1.72076416015625, -1.596527099609375, -1.4722900390625, -1.348052978515625, -1.22381591796875, -1.099578857421875, -0.975341796875, -0.851104736328125, -0.72686767578125, -0.602630615234375, -0.4783935546875, -0.354156494140625, -0.22991943359375, -0.105682373046875, 0.0185546875, 0.142791748046875, 0.26702880859375, 0.391265869140625, 0.5155029296875, 0.639739990234375, 0.76397705078125, 0.888214111328125, 1.012451171875, 1.136688232421875, 1.26092529296875, 1.385162353515625, 1.5093994140625, 1.633636474609375, 1.75787353515625, 1.882110595703125, 2.00634765625, 2.130584716796875, 2.25482177734375, 2.379058837890625, 2.5032958984375, 2.627532958984375, 2.75177001953125, 2.876007080078125, 3.000244140625, 3.124481201171875, 3.24871826171875, 3.372955322265625, 3.4971923828125, 3.621429443359375, 3.74566650390625, 3.869903564453125, 3.994140625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 8.0, 10.0, 22.0, 60.0, 186.0, 276.0, 224.0, 119.0, 53.0, 19.0, 8.0, 7.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.307045936584473, -12.55985164642334, -11.812658309936523, -11.06546401977539, -10.318269729614258, -9.571075439453125, -8.823881149291992, -8.076687812805176, -7.329493522644043, -6.58229923248291, -5.8351054191589355, -5.087911605834961, -4.340717315673828, -3.5935232639312744, -2.8463292121887207, -2.099135398864746, -1.3519411087036133, -0.6047470569610596, 0.14244699478149414, 0.8896410465240479, 1.6368350982666016, 2.3840291500091553, 3.131223201751709, 3.8784170150756836, 4.625611305236816, 5.372805595397949, 6.119999408721924, 6.867193222045898, 7.614387512207031, 8.361581802368164, 9.108776092529297, 9.855969429016113, 10.603164672851562, 11.350358963012695, 12.097553253173828, 12.844746589660645, 13.591940879821777, 14.33913516998291, 15.086328506469727, 15.83352279663086, 16.580717086791992, 17.327911376953125, 18.075105667114258, 18.82229995727539, 19.56949234008789, 20.316686630249023, 21.063880920410156, 21.81107521057129, 22.558269500732422, 23.305463790893555, 24.052658081054688, 24.79985237121582, 25.547046661376953, 26.294239044189453, 27.041433334350586, 27.78862762451172, 28.53582191467285, 29.283016204833984, 30.030210494995117, 30.77740478515625, 31.52459716796875, 32.271793365478516, 33.018985748291016, 33.76618194580078, 34.51337432861328]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 4.0, 6.0, 5.0, 11.0, 9.0, 6.0, 15.0, 17.0, 24.0, 18.0, 29.0, 28.0, 34.0, 54.0, 48.0, 57.0, 43.0, 49.0, 38.0, 49.0, 60.0, 51.0, 53.0, 58.0, 28.0, 34.0, 41.0, 32.0, 22.0, 23.0, 12.0, 12.0, 9.0, 9.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-10.2860746383667, -10.0123872756958, -9.738698959350586, -9.465011596679688, -9.191324234008789, -8.91763687133789, -8.643948554992676, -8.370261192321777, -8.096573829650879, -7.822885990142822, -7.549198627471924, -7.275510787963867, -7.001823425292969, -6.728135585784912, -6.4544477462768555, -6.180760383605957, -5.9070725440979, -5.633384704589844, -5.359697341918945, -5.086009502410889, -4.81232213973999, -4.538634300231934, -4.264946937561035, -3.9912590980529785, -3.717571496963501, -3.4438838958740234, -3.170196294784546, -2.8965086936950684, -2.6228208541870117, -2.3491334915161133, -2.0754456520080566, -1.801758050918579, -1.5280704498291016, -1.254382848739624, -0.9806951880455017, -0.7070075273513794, -0.43331992626190186, -0.15963232517242432, 0.11405539512634277, 0.3877429962158203, 0.6614305973052979, 0.9351181983947754, 1.208805799484253, 1.48249351978302, 1.7561811208724976, 2.0298686027526855, 2.303556442260742, 2.5772440433502197, 2.8509316444396973, 3.124619245529175, 3.3983068466186523, 3.671994686126709, 3.9456820487976074, 4.219369888305664, 4.4930572509765625, 4.766745090484619, 5.040432929992676, 5.314120769500732, 5.587808132171631, 5.8614959716796875, 6.135183334350586, 6.408871173858643, 6.682559013366699, 6.956246376037598, 7.229933738708496]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 8.0, 8.0, 20.0, 20.0, 30.0, 40.0, 77.0, 130.0, 182.0, 297.0, 473.0, 794.0, 1454.0, 2482.0, 4490.0, 8647.0, 16863.0, 34537.0, 68646.0, 129081.0, 203231.0, 224588.0, 163753.0, 92608.0, 47174.0, 23429.0, 11892.0, 5846.0, 3316.0, 1769.0, 1007.0, 636.0, 372.0, 248.0, 137.0, 85.0, 64.0, 44.0, 26.0, 14.0, 10.0, 12.0, 4.0, 6.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7451171875, -0.7204666137695312, -0.6958160400390625, -0.6711654663085938, -0.646514892578125, -0.6218643188476562, -0.5972137451171875, -0.5725631713867188, -0.54791259765625, -0.5232620239257812, -0.4986114501953125, -0.47396087646484375, -0.449310302734375, -0.42465972900390625, -0.4000091552734375, -0.37535858154296875, -0.3507080078125, -0.32605743408203125, -0.3014068603515625, -0.27675628662109375, -0.252105712890625, -0.22745513916015625, -0.2028045654296875, -0.17815399169921875, -0.15350341796875, -0.12885284423828125, -0.1042022705078125, -0.07955169677734375, -0.054901123046875, -0.03025054931640625, -0.0055999755859375, 0.01905059814453125, 0.043701171875, 0.06835174560546875, 0.0930023193359375, 0.11765289306640625, 0.142303466796875, 0.16695404052734375, 0.1916046142578125, 0.21625518798828125, 0.24090576171875, 0.26555633544921875, 0.2902069091796875, 0.31485748291015625, 0.339508056640625, 0.36415863037109375, 0.3888092041015625, 0.41345977783203125, 0.4381103515625, 0.46276092529296875, 0.4874114990234375, 0.5120620727539062, 0.536712646484375, 0.5613632202148438, 0.5860137939453125, 0.6106643676757812, 0.63531494140625, 0.6599655151367188, 0.6846160888671875, 0.7092666625976562, 0.733917236328125, 0.7585678100585938, 0.7832183837890625, 0.8078689575195312, 0.83251953125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 10.0, 13.0, 11.0, 18.0, 10.0, 18.0, 21.0, 33.0, 27.0, 33.0, 29.0, 41.0, 38.0, 45.0, 35.0, 47.0, 48.0, 41.0, 58.0, 43.0, 35.0, 38.0, 42.0, 38.0, 34.0, 38.0, 30.0, 23.0, 19.0, 15.0, 23.0, 8.0, 10.0, 11.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.71337890625, -0.691925048828125, -0.67047119140625, -0.649017333984375, -0.6275634765625, -0.606109619140625, -0.58465576171875, -0.563201904296875, -0.541748046875, -0.520294189453125, -0.49884033203125, -0.477386474609375, -0.4559326171875, -0.434478759765625, -0.41302490234375, -0.391571044921875, -0.3701171875, -0.348663330078125, -0.32720947265625, -0.305755615234375, -0.2843017578125, -0.262847900390625, -0.24139404296875, -0.219940185546875, -0.198486328125, -0.177032470703125, -0.15557861328125, -0.134124755859375, -0.1126708984375, -0.091217041015625, -0.06976318359375, -0.048309326171875, -0.02685546875, -0.005401611328125, 0.01605224609375, 0.037506103515625, 0.0589599609375, 0.080413818359375, 0.10186767578125, 0.123321533203125, 0.144775390625, 0.166229248046875, 0.18768310546875, 0.209136962890625, 0.2305908203125, 0.252044677734375, 0.27349853515625, 0.294952392578125, 0.31640625, 0.337860107421875, 0.35931396484375, 0.380767822265625, 0.4022216796875, 0.423675537109375, 0.44512939453125, 0.466583251953125, 0.488037109375, 0.509490966796875, 0.53094482421875, 0.552398681640625, 0.5738525390625, 0.595306396484375, 0.61676025390625, 0.638214111328125, 0.65966796875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 9.0, 11.0, 13.0, 31.0, 36.0, 46.0, 103.0, 189.0, 401.0, 1028.0, 3925.0, 24854.0, 263316.0, 685095.0, 58954.0, 7819.0, 1643.0, 532.0, 240.0, 121.0, 74.0, 44.0, 22.0, 13.0, 12.0, 13.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.861328125, -3.7652587890625, -3.669189453125, -3.5731201171875, -3.47705078125, -3.3809814453125, -3.284912109375, -3.1888427734375, -3.0927734375, -2.9967041015625, -2.900634765625, -2.8045654296875, -2.70849609375, -2.6124267578125, -2.516357421875, -2.4202880859375, -2.32421875, -2.2281494140625, -2.132080078125, -2.0360107421875, -1.93994140625, -1.8438720703125, -1.747802734375, -1.6517333984375, -1.5556640625, -1.4595947265625, -1.363525390625, -1.2674560546875, -1.17138671875, -1.0753173828125, -0.979248046875, -0.8831787109375, -0.787109375, -0.6910400390625, -0.594970703125, -0.4989013671875, -0.40283203125, -0.3067626953125, -0.210693359375, -0.1146240234375, -0.0185546875, 0.0775146484375, 0.173583984375, 0.2696533203125, 0.36572265625, 0.4617919921875, 0.557861328125, 0.6539306640625, 0.75, 0.8460693359375, 0.942138671875, 1.0382080078125, 1.13427734375, 1.2303466796875, 1.326416015625, 1.4224853515625, 1.5185546875, 1.6146240234375, 1.710693359375, 1.8067626953125, 1.90283203125, 1.9989013671875, 2.094970703125, 2.1910400390625, 2.287109375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 5.0, 5.0, 4.0, 8.0, 5.0, 16.0, 14.0, 19.0, 13.0, 24.0, 23.0, 28.0, 36.0, 38.0, 36.0, 26.0, 53.0, 42.0, 54.0, 34.0, 59.0, 63.0, 34.0, 48.0, 35.0, 35.0, 40.0, 32.0, 25.0, 23.0, 29.0, 18.0, 16.0, 7.0, 4.0, 6.0, 5.0, 8.0, 3.0, 5.0, 6.0, 1.0, 6.0, 2.0, 2.0, 1.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.318359375, -2.241180419921875, -2.16400146484375, -2.086822509765625, -2.0096435546875, -1.932464599609375, -1.85528564453125, -1.778106689453125, -1.700927734375, -1.623748779296875, -1.54656982421875, -1.469390869140625, -1.3922119140625, -1.315032958984375, -1.23785400390625, -1.160675048828125, -1.08349609375, -1.006317138671875, -0.92913818359375, -0.851959228515625, -0.7747802734375, -0.697601318359375, -0.62042236328125, -0.543243408203125, -0.466064453125, -0.388885498046875, -0.31170654296875, -0.234527587890625, -0.1573486328125, -0.080169677734375, -0.00299072265625, 0.074188232421875, 0.1513671875, 0.228546142578125, 0.30572509765625, 0.382904052734375, 0.4600830078125, 0.537261962890625, 0.61444091796875, 0.691619873046875, 0.768798828125, 0.845977783203125, 0.92315673828125, 1.000335693359375, 1.0775146484375, 1.154693603515625, 1.23187255859375, 1.309051513671875, 1.38623046875, 1.463409423828125, 1.54058837890625, 1.617767333984375, 1.6949462890625, 1.772125244140625, 1.84930419921875, 1.926483154296875, 2.003662109375, 2.080841064453125, 2.15802001953125, 2.235198974609375, 2.3123779296875, 2.389556884765625, 2.46673583984375, 2.543914794921875, 2.62109375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 0.0, 1.0, 2.0, 3.0, 6.0, 6.0, 10.0, 20.0, 17.0, 31.0, 57.0, 99.0, 176.0, 290.0, 518.0, 1058.0, 2246.0, 5096.0, 13239.0, 37278.0, 126909.0, 552656.0, 214808.0, 60576.0, 19974.0, 7337.0, 3089.0, 1434.0, 693.0, 386.0, 217.0, 109.0, 76.0, 40.0, 39.0, 16.0, 19.0, 6.0, 6.0, 2.0, 2.0, 2.0, 1.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.4990234375, -0.4822235107421875, -0.465423583984375, -0.4486236572265625, -0.43182373046875, -0.4150238037109375, -0.398223876953125, -0.3814239501953125, -0.3646240234375, -0.3478240966796875, -0.331024169921875, -0.3142242431640625, -0.29742431640625, -0.2806243896484375, -0.263824462890625, -0.2470245361328125, -0.230224609375, -0.2134246826171875, -0.196624755859375, -0.1798248291015625, -0.16302490234375, -0.1462249755859375, -0.129425048828125, -0.1126251220703125, -0.0958251953125, -0.0790252685546875, -0.062225341796875, -0.0454254150390625, -0.02862548828125, -0.0118255615234375, 0.004974365234375, 0.0217742919921875, 0.03857421875, 0.0553741455078125, 0.072174072265625, 0.0889739990234375, 0.10577392578125, 0.1225738525390625, 0.139373779296875, 0.1561737060546875, 0.1729736328125, 0.1897735595703125, 0.206573486328125, 0.2233734130859375, 0.24017333984375, 0.2569732666015625, 0.273773193359375, 0.2905731201171875, 0.307373046875, 0.3241729736328125, 0.340972900390625, 0.3577728271484375, 0.37457275390625, 0.3913726806640625, 0.408172607421875, 0.4249725341796875, 0.4417724609375, 0.4585723876953125, 0.475372314453125, 0.4921722412109375, 0.50897216796875, 0.5257720947265625, 0.542572021484375, 0.5593719482421875, 0.576171875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 11.0, 17.0, 19.0, 39.0, 56.0, 109.0, 147.0, 154.0, 145.0, 101.0, 64.0, 43.0, 30.0, 16.0, 16.0, 5.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003688335418701172, -0.0003575049340724945, -0.0003461763262748718, -0.00033484771847724915, -0.00032351911067962646, -0.0003121905028820038, -0.0003008618950843811, -0.0002895332872867584, -0.00027820467948913574, -0.00026687607169151306, -0.0002555474638938904, -0.0002442188560962677, -0.00023289024829864502, -0.00022156164050102234, -0.00021023303270339966, -0.00019890442490577698, -0.0001875758171081543, -0.00017624720931053162, -0.00016491860151290894, -0.00015358999371528625, -0.00014226138591766357, -0.0001309327781200409, -0.00011960417032241821, -0.00010827556252479553, -9.694695472717285e-05, -8.561834692955017e-05, -7.428973913192749e-05, -6.296113133430481e-05, -5.163252353668213e-05, -4.030391573905945e-05, -2.8975307941436768e-05, -1.7646700143814087e-05, -6.318092346191406e-06, 5.010515451431274e-06, 1.6339123249053955e-05, 2.7667731046676636e-05, 3.8996338844299316e-05, 5.0324946641922e-05, 6.165355443954468e-05, 7.298216223716736e-05, 8.431077003479004e-05, 9.563937783241272e-05, 0.0001069679856300354, 0.00011829659342765808, 0.00012962520122528076, 0.00014095380902290344, 0.00015228241682052612, 0.0001636110246181488, 0.00017493963241577148, 0.00018626824021339417, 0.00019759684801101685, 0.00020892545580863953, 0.0002202540636062622, 0.0002315826714038849, 0.00024291127920150757, 0.00025423988699913025, 0.00026556849479675293, 0.0002768971025943756, 0.0002882257103919983, 0.00029955431818962097, 0.00031088292598724365, 0.00032221153378486633, 0.000333540141582489, 0.0003448687493801117, 0.0003561973571777344]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 8.0, 9.0, 12.0, 25.0, 33.0, 74.0, 137.0, 292.0, 722.0, 2157.0, 8946.0, 52022.0, 392390.0, 524518.0, 54376.0, 9289.0, 2265.0, 688.0, 284.0, 138.0, 57.0, 42.0, 15.0, 16.0, 16.0, 5.0, 5.0, 2.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0283203125, -1.0019607543945312, -0.9756011962890625, -0.9492416381835938, -0.922882080078125, -0.8965225219726562, -0.8701629638671875, -0.8438034057617188, -0.81744384765625, -0.7910842895507812, -0.7647247314453125, -0.7383651733398438, -0.712005615234375, -0.6856460571289062, -0.6592864990234375, -0.6329269409179688, -0.6065673828125, -0.5802078247070312, -0.5538482666015625, -0.5274887084960938, -0.501129150390625, -0.47476959228515625, -0.4484100341796875, -0.42205047607421875, -0.39569091796875, -0.36933135986328125, -0.3429718017578125, -0.31661224365234375, -0.290252685546875, -0.26389312744140625, -0.2375335693359375, -0.21117401123046875, -0.184814453125, -0.15845489501953125, -0.1320953369140625, -0.10573577880859375, -0.079376220703125, -0.05301666259765625, -0.0266571044921875, -0.00029754638671875, 0.02606201171875, 0.05242156982421875, 0.0787811279296875, 0.10514068603515625, 0.131500244140625, 0.15785980224609375, 0.1842193603515625, 0.21057891845703125, 0.2369384765625, 0.26329803466796875, 0.2896575927734375, 0.31601715087890625, 0.342376708984375, 0.36873626708984375, 0.3950958251953125, 0.42145538330078125, 0.44781494140625, 0.47417449951171875, 0.5005340576171875, 0.5268936157226562, 0.553253173828125, 0.5796127319335938, 0.6059722900390625, 0.6323318481445312, 0.65869140625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 10.0, 6.0, 13.0, 17.0, 18.0, 23.0, 33.0, 43.0, 41.0, 73.0, 75.0, 89.0, 93.0, 71.0, 74.0, 69.0, 53.0, 46.0, 39.0, 33.0, 22.0, 18.0, 15.0, 15.0, 4.0, 4.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.578125, -0.5546722412109375, -0.531219482421875, -0.5077667236328125, -0.48431396484375, -0.4608612060546875, -0.437408447265625, -0.4139556884765625, -0.3905029296875, -0.3670501708984375, -0.343597412109375, -0.3201446533203125, -0.29669189453125, -0.2732391357421875, -0.249786376953125, -0.2263336181640625, -0.202880859375, -0.1794281005859375, -0.155975341796875, -0.1325225830078125, -0.10906982421875, -0.0856170654296875, -0.062164306640625, -0.0387115478515625, -0.0152587890625, 0.0081939697265625, 0.031646728515625, 0.0550994873046875, 0.07855224609375, 0.1020050048828125, 0.125457763671875, 0.1489105224609375, 0.17236328125, 0.1958160400390625, 0.219268798828125, 0.2427215576171875, 0.26617431640625, 0.2896270751953125, 0.313079833984375, 0.3365325927734375, 0.3599853515625, 0.3834381103515625, 0.406890869140625, 0.4303436279296875, 0.45379638671875, 0.4772491455078125, 0.500701904296875, 0.5241546630859375, 0.547607421875, 0.5710601806640625, 0.594512939453125, 0.6179656982421875, 0.64141845703125, 0.6648712158203125, 0.688323974609375, 0.7117767333984375, 0.7352294921875, 0.7586822509765625, 0.782135009765625, 0.8055877685546875, 0.82904052734375, 0.8524932861328125, 0.875946044921875, 0.8993988037109375, 0.9228515625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 4.0, 14.0, 21.0, 40.0, 99.0, 166.0, 329.0, 192.0, 81.0, 29.0, 14.0, 6.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.855045318603516, -34.05562210083008, -33.256202697753906, -32.45677947998047, -31.657358169555664, -30.85793685913086, -30.058513641357422, -29.259092330932617, -28.459671020507812, -27.660249710083008, -26.860828399658203, -26.061405181884766, -25.26198387145996, -24.462562561035156, -23.66313934326172, -22.863718032836914, -22.06429672241211, -21.264875411987305, -20.4654541015625, -19.666030883789062, -18.866609573364258, -18.067188262939453, -17.267765045166016, -16.46834373474121, -15.668922424316406, -14.869501113891602, -14.07007884979248, -13.27065658569336, -12.471235275268555, -11.67181396484375, -10.872391700744629, -10.072969436645508, -9.273548126220703, -8.474126815795898, -7.674704551696777, -6.8752827644348145, -6.075860977172852, -5.276439189910889, -4.477017402648926, -3.677595615386963, -2.878173828125, -2.078752040863037, -1.2793302536010742, -0.47990846633911133, 0.31951332092285156, 1.1189351081848145, 1.9183568954467773, 2.7177786827087402, 3.517200469970703, 4.316622257232666, 5.116044044494629, 5.915465831756592, 6.714887619018555, 7.514309406280518, 8.31373119354248, 9.113153457641602, 9.912574768066406, 10.711996078491211, 11.511418342590332, 12.310840606689453, 13.110261917114258, 13.909683227539062, 14.709105491638184, 15.508527755737305, 16.30794906616211]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 9.0, 7.0, 6.0, 9.0, 12.0, 7.0, 11.0, 18.0, 17.0, 15.0, 29.0, 33.0, 33.0, 24.0, 33.0, 38.0, 44.0, 44.0, 77.0, 73.0, 75.0, 50.0, 39.0, 44.0, 30.0, 22.0, 31.0, 27.0, 17.0, 22.0, 14.0, 16.0, 11.0, 10.0, 15.0, 7.0, 10.0, 6.0, 3.0, 4.0, 2.0, 0.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-11.15542221069336, -10.822574615478516, -10.489727020263672, -10.156880378723145, -9.8240327835083, -9.491185188293457, -9.158337593078613, -8.825490951538086, -8.492643356323242, -8.159795761108398, -7.826948642730713, -7.494101047515869, -7.161253929138184, -6.82840633392334, -6.495558738708496, -6.1627116203308105, -5.829864025115967, -5.497016429901123, -5.1641693115234375, -4.831321716308594, -4.498474597930908, -4.1656270027160645, -3.8327796459198, -3.499932289123535, -3.1670849323272705, -2.834237575531006, -2.501390218734741, -2.1685428619384766, -1.8356953859329224, -1.5028480291366577, -1.1700005531311035, -0.8371531963348389, -0.5043058395385742, -0.17145845293998718, 0.16138893365859985, 0.4942363500595093, 0.8270837068557739, 1.1599310636520386, 1.4927785396575928, 1.8256258964538574, 2.158473253250122, 2.4913206100463867, 2.8241679668426514, 3.157015323638916, 3.4898629188537598, 3.8227100372314453, 4.155557632446289, 4.488405227661133, 4.821252346038818, 5.154099941253662, 5.486947059631348, 5.819794654846191, 6.152641773223877, 6.485489368438721, 6.818336486816406, 7.15118408203125, 7.484031677246094, 7.8168792724609375, 8.149726867675781, 8.482573509216309, 8.815421104431152, 9.148268699645996, 9.48111629486084, 9.813962936401367, 10.146810531616211]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 19.0, 19.0, 22.0, 33.0, 68.0, 99.0, 158.0, 250.0, 389.0, 620.0, 1185.0, 2440.0, 5490.0, 15645.0, 57658.0, 274725.0, 1244048.0, 1866085.0, 566245.0, 115034.0, 27873.0, 8877.0, 3519.0, 1668.0, 897.0, 459.0, 284.0, 172.0, 88.0, 68.0, 47.0, 24.0, 22.0, 15.0, 6.0, 16.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.75439453125, -0.7329788208007812, -0.7115631103515625, -0.6901473999023438, -0.668731689453125, -0.6473159790039062, -0.6259002685546875, -0.6044845581054688, -0.58306884765625, -0.5616531372070312, -0.5402374267578125, -0.5188217163085938, -0.497406005859375, -0.47599029541015625, -0.4545745849609375, -0.43315887451171875, -0.4117431640625, -0.39032745361328125, -0.3689117431640625, -0.34749603271484375, -0.326080322265625, -0.30466461181640625, -0.2832489013671875, -0.26183319091796875, -0.24041748046875, -0.21900177001953125, -0.1975860595703125, -0.17617034912109375, -0.154754638671875, -0.13333892822265625, -0.1119232177734375, -0.09050750732421875, -0.069091796875, -0.04767608642578125, -0.0262603759765625, -0.00484466552734375, 0.016571044921875, 0.03798675537109375, 0.0594024658203125, 0.08081817626953125, 0.10223388671875, 0.12364959716796875, 0.1450653076171875, 0.16648101806640625, 0.187896728515625, 0.20931243896484375, 0.2307281494140625, 0.25214385986328125, 0.2735595703125, 0.29497528076171875, 0.3163909912109375, 0.33780670166015625, 0.359222412109375, 0.38063812255859375, 0.4020538330078125, 0.42346954345703125, 0.44488525390625, 0.46630096435546875, 0.4877166748046875, 0.5091323852539062, 0.530548095703125, 0.5519638061523438, 0.5733795166015625, 0.5947952270507812, 0.6162109375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 1.0, 4.0, 3.0, 1.0, 9.0, 6.0, 14.0, 10.0, 9.0, 23.0, 23.0, 22.0, 21.0, 35.0, 29.0, 48.0, 28.0, 42.0, 43.0, 47.0, 55.0, 37.0, 49.0, 55.0, 45.0, 35.0, 40.0, 48.0, 31.0, 31.0, 32.0, 18.0, 20.0, 21.0, 11.0, 14.0, 8.0, 7.0, 8.0, 7.0, 6.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67919921875, -0.6595535278320312, -0.6399078369140625, -0.6202621459960938, -0.600616455078125, -0.5809707641601562, -0.5613250732421875, -0.5416793823242188, -0.52203369140625, -0.5023880004882812, -0.4827423095703125, -0.46309661865234375, -0.443450927734375, -0.42380523681640625, -0.4041595458984375, -0.38451385498046875, -0.3648681640625, -0.34522247314453125, -0.3255767822265625, -0.30593109130859375, -0.286285400390625, -0.26663970947265625, -0.2469940185546875, -0.22734832763671875, -0.20770263671875, -0.18805694580078125, -0.1684112548828125, -0.14876556396484375, -0.129119873046875, -0.10947418212890625, -0.0898284912109375, -0.07018280029296875, -0.050537109375, -0.03089141845703125, -0.0112457275390625, 0.00839996337890625, 0.028045654296875, 0.04769134521484375, 0.0673370361328125, 0.08698272705078125, 0.10662841796875, 0.12627410888671875, 0.1459197998046875, 0.16556549072265625, 0.185211181640625, 0.20485687255859375, 0.2245025634765625, 0.24414825439453125, 0.2637939453125, 0.28343963623046875, 0.3030853271484375, 0.32273101806640625, 0.342376708984375, 0.36202239990234375, 0.3816680908203125, 0.40131378173828125, 0.42095947265625, 0.44060516357421875, 0.4602508544921875, 0.47989654541015625, 0.499542236328125, 0.5191879272460938, 0.5388336181640625, 0.5584793090820312, 0.578125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 9.0, 15.0, 16.0, 20.0, 46.0, 73.0, 117.0, 220.0, 516.0, 1163.0, 3633.0, 26255.0, 1113403.0, 2991733.0, 49127.0, 5288.0, 1451.0, 578.0, 288.0, 159.0, 74.0, 36.0, 15.0, 17.0, 5.0, 9.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.240234375, -2.168243408203125, -2.09625244140625, -2.024261474609375, -1.9522705078125, -1.880279541015625, -1.80828857421875, -1.736297607421875, -1.664306640625, -1.592315673828125, -1.52032470703125, -1.448333740234375, -1.3763427734375, -1.304351806640625, -1.23236083984375, -1.160369873046875, -1.08837890625, -1.016387939453125, -0.94439697265625, -0.872406005859375, -0.8004150390625, -0.728424072265625, -0.65643310546875, -0.584442138671875, -0.512451171875, -0.440460205078125, -0.36846923828125, -0.296478271484375, -0.2244873046875, -0.152496337890625, -0.08050537109375, -0.008514404296875, 0.0634765625, 0.135467529296875, 0.20745849609375, 0.279449462890625, 0.3514404296875, 0.423431396484375, 0.49542236328125, 0.567413330078125, 0.639404296875, 0.711395263671875, 0.78338623046875, 0.855377197265625, 0.9273681640625, 0.999359130859375, 1.07135009765625, 1.143341064453125, 1.21533203125, 1.287322998046875, 1.35931396484375, 1.431304931640625, 1.5032958984375, 1.575286865234375, 1.64727783203125, 1.719268798828125, 1.791259765625, 1.863250732421875, 1.93524169921875, 2.007232666015625, 2.0792236328125, 2.151214599609375, 2.22320556640625, 2.295196533203125, 2.3671875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 5.0, 14.0, 11.0, 20.0, 31.0, 44.0, 60.0, 118.0, 217.0, 355.0, 607.0, 800.0, 698.0, 455.0, 250.0, 134.0, 83.0, 48.0, 42.0, 32.0, 15.0, 6.0, 9.0, 8.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.802734375, -1.7476654052734375, -1.692596435546875, -1.6375274658203125, -1.58245849609375, -1.5273895263671875, -1.472320556640625, -1.4172515869140625, -1.3621826171875, -1.3071136474609375, -1.252044677734375, -1.1969757080078125, -1.14190673828125, -1.0868377685546875, -1.031768798828125, -0.9766998291015625, -0.921630859375, -0.8665618896484375, -0.811492919921875, -0.7564239501953125, -0.70135498046875, -0.6462860107421875, -0.591217041015625, -0.5361480712890625, -0.4810791015625, -0.4260101318359375, -0.370941162109375, -0.3158721923828125, -0.26080322265625, -0.2057342529296875, -0.150665283203125, -0.0955963134765625, -0.04052734375, 0.0145416259765625, 0.069610595703125, 0.1246795654296875, 0.17974853515625, 0.2348175048828125, 0.289886474609375, 0.3449554443359375, 0.4000244140625, 0.4550933837890625, 0.510162353515625, 0.5652313232421875, 0.62030029296875, 0.6753692626953125, 0.730438232421875, 0.7855072021484375, 0.840576171875, 0.8956451416015625, 0.950714111328125, 1.0057830810546875, 1.06085205078125, 1.1159210205078125, 1.170989990234375, 1.2260589599609375, 1.2811279296875, 1.3361968994140625, 1.391265869140625, 1.4463348388671875, 1.50140380859375, 1.5564727783203125, 1.611541748046875, 1.6666107177734375, 1.7216796875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 7.0, 4.0, 8.0, 19.0, 26.0, 48.0, 79.0, 151.0, 143.0, 159.0, 133.0, 108.0, 61.0, 25.0, 13.0, 6.0, 5.0, 3.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.149273872375488, -7.768694877624512, -7.388116359710693, -7.007537364959717, -6.626958847045898, -6.246379852294922, -5.865800857543945, -5.485221862792969, -5.10464334487915, -4.724064350128174, -4.3434858322143555, -3.962906837463379, -3.5823280811309814, -3.201749324798584, -2.8211703300476074, -2.44059157371521, -2.0600128173828125, -1.679434061050415, -1.298855185508728, -0.918276309967041, -0.5376975536346436, -0.1571187973022461, 0.22346019744873047, 0.6040389537811279, 0.9846177101135254, 1.3651964664459229, 1.7457753419876099, 2.126354217529297, 2.5069329738616943, 2.887511730194092, 3.2680907249450684, 3.648669481277466, 4.02924919128418, 4.409828186035156, 4.790406703948975, 5.170985698699951, 5.5515642166137695, 5.932143211364746, 6.312722206115723, 6.693301200866699, 7.073879718780518, 7.454458713531494, 7.8350372314453125, 8.215616226196289, 8.596195220947266, 8.976774215698242, 9.357353210449219, 9.737931251525879, 10.118510246276855, 10.499089241027832, 10.879668235778809, 11.260246276855469, 11.640825271606445, 12.021404266357422, 12.401983261108398, 12.782562255859375, 13.163141250610352, 13.543720245361328, 13.924299240112305, 14.304878234863281, 14.685456275939941, 15.066035270690918, 15.446614265441895, 15.827193260192871, 16.20777130126953]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 7.0, 7.0, 15.0, 17.0, 16.0, 21.0, 27.0, 32.0, 30.0, 49.0, 50.0, 38.0, 56.0, 73.0, 60.0, 72.0, 53.0, 59.0, 49.0, 46.0, 32.0, 32.0, 33.0, 30.0, 17.0, 16.0, 19.0, 11.0, 7.0, 12.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.081058502197266, -6.836199760437012, -6.591341495513916, -6.346482753753662, -6.101624488830566, -5.8567657470703125, -5.611907005310059, -5.367048740386963, -5.122190475463867, -4.877331733703613, -4.632473468780518, -4.387614727020264, -4.142756462097168, -3.897897720336914, -3.6530392169952393, -3.4081807136535645, -3.1633219718933105, -2.9184634685516357, -2.673604965209961, -2.428746223449707, -2.1838879585266113, -1.939029335975647, -1.6941707134246826, -1.4493122100830078, -1.204453706741333, -0.9595952033996582, -0.7147366404533386, -0.46987807750701904, -0.22501957416534424, 0.019838929176330566, 0.2646975517272949, 0.5095560550689697, 0.7544145584106445, 0.9992730617523193, 1.2441315650939941, 1.4889901876449585, 1.7338486909866333, 1.978707194328308, 2.2235658168792725, 2.4684243202209473, 2.713282823562622, 2.958141326904297, 3.2029998302459717, 3.4478583335876465, 3.6927170753479004, 3.937575340270996, 4.18243408203125, 4.427292823791504, 4.6721510887146, 4.9170098304748535, 5.161868095397949, 5.406726837158203, 5.651585102081299, 5.896443843841553, 6.141302108764648, 6.386160850524902, 6.631019592285156, 6.87587833404541, 7.120736598968506, 7.36559534072876, 7.6104536056518555, 7.855312347412109, 8.100171089172363, 8.345029830932617, 8.589887619018555]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 3.0, 5.0, 3.0, 5.0, 10.0, 13.0, 22.0, 16.0, 30.0, 57.0, 62.0, 113.0, 152.0, 266.0, 410.0, 635.0, 1103.0, 1959.0, 3326.0, 6205.0, 11379.0, 21732.0, 41598.0, 79800.0, 146213.0, 223435.0, 215456.0, 137174.0, 74127.0, 38934.0, 20326.0, 10693.0, 5625.0, 3067.0, 1754.0, 1114.0, 629.0, 376.0, 255.0, 151.0, 106.0, 67.0, 45.0, 36.0, 22.0, 13.0, 15.0, 11.0, 5.0, 4.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.7548828125, -0.7326431274414062, -0.7104034423828125, -0.6881637573242188, -0.665924072265625, -0.6436843872070312, -0.6214447021484375, -0.5992050170898438, -0.57696533203125, -0.5547256469726562, -0.5324859619140625, -0.5102462768554688, -0.488006591796875, -0.46576690673828125, -0.4435272216796875, -0.42128753662109375, -0.3990478515625, -0.37680816650390625, -0.3545684814453125, -0.33232879638671875, -0.310089111328125, -0.28784942626953125, -0.2656097412109375, -0.24337005615234375, -0.22113037109375, -0.19889068603515625, -0.1766510009765625, -0.15441131591796875, -0.132171630859375, -0.10993194580078125, -0.0876922607421875, -0.06545257568359375, -0.043212890625, -0.02097320556640625, 0.0012664794921875, 0.02350616455078125, 0.045745849609375, 0.06798553466796875, 0.0902252197265625, 0.11246490478515625, 0.13470458984375, 0.15694427490234375, 0.1791839599609375, 0.20142364501953125, 0.223663330078125, 0.24590301513671875, 0.2681427001953125, 0.29038238525390625, 0.3126220703125, 0.33486175537109375, 0.3571014404296875, 0.37934112548828125, 0.401580810546875, 0.42382049560546875, 0.4460601806640625, 0.46829986572265625, 0.49053955078125, 0.5127792358398438, 0.5350189208984375, 0.5572586059570312, 0.579498291015625, 0.6017379760742188, 0.6239776611328125, 0.6462173461914062, 0.66845703125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 8.0, 7.0, 7.0, 3.0, 6.0, 14.0, 18.0, 22.0, 20.0, 24.0, 36.0, 29.0, 44.0, 53.0, 48.0, 68.0, 48.0, 61.0, 57.0, 51.0, 60.0, 48.0, 36.0, 55.0, 34.0, 43.0, 17.0, 15.0, 25.0, 13.0, 11.0, 9.0, 7.0, 4.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8759765625, -0.8508224487304688, -0.8256683349609375, -0.8005142211914062, -0.775360107421875, -0.7502059936523438, -0.7250518798828125, -0.6998977661132812, -0.67474365234375, -0.6495895385742188, -0.6244354248046875, -0.5992813110351562, -0.574127197265625, -0.5489730834960938, -0.5238189697265625, -0.49866485595703125, -0.4735107421875, -0.44835662841796875, -0.4232025146484375, -0.39804840087890625, -0.372894287109375, -0.34774017333984375, -0.3225860595703125, -0.29743194580078125, -0.27227783203125, -0.24712371826171875, -0.2219696044921875, -0.19681549072265625, -0.171661376953125, -0.14650726318359375, -0.1213531494140625, -0.09619903564453125, -0.071044921875, -0.04589080810546875, -0.0207366943359375, 0.00441741943359375, 0.029571533203125, 0.05472564697265625, 0.0798797607421875, 0.10503387451171875, 0.13018798828125, 0.15534210205078125, 0.1804962158203125, 0.20565032958984375, 0.230804443359375, 0.25595855712890625, 0.2811126708984375, 0.30626678466796875, 0.3314208984375, 0.35657501220703125, 0.3817291259765625, 0.40688323974609375, 0.432037353515625, 0.45719146728515625, 0.4823455810546875, 0.5074996948242188, 0.53265380859375, 0.5578079223632812, 0.5829620361328125, 0.6081161499023438, 0.633270263671875, 0.6584243774414062, 0.6835784912109375, 0.7087326049804688, 0.73388671875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 9.0, 4.0, 5.0, 11.0, 14.0, 16.0, 19.0, 33.0, 40.0, 62.0, 111.0, 180.0, 274.0, 465.0, 850.0, 2159.0, 6746.0, 35104.0, 281289.0, 646502.0, 59388.0, 10001.0, 2802.0, 1067.0, 576.0, 288.0, 185.0, 126.0, 75.0, 44.0, 37.0, 24.0, 19.0, 8.0, 6.0, 9.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.56640625, -2.48895263671875, -2.4114990234375, -2.33404541015625, -2.256591796875, -2.17913818359375, -2.1016845703125, -2.02423095703125, -1.94677734375, -1.86932373046875, -1.7918701171875, -1.71441650390625, -1.636962890625, -1.55950927734375, -1.4820556640625, -1.40460205078125, -1.3271484375, -1.24969482421875, -1.1722412109375, -1.09478759765625, -1.017333984375, -0.93988037109375, -0.8624267578125, -0.78497314453125, -0.70751953125, -0.63006591796875, -0.5526123046875, -0.47515869140625, -0.397705078125, -0.32025146484375, -0.2427978515625, -0.16534423828125, -0.087890625, -0.01043701171875, 0.0670166015625, 0.14447021484375, 0.221923828125, 0.29937744140625, 0.3768310546875, 0.45428466796875, 0.53173828125, 0.60919189453125, 0.6866455078125, 0.76409912109375, 0.841552734375, 0.91900634765625, 0.9964599609375, 1.07391357421875, 1.1513671875, 1.22882080078125, 1.3062744140625, 1.38372802734375, 1.461181640625, 1.53863525390625, 1.6160888671875, 1.69354248046875, 1.77099609375, 1.84844970703125, 1.9259033203125, 2.00335693359375, 2.080810546875, 2.15826416015625, 2.2357177734375, 2.31317138671875, 2.390625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 9.0, 10.0, 10.0, 9.0, 19.0, 23.0, 14.0, 30.0, 36.0, 39.0, 43.0, 51.0, 75.0, 57.0, 80.0, 60.0, 56.0, 62.0, 60.0, 45.0, 37.0, 34.0, 38.0, 24.0, 15.0, 16.0, 9.0, 8.0, 6.0, 0.0, 7.0, 7.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.73828125, -2.633453369140625, -2.52862548828125, -2.423797607421875, -2.3189697265625, -2.214141845703125, -2.10931396484375, -2.004486083984375, -1.899658203125, -1.794830322265625, -1.69000244140625, -1.585174560546875, -1.4803466796875, -1.375518798828125, -1.27069091796875, -1.165863037109375, -1.06103515625, -0.956207275390625, -0.85137939453125, -0.746551513671875, -0.6417236328125, -0.536895751953125, -0.43206787109375, -0.327239990234375, -0.222412109375, -0.117584228515625, -0.01275634765625, 0.092071533203125, 0.1968994140625, 0.301727294921875, 0.40655517578125, 0.511383056640625, 0.6162109375, 0.721038818359375, 0.82586669921875, 0.930694580078125, 1.0355224609375, 1.140350341796875, 1.24517822265625, 1.350006103515625, 1.454833984375, 1.559661865234375, 1.66448974609375, 1.769317626953125, 1.8741455078125, 1.978973388671875, 2.08380126953125, 2.188629150390625, 2.29345703125, 2.398284912109375, 2.50311279296875, 2.607940673828125, 2.7127685546875, 2.817596435546875, 2.92242431640625, 3.027252197265625, 3.132080078125, 3.236907958984375, 3.34173583984375, 3.446563720703125, 3.5513916015625, 3.656219482421875, 3.76104736328125, 3.865875244140625, 3.970703125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 2.0, 7.0, 7.0, 8.0, 3.0, 14.0, 19.0, 17.0, 24.0, 37.0, 61.0, 98.0, 125.0, 234.0, 386.0, 786.0, 1553.0, 3600.0, 9300.0, 27990.0, 100194.0, 610582.0, 213967.0, 52849.0, 16244.0, 5755.0, 2314.0, 1040.0, 500.0, 300.0, 186.0, 111.0, 73.0, 41.0, 33.0, 28.0, 20.0, 17.0, 11.0, 7.0, 2.0, 8.0, 5.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.5517578125, -0.5363273620605469, -0.5208969116210938, -0.5054664611816406, -0.4900360107421875, -0.4746055603027344, -0.45917510986328125, -0.4437446594238281, -0.428314208984375, -0.4128837585449219, -0.39745330810546875, -0.3820228576660156, -0.3665924072265625, -0.3511619567871094, -0.33573150634765625, -0.3203010559082031, -0.30487060546875, -0.2894401550292969, -0.27400970458984375, -0.2585792541503906, -0.2431488037109375, -0.22771835327148438, -0.21228790283203125, -0.19685745239257812, -0.181427001953125, -0.16599655151367188, -0.15056610107421875, -0.13513565063476562, -0.1197052001953125, -0.10427474975585938, -0.08884429931640625, -0.07341384887695312, -0.0579833984375, -0.042552947998046875, -0.02712249755859375, -0.011692047119140625, 0.0037384033203125, 0.019168853759765625, 0.03459930419921875, 0.050029754638671875, 0.065460205078125, 0.08089065551757812, 0.09632110595703125, 0.11175155639648438, 0.1271820068359375, 0.14261245727539062, 0.15804290771484375, 0.17347335815429688, 0.18890380859375, 0.20433425903320312, 0.21976470947265625, 0.23519515991210938, 0.2506256103515625, 0.2660560607910156, 0.28148651123046875, 0.2969169616699219, 0.312347412109375, 0.3277778625488281, 0.34320831298828125, 0.3586387634277344, 0.3740692138671875, 0.3894996643066406, 0.40493011474609375, 0.4203605651855469, 0.435791015625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 4.0, 4.0, 3.0, 8.0, 6.0, 14.0, 6.0, 15.0, 17.0, 20.0, 35.0, 50.0, 61.0, 86.0, 103.0, 93.0, 115.0, 78.0, 55.0, 45.0, 47.0, 31.0, 28.0, 25.0, 18.0, 8.0, 7.0, 4.0, 5.0, 2.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0001710653305053711, -0.00016509182751178741, -0.00015911832451820374, -0.00015314482152462006, -0.00014717131853103638, -0.0001411978155374527, -0.00013522431254386902, -0.00012925080955028534, -0.00012327730655670166, -0.00011730380356311798, -0.0001113303005695343, -0.00010535679757595062, -9.938329458236694e-05, -9.340979158878326e-05, -8.743628859519958e-05, -8.14627856016159e-05, -7.548928260803223e-05, -6.951577961444855e-05, -6.354227662086487e-05, -5.756877362728119e-05, -5.159527063369751e-05, -4.562176764011383e-05, -3.964826464653015e-05, -3.367476165294647e-05, -2.7701258659362793e-05, -2.1727755665779114e-05, -1.5754252672195435e-05, -9.780749678611755e-06, -3.807246685028076e-06, 2.166256308555603e-06, 8.139759302139282e-06, 1.4113262295722961e-05, 2.008676528930664e-05, 2.606026828289032e-05, 3.2033771276474e-05, 3.800727427005768e-05, 4.398077726364136e-05, 4.995428025722504e-05, 5.5927783250808716e-05, 6.19012862443924e-05, 6.787478923797607e-05, 7.384829223155975e-05, 7.982179522514343e-05, 8.579529821872711e-05, 9.176880121231079e-05, 9.774230420589447e-05, 0.00010371580719947815, 0.00010968931019306183, 0.00011566281318664551, 0.00012163631618022919, 0.00012760981917381287, 0.00013358332216739655, 0.00013955682516098022, 0.0001455303281545639, 0.00015150383114814758, 0.00015747733414173126, 0.00016345083713531494, 0.00016942434012889862, 0.0001753978431224823, 0.00018137134611606598, 0.00018734484910964966, 0.00019331835210323334, 0.00019929185509681702, 0.0002052653580904007, 0.00021123886108398438]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 2.0, 3.0, 2.0, 7.0, 3.0, 8.0, 3.0, 9.0, 23.0, 19.0, 25.0, 34.0, 58.0, 115.0, 220.0, 329.0, 569.0, 1303.0, 3572.0, 12524.0, 61871.0, 630410.0, 280794.0, 42019.0, 9425.0, 2808.0, 1139.0, 582.0, 282.0, 140.0, 90.0, 71.0, 41.0, 15.0, 12.0, 7.0, 7.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.66943359375, -0.649078369140625, -0.62872314453125, -0.608367919921875, -0.5880126953125, -0.567657470703125, -0.54730224609375, -0.526947021484375, -0.506591796875, -0.486236572265625, -0.46588134765625, -0.445526123046875, -0.4251708984375, -0.404815673828125, -0.38446044921875, -0.364105224609375, -0.34375, -0.323394775390625, -0.30303955078125, -0.282684326171875, -0.2623291015625, -0.241973876953125, -0.22161865234375, -0.201263427734375, -0.180908203125, -0.160552978515625, -0.14019775390625, -0.119842529296875, -0.0994873046875, -0.079132080078125, -0.05877685546875, -0.038421630859375, -0.01806640625, 0.002288818359375, 0.02264404296875, 0.042999267578125, 0.0633544921875, 0.083709716796875, 0.10406494140625, 0.124420166015625, 0.144775390625, 0.165130615234375, 0.18548583984375, 0.205841064453125, 0.2261962890625, 0.246551513671875, 0.26690673828125, 0.287261962890625, 0.3076171875, 0.327972412109375, 0.34832763671875, 0.368682861328125, 0.3890380859375, 0.409393310546875, 0.42974853515625, 0.450103759765625, 0.470458984375, 0.490814208984375, 0.51116943359375, 0.531524658203125, 0.5518798828125, 0.572235107421875, 0.59259033203125, 0.612945556640625, 0.63330078125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 3.0, 9.0, 5.0, 10.0, 8.0, 11.0, 10.0, 13.0, 22.0, 20.0, 20.0, 40.0, 43.0, 48.0, 76.0, 80.0, 86.0, 66.0, 72.0, 66.0, 59.0, 42.0, 38.0, 32.0, 23.0, 12.0, 22.0, 10.0, 6.0, 6.0, 7.0, 9.0, 5.0, 3.0, 3.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51806640625, -0.5023002624511719, -0.48653411865234375, -0.4707679748535156, -0.4550018310546875, -0.4392356872558594, -0.42346954345703125, -0.4077033996582031, -0.391937255859375, -0.3761711120605469, -0.36040496826171875, -0.3446388244628906, -0.3288726806640625, -0.3131065368652344, -0.29734039306640625, -0.2815742492675781, -0.26580810546875, -0.2500419616699219, -0.23427581787109375, -0.21850967407226562, -0.2027435302734375, -0.18697738647460938, -0.17121124267578125, -0.15544509887695312, -0.139678955078125, -0.12391281127929688, -0.10814666748046875, -0.09238052368164062, -0.0766143798828125, -0.060848236083984375, -0.04508209228515625, -0.029315948486328125, -0.0135498046875, 0.002216339111328125, 0.01798248291015625, 0.033748626708984375, 0.0495147705078125, 0.06528091430664062, 0.08104705810546875, 0.09681320190429688, 0.112579345703125, 0.12834548950195312, 0.14411163330078125, 0.15987777709960938, 0.1756439208984375, 0.19141006469726562, 0.20717620849609375, 0.22294235229492188, 0.23870849609375, 0.2544746398925781, 0.27024078369140625, 0.2860069274902344, 0.3017730712890625, 0.3175392150878906, 0.33330535888671875, 0.3490715026855469, 0.364837646484375, 0.3806037902832031, 0.39636993408203125, 0.4121360778808594, 0.4279022216796875, 0.4436683654785156, 0.45943450927734375, 0.4752006530761719, 0.490966796875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 3.0, 4.0, 18.0, 10.0, 29.0, 51.0, 102.0, 170.0, 298.0, 132.0, 79.0, 58.0, 23.0, 11.0, 7.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.802608489990234, -20.228418350219727, -19.65422821044922, -19.08003807067871, -18.505847930908203, -17.931657791137695, -17.357467651367188, -16.783279418945312, -16.209087371826172, -15.634897232055664, -15.060707092285156, -14.486516952514648, -13.91232681274414, -13.338136672973633, -12.763947486877441, -12.189757347106934, -11.615568161010742, -11.041378021240234, -10.467187881469727, -9.892997741699219, -9.318807601928711, -8.744617462158203, -8.170428276062012, -7.596238136291504, -7.022047996520996, -6.447857856750488, -5.8736677169799805, -5.299478054046631, -4.725287914276123, -4.151097774505615, -3.5769078731536865, -3.002717971801758, -2.428529739379883, -1.8543397188186646, -1.2801496982574463, -0.705959677696228, -0.13176965713500977, 0.44242048263549805, 1.0166103839874268, 1.5908002853393555, 2.1649904251098633, 2.739180564880371, 3.3133704662323, 3.8875603675842285, 4.461750507354736, 5.035940647125244, 5.610130310058594, 6.184320449829102, 6.758510589599609, 7.332700729370117, 7.906890869140625, 8.481081008911133, 9.05527114868164, 9.629461288452148, 10.20365047454834, 10.777840614318848, 11.352030754089355, 11.926220893859863, 12.500411033630371, 13.074601173400879, 13.64879035949707, 14.222980499267578, 14.797170639038086, 15.371360778808594, 15.945550918579102]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 6.0, 0.0, 2.0, 1.0, 6.0, 5.0, 4.0, 8.0, 12.0, 12.0, 16.0, 22.0, 27.0, 30.0, 22.0, 29.0, 22.0, 32.0, 41.0, 50.0, 81.0, 116.0, 99.0, 57.0, 44.0, 38.0, 32.0, 34.0, 25.0, 31.0, 19.0, 14.0, 9.0, 8.0, 8.0, 11.0, 8.0, 2.0, 7.0, 10.0, 1.0, 4.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.73277759552002, -12.387369155883789, -12.041961669921875, -11.696554183959961, -11.35114574432373, -11.0057373046875, -10.660329818725586, -10.314922332763672, -9.969513893127441, -9.624105453491211, -9.278697967529297, -8.933290481567383, -8.587882041931152, -8.242473602294922, -7.897066116333008, -7.5516581535339355, -7.206250190734863, -6.860842227935791, -6.515434265136719, -6.1700263023376465, -5.824618339538574, -5.479210376739502, -5.13380241394043, -4.788394451141357, -4.442986488342285, -4.097578525543213, -3.7521705627441406, -3.4067625999450684, -3.061354637145996, -2.715946674346924, -2.3705387115478516, -2.0251307487487793, -1.679722785949707, -1.3343148231506348, -0.9889068603515625, -0.6434988975524902, -0.29809093475341797, 0.0473170280456543, 0.39272499084472656, 0.7381329536437988, 1.083540916442871, 1.4289488792419434, 1.7743568420410156, 2.119764804840088, 2.46517276763916, 2.8105807304382324, 3.1559886932373047, 3.501396656036377, 3.846804618835449, 4.1922125816345215, 4.537620544433594, 4.883028507232666, 5.228436470031738, 5.5738444328308105, 5.919252395629883, 6.264660358428955, 6.610068321228027, 6.9554762840271, 7.300884246826172, 7.646292209625244, 7.991700172424316, 8.337108612060547, 8.682516098022461, 9.027923583984375, 9.373332023620605]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 7.0, 11.0, 21.0, 15.0, 26.0, 58.0, 59.0, 93.0, 165.0, 260.0, 455.0, 853.0, 1549.0, 3761.0, 10311.0, 36010.0, 164310.0, 869684.0, 2086854.0, 810885.0, 157041.0, 34599.0, 10060.0, 3675.0, 1571.0, 784.0, 436.0, 288.0, 156.0, 81.0, 75.0, 44.0, 29.0, 21.0, 9.0, 8.0, 6.0, 7.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.662109375, -0.6380157470703125, -0.613922119140625, -0.5898284912109375, -0.56573486328125, -0.5416412353515625, -0.517547607421875, -0.4934539794921875, -0.4693603515625, -0.4452667236328125, -0.421173095703125, -0.3970794677734375, -0.37298583984375, -0.3488922119140625, -0.324798583984375, -0.3007049560546875, -0.276611328125, -0.2525177001953125, -0.228424072265625, -0.2043304443359375, -0.18023681640625, -0.1561431884765625, -0.132049560546875, -0.1079559326171875, -0.0838623046875, -0.0597686767578125, -0.035675048828125, -0.0115814208984375, 0.01251220703125, 0.0366058349609375, 0.060699462890625, 0.0847930908203125, 0.10888671875, 0.1329803466796875, 0.157073974609375, 0.1811676025390625, 0.20526123046875, 0.2293548583984375, 0.253448486328125, 0.2775421142578125, 0.3016357421875, 0.3257293701171875, 0.349822998046875, 0.3739166259765625, 0.39801025390625, 0.4221038818359375, 0.446197509765625, 0.4702911376953125, 0.494384765625, 0.5184783935546875, 0.542572021484375, 0.5666656494140625, 0.59075927734375, 0.6148529052734375, 0.638946533203125, 0.6630401611328125, 0.6871337890625, 0.7112274169921875, 0.735321044921875, 0.7594146728515625, 0.78350830078125, 0.8076019287109375, 0.831695556640625, 0.8557891845703125, 0.8798828125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 7.0, 2.0, 10.0, 6.0, 9.0, 10.0, 17.0, 19.0, 19.0, 24.0, 32.0, 37.0, 37.0, 32.0, 64.0, 44.0, 57.0, 53.0, 57.0, 61.0, 55.0, 48.0, 41.0, 44.0, 48.0, 29.0, 29.0, 27.0, 20.0, 12.0, 18.0, 7.0, 9.0, 11.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76513671875, -0.7414627075195312, -0.7177886962890625, -0.6941146850585938, -0.670440673828125, -0.6467666625976562, -0.6230926513671875, -0.5994186401367188, -0.57574462890625, -0.5520706176757812, -0.5283966064453125, -0.5047225952148438, -0.481048583984375, -0.45737457275390625, -0.4337005615234375, -0.41002655029296875, -0.3863525390625, -0.36267852783203125, -0.3390045166015625, -0.31533050537109375, -0.291656494140625, -0.26798248291015625, -0.2443084716796875, -0.22063446044921875, -0.19696044921875, -0.17328643798828125, -0.1496124267578125, -0.12593841552734375, -0.102264404296875, -0.07859039306640625, -0.0549163818359375, -0.03124237060546875, -0.007568359375, 0.01610565185546875, 0.0397796630859375, 0.06345367431640625, 0.087127685546875, 0.11080169677734375, 0.1344757080078125, 0.15814971923828125, 0.18182373046875, 0.20549774169921875, 0.2291717529296875, 0.25284576416015625, 0.276519775390625, 0.30019378662109375, 0.3238677978515625, 0.34754180908203125, 0.3712158203125, 0.39488983154296875, 0.4185638427734375, 0.44223785400390625, 0.465911865234375, 0.48958587646484375, 0.5132598876953125, 0.5369338989257812, 0.56060791015625, 0.5842819213867188, 0.6079559326171875, 0.6316299438476562, 0.655303955078125, 0.6789779663085938, 0.7026519775390625, 0.7263259887695312, 0.75]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 4.0, 12.0, 10.0, 36.0, 83.0, 181.0, 338.0, 912.0, 11294.0, 4045942.0, 132319.0, 2155.0, 510.0, 266.0, 120.0, 56.0, 26.0, 12.0, 13.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.25, -3.08526611328125, -2.9205322265625, -2.75579833984375, -2.591064453125, -2.42633056640625, -2.2615966796875, -2.09686279296875, -1.93212890625, -1.76739501953125, -1.6026611328125, -1.43792724609375, -1.273193359375, -1.10845947265625, -0.9437255859375, -0.77899169921875, -0.6142578125, -0.44952392578125, -0.2847900390625, -0.12005615234375, 0.044677734375, 0.20941162109375, 0.3741455078125, 0.53887939453125, 0.70361328125, 0.86834716796875, 1.0330810546875, 1.19781494140625, 1.362548828125, 1.52728271484375, 1.6920166015625, 1.85675048828125, 2.021484375, 2.18621826171875, 2.3509521484375, 2.51568603515625, 2.680419921875, 2.84515380859375, 3.0098876953125, 3.17462158203125, 3.33935546875, 3.50408935546875, 3.6688232421875, 3.83355712890625, 3.998291015625, 4.16302490234375, 4.3277587890625, 4.49249267578125, 4.6572265625, 4.82196044921875, 4.9866943359375, 5.15142822265625, 5.316162109375, 5.48089599609375, 5.6456298828125, 5.81036376953125, 5.97509765625, 6.13983154296875, 6.3045654296875, 6.46929931640625, 6.634033203125, 6.79876708984375, 6.9635009765625, 7.12823486328125, 7.29296875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 8.0, 10.0, 13.0, 21.0, 61.0, 133.0, 280.0, 686.0, 1243.0, 869.0, 420.0, 156.0, 81.0, 30.0, 29.0, 8.0, 16.0, 6.0, 2.0, 7.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.869140625, -1.773895263671875, -1.67864990234375, -1.583404541015625, -1.4881591796875, -1.392913818359375, -1.29766845703125, -1.202423095703125, -1.107177734375, -1.011932373046875, -0.91668701171875, -0.821441650390625, -0.7261962890625, -0.630950927734375, -0.53570556640625, -0.440460205078125, -0.34521484375, -0.249969482421875, -0.15472412109375, -0.059478759765625, 0.0357666015625, 0.131011962890625, 0.22625732421875, 0.321502685546875, 0.416748046875, 0.511993408203125, 0.60723876953125, 0.702484130859375, 0.7977294921875, 0.892974853515625, 0.98822021484375, 1.083465576171875, 1.1787109375, 1.273956298828125, 1.36920166015625, 1.464447021484375, 1.5596923828125, 1.654937744140625, 1.75018310546875, 1.845428466796875, 1.940673828125, 2.035919189453125, 2.13116455078125, 2.226409912109375, 2.3216552734375, 2.416900634765625, 2.51214599609375, 2.607391357421875, 2.70263671875, 2.797882080078125, 2.89312744140625, 2.988372802734375, 3.0836181640625, 3.178863525390625, 3.27410888671875, 3.369354248046875, 3.464599609375, 3.559844970703125, 3.65509033203125, 3.750335693359375, 3.8455810546875, 3.940826416015625, 4.03607177734375, 4.131317138671875, 4.2265625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 9.0, 23.0, 60.0, 237.0, 376.0, 198.0, 47.0, 29.0, 10.0, 9.0, 7.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.704120635986328, -22.638961791992188, -21.573802947998047, -20.508642196655273, -19.443483352661133, -18.378324508666992, -17.31316375732422, -16.248004913330078, -15.182846069335938, -14.117687225341797, -13.05252742767334, -11.987367630004883, -10.922208786010742, -9.857049942016602, -8.791890144348145, -7.726730823516846, -6.661571502685547, -5.596412181854248, -4.531252861022949, -3.4660935401916504, -2.4009342193603516, -1.3357748985290527, -0.2706155776977539, 0.7945437431335449, 1.8597030639648438, 2.9248623847961426, 3.9900217056274414, 5.05518102645874, 6.120340347290039, 7.185499668121338, 8.250658988952637, 9.315818786621094, 10.380973815917969, 11.44613265991211, 12.511292457580566, 13.576452255249023, 14.641611099243164, 15.706769943237305, 16.771930694580078, 17.83708953857422, 18.90224838256836, 19.9674072265625, 21.03256607055664, 22.097726821899414, 23.162885665893555, 24.228044509887695, 25.29320526123047, 26.35836410522461, 27.42352294921875, 28.48868179321289, 29.55384063720703, 30.619001388549805, 31.684160232543945, 32.74932098388672, 33.81447982788086, 34.879638671875, 35.94479751586914, 37.00995635986328, 38.07511520385742, 39.14027404785156, 40.20543670654297, 41.27059555053711, 42.33575439453125, 43.40091323852539, 44.46607208251953]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 2.0, 7.0, 8.0, 8.0, 17.0, 18.0, 17.0, 14.0, 34.0, 30.0, 38.0, 21.0, 27.0, 33.0, 39.0, 49.0, 56.0, 44.0, 47.0, 59.0, 46.0, 53.0, 44.0, 32.0, 35.0, 22.0, 33.0, 35.0, 22.0, 21.0, 16.0, 12.0, 12.0, 10.0, 7.0, 6.0, 10.0, 8.0, 0.0, 3.0, 2.0, 6.0, 2.0, 0.0, 2.0], "bins": [-9.743474960327148, -9.488177299499512, -9.232880592346191, -8.977582931518555, -8.722286224365234, -8.466988563537598, -8.211691856384277, -7.956394195556641, -7.701097011566162, -7.445799827575684, -7.190502643585205, -6.935205459594727, -6.67990779876709, -6.4246110916137695, -6.169313430786133, -5.914016246795654, -5.658719062805176, -5.403421878814697, -5.148124694824219, -4.89282751083374, -4.637530326843262, -4.382232666015625, -4.1269354820251465, -3.871638298034668, -3.6163411140441895, -3.361043930053711, -3.1057467460632324, -2.850449323654175, -2.5951521396636963, -2.3398549556732178, -2.08455753326416, -1.8292603492736816, -1.5739641189575195, -1.318666934967041, -1.063369631767273, -0.8080723881721497, -0.5527751445770264, -0.29747796058654785, -0.042180657386779785, 0.21311664581298828, 0.4684138298034668, 0.7237110733985901, 0.9790083169937134, 1.2343056201934814, 1.48960280418396, 1.7448999881744385, 2.000197410583496, 2.2554945945739746, 2.510791778564453, 2.7660889625549316, 3.02138614654541, 3.2766835689544678, 3.5319807529449463, 3.787277936935425, 4.042575359344482, 4.297872543334961, 4.5531697273254395, 4.808466911315918, 5.0637640953063965, 5.319061279296875, 5.574358940124512, 5.829655647277832, 6.084953308105469, 6.340250492095947, 6.595547676086426]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 6.0, 4.0, 5.0, 9.0, 13.0, 17.0, 39.0, 41.0, 71.0, 83.0, 164.0, 259.0, 401.0, 648.0, 1150.0, 1962.0, 3512.0, 6453.0, 12196.0, 24648.0, 53073.0, 124137.0, 276367.0, 292264.0, 136779.0, 58551.0, 26963.0, 13142.0, 6809.0, 3757.0, 2046.0, 1200.0, 646.0, 404.0, 255.0, 172.0, 104.0, 62.0, 42.0, 33.0, 22.0, 18.0, 10.0, 6.0, 4.0, 5.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1015625, -1.064910888671875, -1.02825927734375, -0.991607666015625, -0.9549560546875, -0.918304443359375, -0.88165283203125, -0.845001220703125, -0.808349609375, -0.771697998046875, -0.73504638671875, -0.698394775390625, -0.6617431640625, -0.625091552734375, -0.58843994140625, -0.551788330078125, -0.51513671875, -0.478485107421875, -0.44183349609375, -0.405181884765625, -0.3685302734375, -0.331878662109375, -0.29522705078125, -0.258575439453125, -0.221923828125, -0.185272216796875, -0.14862060546875, -0.111968994140625, -0.0753173828125, -0.038665771484375, -0.00201416015625, 0.034637451171875, 0.0712890625, 0.107940673828125, 0.14459228515625, 0.181243896484375, 0.2178955078125, 0.254547119140625, 0.29119873046875, 0.327850341796875, 0.364501953125, 0.401153564453125, 0.43780517578125, 0.474456787109375, 0.5111083984375, 0.547760009765625, 0.58441162109375, 0.621063232421875, 0.65771484375, 0.694366455078125, 0.73101806640625, 0.767669677734375, 0.8043212890625, 0.840972900390625, 0.87762451171875, 0.914276123046875, 0.950927734375, 0.987579345703125, 1.02423095703125, 1.060882568359375, 1.0975341796875, 1.134185791015625, 1.17083740234375, 1.207489013671875, 1.244140625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 8.0, 2.0, 2.0, 7.0, 7.0, 8.0, 12.0, 14.0, 10.0, 11.0, 10.0, 12.0, 23.0, 31.0, 33.0, 24.0, 26.0, 30.0, 63.0, 42.0, 58.0, 43.0, 57.0, 52.0, 37.0, 42.0, 44.0, 46.0, 24.0, 38.0, 27.0, 23.0, 29.0, 16.0, 20.0, 17.0, 17.0, 8.0, 9.0, 9.0, 3.0, 6.0, 1.0, 5.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.69580078125, -0.6737747192382812, -0.6517486572265625, -0.6297225952148438, -0.607696533203125, -0.5856704711914062, -0.5636444091796875, -0.5416183471679688, -0.51959228515625, -0.49756622314453125, -0.4755401611328125, -0.45351409912109375, -0.431488037109375, -0.40946197509765625, -0.3874359130859375, -0.36540985107421875, -0.3433837890625, -0.32135772705078125, -0.2993316650390625, -0.27730560302734375, -0.255279541015625, -0.23325347900390625, -0.2112274169921875, -0.18920135498046875, -0.16717529296875, -0.14514923095703125, -0.1231231689453125, -0.10109710693359375, -0.079071044921875, -0.05704498291015625, -0.0350189208984375, -0.01299285888671875, 0.009033203125, 0.03105926513671875, 0.0530853271484375, 0.07511138916015625, 0.097137451171875, 0.11916351318359375, 0.1411895751953125, 0.16321563720703125, 0.18524169921875, 0.20726776123046875, 0.2292938232421875, 0.25131988525390625, 0.273345947265625, 0.29537200927734375, 0.3173980712890625, 0.33942413330078125, 0.3614501953125, 0.38347625732421875, 0.4055023193359375, 0.42752838134765625, 0.449554443359375, 0.47158050537109375, 0.4936065673828125, 0.5156326293945312, 0.53765869140625, 0.5596847534179688, 0.5817108154296875, 0.6037368774414062, 0.625762939453125, 0.6477890014648438, 0.6698150634765625, 0.6918411254882812, 0.7138671875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 11.0, 9.0, 12.0, 28.0, 41.0, 72.0, 134.0, 221.0, 465.0, 981.0, 2311.0, 9354.0, 111561.0, 863263.0, 50755.0, 5923.0, 1764.0, 777.0, 392.0, 213.0, 110.0, 62.0, 39.0, 22.0, 12.0, 8.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.544921875, -3.419952392578125, -3.29498291015625, -3.170013427734375, -3.0450439453125, -2.920074462890625, -2.79510498046875, -2.670135498046875, -2.545166015625, -2.420196533203125, -2.29522705078125, -2.170257568359375, -2.0452880859375, -1.920318603515625, -1.79534912109375, -1.670379638671875, -1.54541015625, -1.420440673828125, -1.29547119140625, -1.170501708984375, -1.0455322265625, -0.920562744140625, -0.79559326171875, -0.670623779296875, -0.545654296875, -0.420684814453125, -0.29571533203125, -0.170745849609375, -0.0457763671875, 0.079193115234375, 0.20416259765625, 0.329132080078125, 0.4541015625, 0.579071044921875, 0.70404052734375, 0.829010009765625, 0.9539794921875, 1.078948974609375, 1.20391845703125, 1.328887939453125, 1.453857421875, 1.578826904296875, 1.70379638671875, 1.828765869140625, 1.9537353515625, 2.078704833984375, 2.20367431640625, 2.328643798828125, 2.45361328125, 2.578582763671875, 2.70355224609375, 2.828521728515625, 2.9534912109375, 3.078460693359375, 3.20343017578125, 3.328399658203125, 3.453369140625, 3.578338623046875, 3.70330810546875, 3.828277587890625, 3.9532470703125, 4.078216552734375, 4.20318603515625, 4.328155517578125, 4.453125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 2.0, 6.0, 8.0, 16.0, 14.0, 30.0, 38.0, 56.0, 66.0, 61.0, 74.0, 89.0, 98.0, 99.0, 85.0, 71.0, 52.0, 32.0, 28.0, 22.0, 14.0, 12.0, 13.0, 8.0, 4.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.302734375, -3.153839111328125, -3.00494384765625, -2.856048583984375, -2.7071533203125, -2.558258056640625, -2.40936279296875, -2.260467529296875, -2.111572265625, -1.962677001953125, -1.81378173828125, -1.664886474609375, -1.5159912109375, -1.367095947265625, -1.21820068359375, -1.069305419921875, -0.92041015625, -0.771514892578125, -0.62261962890625, -0.473724365234375, -0.3248291015625, -0.175933837890625, -0.02703857421875, 0.121856689453125, 0.270751953125, 0.419647216796875, 0.56854248046875, 0.717437744140625, 0.8663330078125, 1.015228271484375, 1.16412353515625, 1.313018798828125, 1.4619140625, 1.610809326171875, 1.75970458984375, 1.908599853515625, 2.0574951171875, 2.206390380859375, 2.35528564453125, 2.504180908203125, 2.653076171875, 2.801971435546875, 2.95086669921875, 3.099761962890625, 3.2486572265625, 3.397552490234375, 3.54644775390625, 3.695343017578125, 3.84423828125, 3.993133544921875, 4.14202880859375, 4.290924072265625, 4.4398193359375, 4.588714599609375, 4.73760986328125, 4.886505126953125, 5.035400390625, 5.184295654296875, 5.33319091796875, 5.482086181640625, 5.6309814453125, 5.779876708984375, 5.92877197265625, 6.077667236328125, 6.2265625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 7.0, 6.0, 5.0, 7.0, 23.0, 27.0, 40.0, 51.0, 114.0, 234.0, 469.0, 1113.0, 3112.0, 11848.0, 72676.0, 792554.0, 140268.0, 18943.0, 4427.0, 1424.0, 613.0, 251.0, 140.0, 63.0, 55.0, 28.0, 24.0, 12.0, 6.0, 8.0, 11.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6572265625, -0.6315994262695312, -0.6059722900390625, -0.5803451538085938, -0.554718017578125, -0.5290908813476562, -0.5034637451171875, -0.47783660888671875, -0.45220947265625, -0.42658233642578125, -0.4009552001953125, -0.37532806396484375, -0.349700927734375, -0.32407379150390625, -0.2984466552734375, -0.27281951904296875, -0.2471923828125, -0.22156524658203125, -0.1959381103515625, -0.17031097412109375, -0.144683837890625, -0.11905670166015625, -0.0934295654296875, -0.06780242919921875, -0.04217529296875, -0.01654815673828125, 0.0090789794921875, 0.03470611572265625, 0.060333251953125, 0.08596038818359375, 0.1115875244140625, 0.13721466064453125, 0.162841796875, 0.18846893310546875, 0.2140960693359375, 0.23972320556640625, 0.265350341796875, 0.29097747802734375, 0.3166046142578125, 0.34223175048828125, 0.36785888671875, 0.39348602294921875, 0.4191131591796875, 0.44474029541015625, 0.470367431640625, 0.49599456787109375, 0.5216217041015625, 0.5472488403320312, 0.5728759765625, 0.5985031127929688, 0.6241302490234375, 0.6497573852539062, 0.675384521484375, 0.7010116577148438, 0.7266387939453125, 0.7522659301757812, 0.77789306640625, 0.8035202026367188, 0.8291473388671875, 0.8547744750976562, 0.880401611328125, 0.9060287475585938, 0.9316558837890625, 0.9572830200195312, 0.98291015625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 5.0, 1.0, 4.0, 2.0, 2.0, 3.0, 11.0, 11.0, 11.0, 31.0, 35.0, 42.0, 77.0, 112.0, 173.0, 166.0, 115.0, 58.0, 37.0, 36.0, 19.0, 12.0, 16.0, 14.0, 5.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00038623809814453125, -0.00037449970841407776, -0.00036276131868362427, -0.0003510229289531708, -0.0003392845392227173, -0.0003275461494922638, -0.0003158077597618103, -0.0003040693700313568, -0.0002923309803009033, -0.00028059259057044983, -0.00026885420083999634, -0.00025711581110954285, -0.00024537742137908936, -0.00023363903164863586, -0.00022190064191818237, -0.00021016225218772888, -0.0001984238624572754, -0.0001866854727268219, -0.0001749470829963684, -0.00016320869326591492, -0.00015147030353546143, -0.00013973191380500793, -0.00012799352407455444, -0.00011625513434410095, -0.00010451674461364746, -9.277835488319397e-05, -8.103996515274048e-05, -6.930157542228699e-05, -5.7563185691833496e-05, -4.5824795961380005e-05, -3.4086406230926514e-05, -2.2348016500473022e-05, -1.0609626770019531e-05, 1.12876296043396e-06, 1.2867152690887451e-05, 2.4605542421340942e-05, 3.6343932151794434e-05, 4.8082321882247925e-05, 5.9820711612701416e-05, 7.155910134315491e-05, 8.32974910736084e-05, 9.503588080406189e-05, 0.00010677427053451538, 0.00011851266026496887, 0.00013025104999542236, 0.00014198943972587585, 0.00015372782945632935, 0.00016546621918678284, 0.00017720460891723633, 0.00018894299864768982, 0.0002006813883781433, 0.0002124197781085968, 0.0002241581678390503, 0.00023589655756950378, 0.0002476349472999573, 0.00025937333703041077, 0.00027111172676086426, 0.00028285011649131775, 0.00029458850622177124, 0.00030632689595222473, 0.0003180652856826782, 0.0003298036754131317, 0.0003415420651435852, 0.0003532804548740387, 0.0003650188446044922]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 7.0, 4.0, 3.0, 6.0, 7.0, 17.0, 22.0, 29.0, 38.0, 58.0, 79.0, 178.0, 290.0, 448.0, 920.0, 2232.0, 6509.0, 28665.0, 224388.0, 709796.0, 58325.0, 10637.0, 3198.0, 1277.0, 584.0, 315.0, 187.0, 109.0, 82.0, 46.0, 32.0, 28.0, 10.0, 7.0, 9.0, 3.0, 1.0, 4.0, 4.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.63671875, -0.616302490234375, -0.59588623046875, -0.575469970703125, -0.5550537109375, -0.534637451171875, -0.51422119140625, -0.493804931640625, -0.473388671875, -0.452972412109375, -0.43255615234375, -0.412139892578125, -0.3917236328125, -0.371307373046875, -0.35089111328125, -0.330474853515625, -0.31005859375, -0.289642333984375, -0.26922607421875, -0.248809814453125, -0.2283935546875, -0.207977294921875, -0.18756103515625, -0.167144775390625, -0.146728515625, -0.126312255859375, -0.10589599609375, -0.085479736328125, -0.0650634765625, -0.044647216796875, -0.02423095703125, -0.003814697265625, 0.0166015625, 0.037017822265625, 0.05743408203125, 0.077850341796875, 0.0982666015625, 0.118682861328125, 0.13909912109375, 0.159515380859375, 0.179931640625, 0.200347900390625, 0.22076416015625, 0.241180419921875, 0.2615966796875, 0.282012939453125, 0.30242919921875, 0.322845458984375, 0.34326171875, 0.363677978515625, 0.38409423828125, 0.404510498046875, 0.4249267578125, 0.445343017578125, 0.46575927734375, 0.486175537109375, 0.506591796875, 0.527008056640625, 0.54742431640625, 0.567840576171875, 0.5882568359375, 0.608673095703125, 0.62908935546875, 0.649505615234375, 0.669921875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 2.0, 3.0, 5.0, 8.0, 3.0, 3.0, 10.0, 11.0, 21.0, 23.0, 27.0, 26.0, 37.0, 44.0, 52.0, 62.0, 76.0, 79.0, 81.0, 88.0, 64.0, 49.0, 48.0, 40.0, 30.0, 30.0, 19.0, 15.0, 9.0, 9.0, 6.0, 6.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.58056640625, -0.5638885498046875, -0.547210693359375, -0.5305328369140625, -0.51385498046875, -0.4971771240234375, -0.480499267578125, -0.4638214111328125, -0.4471435546875, -0.4304656982421875, -0.413787841796875, -0.3971099853515625, -0.38043212890625, -0.3637542724609375, -0.347076416015625, -0.3303985595703125, -0.313720703125, -0.2970428466796875, -0.280364990234375, -0.2636871337890625, -0.24700927734375, -0.2303314208984375, -0.213653564453125, -0.1969757080078125, -0.1802978515625, -0.1636199951171875, -0.146942138671875, -0.1302642822265625, -0.11358642578125, -0.0969085693359375, -0.080230712890625, -0.0635528564453125, -0.046875, -0.0301971435546875, -0.013519287109375, 0.0031585693359375, 0.01983642578125, 0.0365142822265625, 0.053192138671875, 0.0698699951171875, 0.0865478515625, 0.1032257080078125, 0.119903564453125, 0.1365814208984375, 0.15325927734375, 0.1699371337890625, 0.186614990234375, 0.2032928466796875, 0.219970703125, 0.2366485595703125, 0.253326416015625, 0.2700042724609375, 0.28668212890625, 0.3033599853515625, 0.320037841796875, 0.3367156982421875, 0.3533935546875, 0.3700714111328125, 0.386749267578125, 0.4034271240234375, 0.42010498046875, 0.4367828369140625, 0.453460693359375, 0.4701385498046875, 0.48681640625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 3.0, 9.0, 11.0, 42.0, 60.0, 126.0, 382.0, 180.0, 96.0, 47.0, 21.0, 9.0, 7.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.90968132019043, -23.1590576171875, -22.40843391418457, -21.65781021118164, -20.907188415527344, -20.156564712524414, -19.405941009521484, -18.655317306518555, -17.904693603515625, -17.154069900512695, -16.403446197509766, -15.652823448181152, -14.902199745178223, -14.151576042175293, -13.40095329284668, -12.65032958984375, -11.89970588684082, -11.14908218383789, -10.398458480834961, -9.647835731506348, -8.897212028503418, -8.146588325500488, -7.395965099334717, -6.645341873168945, -5.894718170166016, -5.144094467163086, -4.3934712409973145, -3.642847776412964, -2.8922243118286133, -2.1416008472442627, -1.390977382659912, -0.6403541564941406, 0.11027145385742188, 0.8608949184417725, 1.611518383026123, 2.3621418476104736, 3.112765312194824, 3.863388776779175, 4.614012241363525, 5.364635467529297, 6.115259170532227, 6.865882873535156, 7.616506099700928, 8.3671293258667, 9.117753028869629, 9.868376731872559, 10.618999481201172, 11.369623184204102, 12.120246887207031, 12.870870590209961, 13.62149429321289, 14.372117042541504, 15.122740745544434, 15.873364448547363, 16.623987197875977, 17.374610900878906, 18.125234603881836, 18.875858306884766, 19.626482009887695, 20.377105712890625, 21.127727508544922, 21.87835121154785, 22.62897491455078, 23.37959861755371, 24.13022232055664]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 6.0, 6.0, 10.0, 15.0, 13.0, 15.0, 17.0, 27.0, 28.0, 29.0, 31.0, 44.0, 36.0, 48.0, 161.0, 167.0, 59.0, 41.0, 37.0, 27.0, 24.0, 36.0, 15.0, 24.0, 19.0, 15.0, 12.0, 10.0, 12.0, 4.0, 3.0, 7.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.678079605102539, -15.230937004089355, -14.783794403076172, -14.336651802062988, -13.889509201049805, -13.442366600036621, -12.995223999023438, -12.548081398010254, -12.10093879699707, -11.653796195983887, -11.206653594970703, -10.75951099395752, -10.312368392944336, -9.865225791931152, -9.418083190917969, -8.970940589904785, -8.523797988891602, -8.076655387878418, -7.629512786865234, -7.182370185852051, -6.735227584838867, -6.288084983825684, -5.8409423828125, -5.393799781799316, -4.946658134460449, -4.499515533447266, -4.052372932434082, -3.6052303314208984, -3.158087730407715, -2.7109453678131104, -2.2638027667999268, -1.8166601657867432, -1.3695173263549805, -0.9223747253417969, -0.47523218393325806, -0.02808964252471924, 0.41905295848846436, 0.8661954402923584, 1.313338041305542, 1.7604806423187256, 2.207623243331909, 2.6547658443450928, 3.1019084453582764, 3.549050807952881, 3.9961934089660645, 4.443336009979248, 4.890478610992432, 5.337621212005615, 5.784763813018799, 6.231906414031982, 6.679049015045166, 7.12619161605835, 7.573334217071533, 8.020476341247559, 8.467618942260742, 8.914761543273926, 9.36190414428711, 9.809046745300293, 10.256189346313477, 10.70333194732666, 11.150474548339844, 11.597617149353027, 12.044759750366211, 12.491902351379395, 12.939044952392578]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 4.0, 5.0, 6.0, 10.0, 13.0, 18.0, 35.0, 43.0, 57.0, 77.0, 113.0, 156.0, 227.0, 334.0, 507.0, 770.0, 1087.0, 1849.0, 3190.0, 5680.0, 11227.0, 24845.0, 62065.0, 173317.0, 488745.0, 1094812.0, 1272543.0, 646446.0, 253231.0, 88605.0, 32848.0, 14271.0, 7064.0, 3948.0, 2168.0, 1299.0, 849.0, 552.0, 376.0, 243.0, 176.0, 128.0, 97.0, 66.0, 45.0, 40.0, 27.0, 18.0, 17.0, 9.0, 16.0, 7.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.62744140625, -0.605926513671875, -0.58441162109375, -0.562896728515625, -0.5413818359375, -0.519866943359375, -0.49835205078125, -0.476837158203125, -0.455322265625, -0.433807373046875, -0.41229248046875, -0.390777587890625, -0.3692626953125, -0.347747802734375, -0.32623291015625, -0.304718017578125, -0.283203125, -0.261688232421875, -0.24017333984375, -0.218658447265625, -0.1971435546875, -0.175628662109375, -0.15411376953125, -0.132598876953125, -0.111083984375, -0.089569091796875, -0.06805419921875, -0.046539306640625, -0.0250244140625, -0.003509521484375, 0.01800537109375, 0.039520263671875, 0.06103515625, 0.082550048828125, 0.10406494140625, 0.125579833984375, 0.1470947265625, 0.168609619140625, 0.19012451171875, 0.211639404296875, 0.233154296875, 0.254669189453125, 0.27618408203125, 0.297698974609375, 0.3192138671875, 0.340728759765625, 0.36224365234375, 0.383758544921875, 0.4052734375, 0.426788330078125, 0.44830322265625, 0.469818115234375, 0.4913330078125, 0.512847900390625, 0.53436279296875, 0.555877685546875, 0.577392578125, 0.598907470703125, 0.62042236328125, 0.641937255859375, 0.6634521484375, 0.684967041015625, 0.70648193359375, 0.727996826171875, 0.74951171875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 3.0, 3.0, 4.0, 7.0, 6.0, 14.0, 14.0, 10.0, 11.0, 23.0, 15.0, 20.0, 27.0, 18.0, 28.0, 25.0, 22.0, 48.0, 39.0, 39.0, 41.0, 44.0, 47.0, 45.0, 45.0, 43.0, 44.0, 49.0, 34.0, 34.0, 32.0, 30.0, 28.0, 22.0, 13.0, 18.0, 8.0, 17.0, 7.0, 4.0, 6.0, 8.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.59228515625, -0.5721893310546875, -0.552093505859375, -0.5319976806640625, -0.51190185546875, -0.4918060302734375, -0.471710205078125, -0.4516143798828125, -0.4315185546875, -0.4114227294921875, -0.391326904296875, -0.3712310791015625, -0.35113525390625, -0.3310394287109375, -0.310943603515625, -0.2908477783203125, -0.270751953125, -0.2506561279296875, -0.230560302734375, -0.2104644775390625, -0.19036865234375, -0.1702728271484375, -0.150177001953125, -0.1300811767578125, -0.1099853515625, -0.0898895263671875, -0.069793701171875, -0.0496978759765625, -0.02960205078125, -0.0095062255859375, 0.010589599609375, 0.0306854248046875, 0.05078125, 0.0708770751953125, 0.090972900390625, 0.1110687255859375, 0.13116455078125, 0.1512603759765625, 0.171356201171875, 0.1914520263671875, 0.2115478515625, 0.2316436767578125, 0.251739501953125, 0.2718353271484375, 0.29193115234375, 0.3120269775390625, 0.332122802734375, 0.3522186279296875, 0.372314453125, 0.3924102783203125, 0.412506103515625, 0.4326019287109375, 0.45269775390625, 0.4727935791015625, 0.492889404296875, 0.5129852294921875, 0.5330810546875, 0.5531768798828125, 0.573272705078125, 0.5933685302734375, 0.61346435546875, 0.6335601806640625, 0.653656005859375, 0.6737518310546875, 0.69384765625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 7.0, 5.0, 6.0, 19.0, 26.0, 42.0, 61.0, 101.0, 173.0, 344.0, 654.0, 1270.0, 3741.0, 28064.0, 3798826.0, 347729.0, 8903.0, 2278.0, 941.0, 483.0, 259.0, 159.0, 74.0, 47.0, 21.0, 17.0, 12.0, 6.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.09765625, -4.9510498046875, -4.804443359375, -4.6578369140625, -4.51123046875, -4.3646240234375, -4.218017578125, -4.0714111328125, -3.9248046875, -3.7781982421875, -3.631591796875, -3.4849853515625, -3.33837890625, -3.1917724609375, -3.045166015625, -2.8985595703125, -2.751953125, -2.6053466796875, -2.458740234375, -2.3121337890625, -2.16552734375, -2.0189208984375, -1.872314453125, -1.7257080078125, -1.5791015625, -1.4324951171875, -1.285888671875, -1.1392822265625, -0.99267578125, -0.8460693359375, -0.699462890625, -0.5528564453125, -0.40625, -0.2596435546875, -0.113037109375, 0.0335693359375, 0.18017578125, 0.3267822265625, 0.473388671875, 0.6199951171875, 0.7666015625, 0.9132080078125, 1.059814453125, 1.2064208984375, 1.35302734375, 1.4996337890625, 1.646240234375, 1.7928466796875, 1.939453125, 2.0860595703125, 2.232666015625, 2.3792724609375, 2.52587890625, 2.6724853515625, 2.819091796875, 2.9656982421875, 3.1123046875, 3.2589111328125, 3.405517578125, 3.5521240234375, 3.69873046875, 3.8453369140625, 3.991943359375, 4.1385498046875, 4.28515625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 5.0, 12.0, 9.0, 15.0, 24.0, 36.0, 48.0, 73.0, 120.0, 197.0, 255.0, 403.0, 587.0, 679.0, 554.0, 368.0, 222.0, 135.0, 117.0, 65.0, 58.0, 31.0, 19.0, 16.0, 10.0, 9.0, 6.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.07421875, -1.989105224609375, -1.90399169921875, -1.818878173828125, -1.7337646484375, -1.648651123046875, -1.56353759765625, -1.478424072265625, -1.393310546875, -1.308197021484375, -1.22308349609375, -1.137969970703125, -1.0528564453125, -0.967742919921875, -0.88262939453125, -0.797515869140625, -0.71240234375, -0.627288818359375, -0.54217529296875, -0.457061767578125, -0.3719482421875, -0.286834716796875, -0.20172119140625, -0.116607666015625, -0.031494140625, 0.053619384765625, 0.13873291015625, 0.223846435546875, 0.3089599609375, 0.394073486328125, 0.47918701171875, 0.564300537109375, 0.6494140625, 0.734527587890625, 0.81964111328125, 0.904754638671875, 0.9898681640625, 1.074981689453125, 1.16009521484375, 1.245208740234375, 1.330322265625, 1.415435791015625, 1.50054931640625, 1.585662841796875, 1.6707763671875, 1.755889892578125, 1.84100341796875, 1.926116943359375, 2.01123046875, 2.096343994140625, 2.18145751953125, 2.266571044921875, 2.3516845703125, 2.436798095703125, 2.52191162109375, 2.607025146484375, 2.692138671875, 2.777252197265625, 2.86236572265625, 2.947479248046875, 3.0325927734375, 3.117706298828125, 3.20281982421875, 3.287933349609375, 3.373046875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 12.0, 28.0, 70.0, 215.0, 372.0, 201.0, 66.0, 22.0, 9.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.13917541503906, -50.42607879638672, -48.71297836303711, -46.999881744384766, -45.286781311035156, -43.57368469238281, -41.86058807373047, -40.14748764038086, -38.434391021728516, -36.72129440307617, -35.00819396972656, -33.29509735107422, -31.581998825073242, -29.868900299072266, -28.15580177307129, -26.442703247070312, -24.729604721069336, -23.01650619506836, -21.303407669067383, -19.590309143066406, -17.877212524414062, -16.164113998413086, -14.45101547241211, -12.73791790008545, -11.024819374084473, -9.311720848083496, -7.598623275756836, -5.885524749755859, -4.172426700592041, -2.4593286514282227, -0.7462301254272461, 0.9668674468994141, 2.6799659729003906, 4.393064022064209, 6.106162071228027, 7.819260597229004, 9.532358169555664, 11.24545669555664, 12.958555221557617, 14.671652793884277, 16.384750366210938, 18.097848892211914, 19.81094741821289, 21.524044036865234, 23.23714256286621, 24.950241088867188, 26.663339614868164, 28.37643814086914, 30.089536666870117, 31.802635192871094, 33.51573181152344, 35.22883224487305, 36.94192886352539, 38.655029296875, 40.368125915527344, 42.08122253417969, 43.7943229675293, 45.50741958618164, 47.22052001953125, 48.933616638183594, 50.6467170715332, 52.35981369018555, 54.072914123535156, 55.7860107421875, 57.499107360839844]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 5.0, 7.0, 11.0, 8.0, 14.0, 17.0, 22.0, 16.0, 28.0, 30.0, 32.0, 50.0, 40.0, 52.0, 45.0, 66.0, 68.0, 60.0, 52.0, 39.0, 58.0, 36.0, 44.0, 49.0, 23.0, 28.0, 25.0, 18.0, 15.0, 8.0, 15.0, 6.0, 11.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.97799301147461, -15.527382850646973, -15.076772689819336, -14.626163482666016, -14.175553321838379, -13.724943161010742, -13.274333953857422, -12.823723793029785, -12.373113632202148, -11.922503471374512, -11.471893310546875, -11.021284103393555, -10.570673942565918, -10.120063781738281, -9.669454574584961, -9.218844413757324, -8.768234252929688, -8.31762409210205, -7.867014408111572, -7.416404724121094, -6.965794563293457, -6.51518440246582, -6.064574718475342, -5.613965034484863, -5.163354873657227, -4.71274471282959, -4.262135028839111, -3.8115251064300537, -3.360915184020996, -2.9103052616119385, -2.459695339202881, -2.0090854167938232, -1.558476448059082, -1.1078665256500244, -0.6572566032409668, -0.20664668083190918, 0.24396324157714844, 0.694573163986206, 1.1451830863952637, 1.5957930088043213, 2.046402931213379, 2.4970128536224365, 2.947622776031494, 3.3982326984405518, 3.8488426208496094, 4.299452781677246, 4.750062465667725, 5.200672149658203, 5.65128231048584, 6.101892471313477, 6.552502155303955, 7.003111839294434, 7.45372200012207, 7.904332160949707, 8.354942321777344, 8.805551528930664, 9.2561616897583, 9.706771850585938, 10.157381057739258, 10.607991218566895, 11.058601379394531, 11.509211540222168, 11.959821701049805, 12.410430908203125, 12.861041069030762]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 5.0, 5.0, 11.0, 19.0, 22.0, 26.0, 46.0, 83.0, 123.0, 226.0, 385.0, 703.0, 1305.0, 2775.0, 5966.0, 14075.0, 36857.0, 109745.0, 470004.0, 284189.0, 75438.0, 26602.0, 10569.0, 4651.0, 2230.0, 1048.0, 587.0, 353.0, 177.0, 108.0, 72.0, 49.0, 28.0, 16.0, 11.0, 14.0, 14.0, 7.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4453125, -1.3999176025390625, -1.354522705078125, -1.3091278076171875, -1.26373291015625, -1.2183380126953125, -1.172943115234375, -1.1275482177734375, -1.0821533203125, -1.0367584228515625, -0.991363525390625, -0.9459686279296875, -0.90057373046875, -0.8551788330078125, -0.809783935546875, -0.7643890380859375, -0.718994140625, -0.6735992431640625, -0.628204345703125, -0.5828094482421875, -0.53741455078125, -0.4920196533203125, -0.446624755859375, -0.4012298583984375, -0.3558349609375, -0.3104400634765625, -0.265045166015625, -0.2196502685546875, -0.17425537109375, -0.1288604736328125, -0.083465576171875, -0.0380706787109375, 0.00732421875, 0.0527191162109375, 0.098114013671875, 0.1435089111328125, 0.18890380859375, 0.2342987060546875, 0.279693603515625, 0.3250885009765625, 0.3704833984375, 0.4158782958984375, 0.461273193359375, 0.5066680908203125, 0.55206298828125, 0.5974578857421875, 0.642852783203125, 0.6882476806640625, 0.733642578125, 0.7790374755859375, 0.824432373046875, 0.8698272705078125, 0.91522216796875, 0.9606170654296875, 1.006011962890625, 1.0514068603515625, 1.0968017578125, 1.1421966552734375, 1.187591552734375, 1.2329864501953125, 1.27838134765625, 1.3237762451171875, 1.369171142578125, 1.4145660400390625, 1.4599609375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 5.0, 16.0, 15.0, 11.0, 17.0, 26.0, 25.0, 33.0, 39.0, 44.0, 49.0, 62.0, 67.0, 63.0, 57.0, 59.0, 55.0, 54.0, 51.0, 45.0, 44.0, 37.0, 32.0, 19.0, 23.0, 10.0, 11.0, 11.0, 8.0, 8.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.2626953125, -1.2306671142578125, -1.198638916015625, -1.1666107177734375, -1.13458251953125, -1.1025543212890625, -1.070526123046875, -1.0384979248046875, -1.0064697265625, -0.9744415283203125, -0.942413330078125, -0.9103851318359375, -0.87835693359375, -0.8463287353515625, -0.814300537109375, -0.7822723388671875, -0.750244140625, -0.7182159423828125, -0.686187744140625, -0.6541595458984375, -0.62213134765625, -0.5901031494140625, -0.558074951171875, -0.5260467529296875, -0.4940185546875, -0.4619903564453125, -0.429962158203125, -0.3979339599609375, -0.36590576171875, -0.3338775634765625, -0.301849365234375, -0.2698211669921875, -0.23779296875, -0.2057647705078125, -0.173736572265625, -0.1417083740234375, -0.10968017578125, -0.0776519775390625, -0.045623779296875, -0.0135955810546875, 0.0184326171875, 0.0504608154296875, 0.082489013671875, 0.1145172119140625, 0.14654541015625, 0.1785736083984375, 0.210601806640625, 0.2426300048828125, 0.274658203125, 0.3066864013671875, 0.338714599609375, 0.3707427978515625, 0.40277099609375, 0.4347991943359375, 0.466827392578125, 0.4988555908203125, 0.5308837890625, 0.5629119873046875, 0.594940185546875, 0.6269683837890625, 0.65899658203125, 0.6910247802734375, 0.723052978515625, 0.7550811767578125, 0.787109375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 6.0, 14.0, 14.0, 11.0, 9.0, 29.0, 31.0, 48.0, 86.0, 104.0, 193.0, 240.0, 417.0, 767.0, 1629.0, 4390.0, 17265.0, 108547.0, 838035.0, 59868.0, 10805.0, 3122.0, 1250.0, 635.0, 360.0, 223.0, 143.0, 74.0, 66.0, 44.0, 36.0, 30.0, 26.0, 11.0, 7.0, 5.0, 3.0, 3.0, 5.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9521484375, -1.8878326416015625, -1.823516845703125, -1.7592010498046875, -1.69488525390625, -1.6305694580078125, -1.566253662109375, -1.5019378662109375, -1.4376220703125, -1.3733062744140625, -1.308990478515625, -1.2446746826171875, -1.18035888671875, -1.1160430908203125, -1.051727294921875, -0.9874114990234375, -0.923095703125, -0.8587799072265625, -0.794464111328125, -0.7301483154296875, -0.66583251953125, -0.6015167236328125, -0.537200927734375, -0.4728851318359375, -0.4085693359375, -0.3442535400390625, -0.279937744140625, -0.2156219482421875, -0.15130615234375, -0.0869903564453125, -0.022674560546875, 0.0416412353515625, 0.10595703125, 0.1702728271484375, 0.234588623046875, 0.2989044189453125, 0.36322021484375, 0.4275360107421875, 0.491851806640625, 0.5561676025390625, 0.6204833984375, 0.6847991943359375, 0.749114990234375, 0.8134307861328125, 0.87774658203125, 0.9420623779296875, 1.006378173828125, 1.0706939697265625, 1.135009765625, 1.1993255615234375, 1.263641357421875, 1.3279571533203125, 1.39227294921875, 1.4565887451171875, 1.520904541015625, 1.5852203369140625, 1.6495361328125, 1.7138519287109375, 1.778167724609375, 1.8424835205078125, 1.90679931640625, 1.9711151123046875, 2.035430908203125, 2.0997467041015625, 2.1640625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 7.0, 8.0, 6.0, 14.0, 6.0, 7.0, 9.0, 19.0, 16.0, 18.0, 19.0, 18.0, 28.0, 24.0, 22.0, 34.0, 40.0, 46.0, 52.0, 78.0, 67.0, 71.0, 58.0, 57.0, 32.0, 40.0, 29.0, 19.0, 27.0, 10.0, 20.0, 13.0, 9.0, 12.0, 10.0, 12.0, 9.0, 11.0, 7.0, 3.0, 7.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 2.0], "bins": [-3.1796875, -3.087432861328125, -2.99517822265625, -2.902923583984375, -2.8106689453125, -2.718414306640625, -2.62615966796875, -2.533905029296875, -2.441650390625, -2.349395751953125, -2.25714111328125, -2.164886474609375, -2.0726318359375, -1.980377197265625, -1.88812255859375, -1.795867919921875, -1.70361328125, -1.611358642578125, -1.51910400390625, -1.426849365234375, -1.3345947265625, -1.242340087890625, -1.15008544921875, -1.057830810546875, -0.965576171875, -0.873321533203125, -0.78106689453125, -0.688812255859375, -0.5965576171875, -0.504302978515625, -0.41204833984375, -0.319793701171875, -0.2275390625, -0.135284423828125, -0.04302978515625, 0.049224853515625, 0.1414794921875, 0.233734130859375, 0.32598876953125, 0.418243408203125, 0.510498046875, 0.602752685546875, 0.69500732421875, 0.787261962890625, 0.8795166015625, 0.971771240234375, 1.06402587890625, 1.156280517578125, 1.24853515625, 1.340789794921875, 1.43304443359375, 1.525299072265625, 1.6175537109375, 1.709808349609375, 1.80206298828125, 1.894317626953125, 1.986572265625, 2.078826904296875, 2.17108154296875, 2.263336181640625, 2.3555908203125, 2.447845458984375, 2.54010009765625, 2.632354736328125, 2.724609375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 8.0, 11.0, 12.0, 12.0, 18.0, 22.0, 24.0, 35.0, 43.0, 54.0, 108.0, 156.0, 266.0, 523.0, 1078.0, 2669.0, 7526.0, 29994.0, 719766.0, 247471.0, 27092.0, 7039.0, 2428.0, 955.0, 481.0, 274.0, 135.0, 97.0, 60.0, 46.0, 34.0, 31.0, 15.0, 17.0, 9.0, 9.0, 10.0, 7.0, 3.0, 2.0, 4.0, 1.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.47802734375, -0.4635276794433594, -0.44902801513671875, -0.4345283508300781, -0.4200286865234375, -0.4055290222167969, -0.39102935791015625, -0.3765296936035156, -0.362030029296875, -0.3475303649902344, -0.33303070068359375, -0.3185310363769531, -0.3040313720703125, -0.2895317077636719, -0.27503204345703125, -0.2605323791503906, -0.24603271484375, -0.23153305053710938, -0.21703338623046875, -0.20253372192382812, -0.1880340576171875, -0.17353439331054688, -0.15903472900390625, -0.14453506469726562, -0.130035400390625, -0.11553573608398438, -0.10103607177734375, -0.08653640747070312, -0.0720367431640625, -0.057537078857421875, -0.04303741455078125, -0.028537750244140625, -0.0140380859375, 0.000461578369140625, 0.01496124267578125, 0.029460906982421875, 0.0439605712890625, 0.058460235595703125, 0.07295989990234375, 0.08745956420898438, 0.101959228515625, 0.11645889282226562, 0.13095855712890625, 0.14545822143554688, 0.1599578857421875, 0.17445755004882812, 0.18895721435546875, 0.20345687866210938, 0.21795654296875, 0.23245620727539062, 0.24695587158203125, 0.2614555358886719, 0.2759552001953125, 0.2904548645019531, 0.30495452880859375, 0.3194541931152344, 0.333953857421875, 0.3484535217285156, 0.36295318603515625, 0.3774528503417969, 0.3919525146484375, 0.4064521789550781, 0.42095184326171875, 0.4354515075683594, 0.449951171875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 2.0, 7.0, 12.0, 10.0, 14.0, 20.0, 18.0, 22.0, 59.0, 100.0, 149.0, 186.0, 145.0, 77.0, 43.0, 30.0, 24.0, 16.0, 12.0, 4.0, 11.0, 8.0, 1.0, 6.0, 1.0, 2.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00027751922607421875, -0.00026943907141685486, -0.00026135891675949097, -0.0002532787621021271, -0.0002451986074447632, -0.0002371184527873993, -0.0002290382981300354, -0.0002209581434726715, -0.00021287798881530762, -0.00020479783415794373, -0.00019671767950057983, -0.00018863752484321594, -0.00018055737018585205, -0.00017247721552848816, -0.00016439706087112427, -0.00015631690621376038, -0.00014823675155639648, -0.0001401565968990326, -0.0001320764422416687, -0.0001239962875843048, -0.00011591613292694092, -0.00010783597826957703, -9.975582361221313e-05, -9.167566895484924e-05, -8.359551429748535e-05, -7.551535964012146e-05, -6.743520498275757e-05, -5.935505032539368e-05, -5.1274895668029785e-05, -4.3194741010665894e-05, -3.5114586353302e-05, -2.703443169593811e-05, -1.895427703857422e-05, -1.0874122381210327e-05, -2.7939677238464355e-06, 5.286186933517456e-06, 1.3366341590881348e-05, 2.144649624824524e-05, 2.952665090560913e-05, 3.760680556297302e-05, 4.5686960220336914e-05, 5.3767114877700806e-05, 6.18472695350647e-05, 6.992742419242859e-05, 7.800757884979248e-05, 8.608773350715637e-05, 9.416788816452026e-05, 0.00010224804282188416, 0.00011032819747924805, 0.00011840835213661194, 0.00012648850679397583, 0.00013456866145133972, 0.0001426488161087036, 0.0001507289707660675, 0.0001588091254234314, 0.0001668892800807953, 0.00017496943473815918, 0.00018304958939552307, 0.00019112974405288696, 0.00019920989871025085, 0.00020729005336761475, 0.00021537020802497864, 0.00022345036268234253, 0.00023153051733970642, 0.0002396106719970703]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 5.0, 4.0, 4.0, 3.0, 16.0, 25.0, 23.0, 41.0, 36.0, 42.0, 79.0, 119.0, 210.0, 291.0, 497.0, 755.0, 1265.0, 2390.0, 4719.0, 9941.0, 24780.0, 83697.0, 757233.0, 109867.0, 29464.0, 11438.0, 5209.0, 2671.0, 1458.0, 815.0, 545.0, 312.0, 198.0, 131.0, 87.0, 59.0, 35.0, 25.0, 21.0, 16.0, 10.0, 11.0, 8.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.2587890625, -0.2510833740234375, -0.243377685546875, -0.2356719970703125, -0.22796630859375, -0.2202606201171875, -0.212554931640625, -0.2048492431640625, -0.1971435546875, -0.1894378662109375, -0.181732177734375, -0.1740264892578125, -0.16632080078125, -0.1586151123046875, -0.150909423828125, -0.1432037353515625, -0.135498046875, -0.1277923583984375, -0.120086669921875, -0.1123809814453125, -0.10467529296875, -0.0969696044921875, -0.089263916015625, -0.0815582275390625, -0.0738525390625, -0.0661468505859375, -0.058441162109375, -0.0507354736328125, -0.04302978515625, -0.0353240966796875, -0.027618408203125, -0.0199127197265625, -0.01220703125, -0.0045013427734375, 0.003204345703125, 0.0109100341796875, 0.01861572265625, 0.0263214111328125, 0.034027099609375, 0.0417327880859375, 0.0494384765625, 0.0571441650390625, 0.064849853515625, 0.0725555419921875, 0.08026123046875, 0.0879669189453125, 0.095672607421875, 0.1033782958984375, 0.111083984375, 0.1187896728515625, 0.126495361328125, 0.1342010498046875, 0.14190673828125, 0.1496124267578125, 0.157318115234375, 0.1650238037109375, 0.1727294921875, 0.1804351806640625, 0.188140869140625, 0.1958465576171875, 0.20355224609375, 0.2112579345703125, 0.218963623046875, 0.2266693115234375, 0.234375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 6.0, 5.0, 6.0, 3.0, 6.0, 6.0, 4.0, 10.0, 10.0, 21.0, 17.0, 40.0, 34.0, 58.0, 67.0, 106.0, 110.0, 109.0, 87.0, 87.0, 52.0, 42.0, 29.0, 18.0, 15.0, 12.0, 7.0, 6.0, 1.0, 7.0, 6.0, 7.0, 6.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5185546875, -0.5045013427734375, -0.490447998046875, -0.4763946533203125, -0.46234130859375, -0.4482879638671875, -0.434234619140625, -0.4201812744140625, -0.4061279296875, -0.3920745849609375, -0.378021240234375, -0.3639678955078125, -0.34991455078125, -0.3358612060546875, -0.321807861328125, -0.3077545166015625, -0.293701171875, -0.2796478271484375, -0.265594482421875, -0.2515411376953125, -0.23748779296875, -0.2234344482421875, -0.209381103515625, -0.1953277587890625, -0.1812744140625, -0.1672210693359375, -0.153167724609375, -0.1391143798828125, -0.12506103515625, -0.1110076904296875, -0.096954345703125, -0.0829010009765625, -0.06884765625, -0.0547943115234375, -0.040740966796875, -0.0266876220703125, -0.01263427734375, 0.0014190673828125, 0.015472412109375, 0.0295257568359375, 0.0435791015625, 0.0576324462890625, 0.071685791015625, 0.0857391357421875, 0.09979248046875, 0.1138458251953125, 0.127899169921875, 0.1419525146484375, 0.156005859375, 0.1700592041015625, 0.184112548828125, 0.1981658935546875, 0.21221923828125, 0.2262725830078125, 0.240325927734375, 0.2543792724609375, 0.2684326171875, 0.2824859619140625, 0.296539306640625, 0.3105926513671875, 0.32464599609375, 0.3386993408203125, 0.352752685546875, 0.3668060302734375, 0.380859375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 5.0, 12.0, 20.0, 60.0, 128.0, 627.0, 98.0, 36.0, 17.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.526641845703125, -32.52521896362305, -31.523794174194336, -30.522369384765625, -29.520946502685547, -28.519521713256836, -27.518096923828125, -26.516674041748047, -25.51525115966797, -24.513826370239258, -23.51240348815918, -22.51097869873047, -21.50955581665039, -20.50813102722168, -19.50670623779297, -18.50528335571289, -17.50385856628418, -16.50243377685547, -15.50101089477539, -14.49958610534668, -13.498163223266602, -12.49673843383789, -11.495314598083496, -10.493890762329102, -9.492466926574707, -8.491043090820312, -7.489619255065918, -6.488194942474365, -5.486771106719971, -4.485347270965576, -3.4839229583740234, -2.482499122619629, -1.4810733795166016, -0.4796494245529175, 0.5217745304107666, 1.5231986045837402, 2.5246224403381348, 3.5260462760925293, 4.527470588684082, 5.528894424438477, 6.530318260192871, 7.531742095947266, 8.53316593170166, 9.534589767456055, 10.536014556884766, 11.537437438964844, 12.538862228393555, 13.54028606414795, 14.541709899902344, 15.543133735656738, 16.544557571411133, 17.545982360839844, 18.547405242919922, 19.548830032348633, 20.550254821777344, 21.551677703857422, 22.5531005859375, 23.55452537536621, 24.55594825744629, 25.557373046875, 26.558795928955078, 27.56022071838379, 28.5616455078125, 29.563068389892578, 30.56449317932129]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 10.0, 4.0, 6.0, 9.0, 12.0, 8.0, 11.0, 22.0, 15.0, 23.0, 25.0, 27.0, 31.0, 27.0, 43.0, 238.0, 230.0, 49.0, 32.0, 24.0, 28.0, 23.0, 17.0, 16.0, 8.0, 15.0, 11.0, 2.0, 4.0, 9.0, 5.0, 4.0, 1.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.442407608032227, -8.129712104797363, -7.8170166015625, -7.504321098327637, -7.191625595092773, -6.87893009185791, -6.566235065460205, -6.253539562225342, -5.9408440589904785, -5.628148555755615, -5.315453052520752, -5.002757549285889, -4.690062522888184, -4.37736701965332, -4.064671516418457, -3.7519760131835938, -3.4392805099487305, -3.126585006713867, -2.813889503479004, -2.5011942386627197, -2.1884987354278564, -1.8758032321929932, -1.5631078481674194, -1.2504124641418457, -0.9377169609069824, -0.6250215172767639, -0.3123260736465454, 0.0003693699836730957, 0.3130648136138916, 0.6257603168487549, 0.9384557008743286, 1.2511510848999023, 1.563847541809082, 1.8765430450439453, 2.1892385482788086, 2.5019338130950928, 2.814629316329956, 3.1273248195648193, 3.4400200843811035, 3.752715587615967, 4.06541109085083, 4.378106594085693, 4.690802097320557, 5.00349760055542, 5.316192626953125, 5.628888130187988, 5.941583633422852, 6.254279136657715, 6.566974639892578, 6.879670143127441, 7.192365646362305, 7.505061149597168, 7.817756652832031, 8.130452156066895, 8.443147659301758, 8.755842208862305, 9.068538665771484, 9.381234169006348, 9.693929672241211, 10.006625175476074, 10.319320678710938, 10.6320161819458, 10.944711685180664, 11.257406234741211, 11.570101737976074]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 6.0, 9.0, 5.0, 6.0, 10.0, 13.0, 11.0, 27.0, 28.0, 46.0, 40.0, 63.0, 126.0, 287.0, 93.0, 57.0, 51.0, 27.0, 30.0, 21.0, 18.0, 6.0, 11.0, 6.0, 5.0, 0.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1708984375, -1.133514404296875, -1.09613037109375, -1.058746337890625, -1.0213623046875, -0.983978271484375, -0.94659423828125, -0.909210205078125, -0.871826171875, -0.834442138671875, -0.79705810546875, -0.759674072265625, -0.7222900390625, -0.684906005859375, -0.64752197265625, -0.610137939453125, -0.57275390625, -0.535369873046875, -0.49798583984375, -0.460601806640625, -0.4232177734375, -0.385833740234375, -0.34844970703125, -0.311065673828125, -0.273681640625, -0.236297607421875, -0.19891357421875, -0.161529541015625, -0.1241455078125, -0.086761474609375, -0.04937744140625, -0.011993408203125, 0.025390625, 0.062774658203125, 0.10015869140625, 0.137542724609375, 0.1749267578125, 0.212310791015625, 0.24969482421875, 0.287078857421875, 0.324462890625, 0.361846923828125, 0.39923095703125, 0.436614990234375, 0.4739990234375, 0.511383056640625, 0.54876708984375, 0.586151123046875, 0.62353515625, 0.660919189453125, 0.69830322265625, 0.735687255859375, 0.7730712890625, 0.810455322265625, 0.84783935546875, 0.885223388671875, 0.922607421875, 0.959991455078125, 0.99737548828125, 1.034759521484375, 1.0721435546875, 1.109527587890625, 1.14691162109375, 1.184295654296875, 1.2216796875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 5.0, 3.0, 5.0, 4.0, 8.0, 11.0, 13.0, 12.0, 28.0, 31.0, 61.0, 102.0, 156.0, 349.0, 989.0, 3840.0, 36363.0, 8334536.0, 9000.0, 1898.0, 605.0, 215.0, 126.0, 84.0, 61.0, 22.0, 15.0, 6.0, 8.0, 4.0, 5.0, 6.0, 2.0, 2.0, 0.0, 1.0, 3.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.785748481750488, -9.500036239624023, -9.214324951171875, -8.92861270904541, -8.642901420593262, -8.357189178466797, -8.071477890014648, -7.785765647888184, -7.500053882598877, -7.21434211730957, -6.928630352020264, -6.642918586730957, -6.357206344604492, -6.071495056152344, -5.785782814025879, -5.500071048736572, -5.214359283447266, -4.928647518157959, -4.642935752868652, -4.357223987579346, -4.071512222290039, -3.7858002185821533, -3.5000882148742676, -3.214376449584961, -2.9286646842956543, -2.6429529190063477, -2.357241153717041, -2.0715291500091553, -1.7858173847198486, -1.500105619430542, -1.2143937349319458, -0.9286818504333496, -0.642970085144043, -0.35725826025009155, -0.07154643535614014, 0.21416538953781128, 0.4998772144317627, 0.7855889797210693, 1.0713008642196655, 1.3570127487182617, 1.6427245140075684, 1.928436279296875, 2.2141480445861816, 2.4998600482940674, 2.785571813583374, 3.0712835788726807, 3.3569955825805664, 3.642707347869873, 3.9284191131591797, 4.214130878448486, 4.499842643737793, 4.7855544090271, 5.071266174316406, 5.356978416442871, 5.642690181732178, 5.928401947021484, 6.214113712310791, 6.499825477600098, 6.785537242889404, 7.071249008178711, 7.356961250305176, 7.642672538757324, 7.928384780883789, 8.214096069335938, 8.499808311462402]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 6.0, 6.0, 2.0, 4.0, 8.0, 8.0, 2.0, 4.0, 4.0, 5.0, 9.0, 5.0, 3.0, 6.0, 2.0, 3.0, 6.0, 2.0, 2.0, 2.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.060517311096191, -8.824185371398926, -8.58785343170166, -8.351521492004395, -8.115188598632812, -7.878857135772705, -7.642524719238281, -7.406192779541016, -7.16986083984375, -6.933528900146484, -6.697196960449219, -6.460864543914795, -6.224532604217529, -5.988200664520264, -5.75186824798584, -5.515536308288574, -5.279204368591309, -5.042872428894043, -4.806540489196777, -4.5702080726623535, -4.333876132965088, -4.097544193267822, -3.8612120151519775, -3.624879837036133, -3.388547897338867, -3.1522159576416016, -2.915883779525757, -2.679551601409912, -2.4432196617126465, -2.206887722015381, -1.9705555438995361, -1.734223484992981, -1.497891902923584, -1.2615598440170288, -1.0252277851104736, -0.7888957262039185, -0.5525636672973633, -0.3162316083908081, -0.07989954948425293, 0.15643250942230225, 0.3927645683288574, 0.6290966272354126, 0.8654286861419678, 1.101760745048523, 1.3380928039550781, 1.5744248628616333, 1.8107569217681885, 2.047089099884033, 2.283421039581299, 2.5197529792785645, 2.756085157394409, 2.992417335510254, 3.2287492752075195, 3.465081214904785, 3.70141339302063, 3.9377455711364746, 4.17407751083374, 4.410409450531006, 4.64674186706543, 4.883073806762695, 5.119405746459961, 5.355737686157227, 5.592069625854492, 5.828402042388916, 6.064733982086182]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 8.0, 11.0, 14.0, 11.0, 21.0, 41.0, 46.0, 64.0, 106.0, 153.0, 289.0, 652.0, 1545.0, 4948.0, 18767.0, 85491.0, 268832.0, 109989.0, 23745.0, 6111.0, 1860.0, 733.0, 352.0, 185.0, 117.0, 68.0, 39.0, 28.0, 15.0, 5.0, 7.0, 4.0, 9.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.0859375, -10.7828369140625, -10.479736328125, -10.1766357421875, -9.87353515625, -9.5704345703125, -9.267333984375, -8.9642333984375, -8.6611328125, -8.3580322265625, -8.054931640625, -7.7518310546875, -7.44873046875, -7.1456298828125, -6.842529296875, -6.5394287109375, -6.236328125, -5.9332275390625, -5.630126953125, -5.3270263671875, -5.02392578125, -4.7208251953125, -4.417724609375, -4.1146240234375, -3.8115234375, -3.5084228515625, -3.205322265625, -2.9022216796875, -2.59912109375, -2.2960205078125, -1.992919921875, -1.6898193359375, -1.38671875, -1.0836181640625, -0.780517578125, -0.4774169921875, -0.17431640625, 0.1287841796875, 0.431884765625, 0.7349853515625, 1.0380859375, 1.3411865234375, 1.644287109375, 1.9473876953125, 2.25048828125, 2.5535888671875, 2.856689453125, 3.1597900390625, 3.462890625, 3.7659912109375, 4.069091796875, 4.3721923828125, 4.67529296875, 4.9783935546875, 5.281494140625, 5.5845947265625, 5.8876953125, 6.1907958984375, 6.493896484375, 6.7969970703125, 7.10009765625, 7.4031982421875, 7.706298828125, 8.0093994140625, 8.3125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 10.0, 5.0, 11.0, 13.0, 24.0, 24.0, 25.0, 32.0, 57.0, 47.0, 69.0, 68.0, 75.0, 80.0, 74.0, 79.0, 67.0, 46.0, 51.0, 31.0, 24.0, 23.0, 21.0, 14.0, 8.0, 8.0, 6.0, 7.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3447265625, -1.3103790283203125, -1.276031494140625, -1.2416839599609375, -1.20733642578125, -1.1729888916015625, -1.138641357421875, -1.1042938232421875, -1.0699462890625, -1.0355987548828125, -1.001251220703125, -0.9669036865234375, -0.93255615234375, -0.8982086181640625, -0.863861083984375, -0.8295135498046875, -0.795166015625, -0.7608184814453125, -0.726470947265625, -0.6921234130859375, -0.65777587890625, -0.6234283447265625, -0.589080810546875, -0.5547332763671875, -0.5203857421875, -0.4860382080078125, -0.451690673828125, -0.4173431396484375, -0.38299560546875, -0.3486480712890625, -0.314300537109375, -0.2799530029296875, -0.24560546875, -0.2112579345703125, -0.176910400390625, -0.1425628662109375, -0.10821533203125, -0.0738677978515625, -0.039520263671875, -0.0051727294921875, 0.0291748046875, 0.0635223388671875, 0.097869873046875, 0.1322174072265625, 0.16656494140625, 0.2009124755859375, 0.235260009765625, 0.2696075439453125, 0.303955078125, 0.3383026123046875, 0.372650146484375, 0.4069976806640625, 0.44134521484375, 0.4756927490234375, 0.510040283203125, 0.5443878173828125, 0.5787353515625, 0.6130828857421875, 0.647430419921875, 0.6817779541015625, 0.71612548828125, 0.7504730224609375, 0.784820556640625, 0.8191680908203125, 0.853515625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 5.0, 2.0, 5.0, 10.0, 11.0, 19.0, 29.0, 55.0, 82.0, 105.0, 71.0, 43.0, 16.0, 11.0, 10.0, 6.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.611623764038086, -11.331544876098633, -11.051466941833496, -10.771388053894043, -10.491310119628906, -10.211231231689453, -9.931153297424316, -9.651074409484863, -9.370996475219727, -9.090917587280273, -8.810839653015137, -8.530760765075684, -8.250682830810547, -7.970603942871094, -7.690525531768799, -7.410447120666504, -7.130368232727051, -6.850289821624756, -6.570211410522461, -6.290132999420166, -6.010054588317871, -5.729975700378418, -5.449897289276123, -5.169818878173828, -4.889740467071533, -4.609662055969238, -4.329583644866943, -4.049505233764648, -3.7694265842437744, -3.4893481731414795, -3.2092695236206055, -2.9291911125183105, -2.649113655090332, -2.369035243988037, -2.088956832885742, -1.8088781833648682, -1.5287997722625732, -1.2487213611602783, -0.9686428308486938, -0.6885643005371094, -0.40848588943481445, -0.12840741872787476, 0.15167105197906494, 0.43174952268600464, 0.7118279933929443, 0.9919064044952393, 1.2719849348068237, 1.5520634651184082, 1.8321418762207031, 2.112220287322998, 2.392298698425293, 2.672377347946167, 2.952455759048462, 3.232534170150757, 3.512612819671631, 3.792691230773926, 4.072769641876221, 4.352848052978516, 4.6329264640808105, 4.9130048751831055, 5.193083763122559, 5.473161697387695, 5.753240585327148, 6.033318996429443, 6.313397407531738]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 5.0, 2.0, 1.0, 3.0, 4.0, 2.0, 6.0, 7.0, 16.0, 13.0, 29.0, 53.0, 92.0, 93.0, 70.0, 34.0, 20.0, 10.0, 10.0, 4.0, 5.0, 2.0, 0.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.147286891937256, -4.965672969818115, -4.784059047698975, -4.602445125579834, -4.420830726623535, -4.2392168045043945, -4.057602882385254, -3.8759889602661133, -3.6943750381469727, -3.512761116027832, -3.3311471939086914, -3.1495330333709717, -2.967919111251831, -2.7863051891326904, -2.6046910285949707, -2.42307710647583, -2.2414631843566895, -2.059849262237549, -1.8782352209091187, -1.6966211795806885, -1.5150072574615479, -1.3333933353424072, -1.151779294013977, -0.9701652526855469, -0.7885513305664062, -0.6069373488426208, -0.42532336711883545, -0.24370938539505005, -0.06209540367126465, 0.11951857805252075, 0.30113255977630615, 0.48274660110473633, 0.6643600463867188, 0.8459740281105042, 1.0275880098342896, 1.2092020511627197, 1.3908159732818604, 1.572429895401001, 1.7540439367294312, 1.9356579780578613, 2.117271900177002, 2.2988858222961426, 2.480499744415283, 2.662113904953003, 2.8437278270721436, 3.025341749191284, 3.206955909729004, 3.3885698318481445, 3.570183753967285, 3.751797676086426, 3.9334115982055664, 4.115025520324707, 4.296639442443848, 4.4782538414001465, 4.659867763519287, 4.841481685638428, 5.023095607757568, 5.204709529876709, 5.38632345199585, 5.56793737411499, 5.749551773071289, 5.93116569519043, 6.11277961730957, 6.294393539428711, 6.476007461547852]}, "eval/loss": 4.166304588317871, "eval/wer": 1.918524395081317, "eval/runtime": 982.6549, "eval/samples_per_second": 2.689, "eval/steps_per_second": 0.337, "train/train_runtime": 8769.6328, "train/train_samples_per_second": 3.254, "train/train_steps_per_second": 0.203, "train/total_flos": 0.0, "train/train_loss": 4.241978131735806} \ No newline at end of file