diff --git "a/wandb/run-20220228_185039-2l3jouo4/files/wandb-summary.json" "b/wandb/run-20220228_185039-2l3jouo4/files/wandb-summary.json" --- "a/wandb/run-20220228_185039-2l3jouo4/files/wandb-summary.json" +++ "b/wandb/run-20220228_185039-2l3jouo4/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 4.4108, "train/learning_rate": 9.940000000000001e-06, "train/epoch": 0.84, "train/global_step": 500, "_runtime": 4822, "_timestamp": 1646079061, "_step": 500, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 27.0, 111.0, 297.0, 320.0, 196.0, 48.0, 9.0, 3.0], "bins": [-212.42514038085938, -208.83255004882812, -205.23995971679688, -201.64736938476562, -198.05477905273438, -194.4622039794922, -190.86961364746094, -187.2770233154297, -183.68443298339844, -180.0918426513672, -176.49925231933594, -172.9066619873047, -169.3140869140625, -165.72149658203125, -162.12890625, -158.53631591796875, -154.9437255859375, -151.35113525390625, -147.758544921875, -144.16595458984375, -140.5733642578125, -136.9807891845703, -133.38819885253906, -129.7956085205078, -126.20301818847656, -122.61042785644531, -119.01783752441406, -115.42525482177734, -111.8326644897461, -108.24007415771484, -104.64749145507812, -101.05490112304688, -97.46231079101562, -93.86972045898438, -90.27713012695312, -86.6845474243164, -83.09195709228516, -79.4993667602539, -75.90678405761719, -72.31419372558594, -68.72160339355469, -65.12901306152344, -61.53642654418945, -57.94384002685547, -54.35124969482422, -50.75865936279297, -47.166072845458984, -43.573486328125, -39.98089599609375, -36.3883056640625, -32.795719146728516, -29.2031307220459, -25.61054229736328, -22.017953872680664, -18.425365447998047, -14.83277702331543, -11.24018669128418, -7.6475982666015625, -4.055009841918945, -0.4624214172363281, 3.130167007446289, 6.722755432128906, 10.315343856811523, 13.90793228149414, 17.500520706176758]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 2.0, 5.0, 8.0, 13.0, 9.0, 13.0, 15.0, 19.0, 15.0, 29.0, 23.0, 39.0, 29.0, 53.0, 52.0, 41.0, 55.0, 63.0, 51.0, 52.0, 61.0, 43.0, 38.0, 43.0, 30.0, 34.0, 28.0, 25.0, 17.0, 16.0, 22.0, 20.0, 10.0, 5.0, 4.0, 10.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-64.8299560546875, -62.763370513916016, -60.69678497314453, -58.63019943237305, -56.56361389160156, -54.49702835083008, -52.430442810058594, -50.363853454589844, -48.297271728515625, -46.23068618774414, -44.164100646972656, -42.09751510620117, -40.03092956542969, -37.9643440246582, -35.89775848388672, -33.83116912841797, -31.764583587646484, -29.697998046875, -27.631412506103516, -25.56482696533203, -23.498241424560547, -21.431655883789062, -19.365068435668945, -17.29848289489746, -15.231897354125977, -13.165311813354492, -11.098726272583008, -9.032139778137207, -6.965554237365723, -4.898968696594238, -2.8323822021484375, -0.7657966613769531, 1.3007888793945312, 3.3673746585845947, 5.433960437774658, 7.500546455383301, 9.567131996154785, 11.63371753692627, 13.70030403137207, 15.766889572143555, 17.83347511291504, 19.900060653686523, 21.966646194458008, 24.033233642578125, 26.09981918334961, 28.166404724121094, 30.232990264892578, 32.29957580566406, 34.36616134643555, 36.43274688720703, 38.499332427978516, 40.56591796875, 42.632503509521484, 44.69908905029297, 46.76567840576172, 48.83226013183594, 50.89884948730469, 52.96543502807617, 55.032020568847656, 57.09860610961914, 59.165191650390625, 61.23177719116211, 63.298362731933594, 65.36495208740234, 67.43153381347656]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 3.0, 4.0, 3.0, 9.0, 8.0, 9.0, 8.0, 8.0, 18.0, 23.0, 15.0, 23.0, 22.0, 43.0, 35.0, 31.0, 39.0, 46.0, 48.0, 53.0, 56.0, 65.0, 44.0, 50.0, 43.0, 32.0, 41.0, 27.0, 38.0, 21.0, 23.0, 15.0, 22.0, 19.0, 15.0, 10.0, 8.0, 6.0, 7.0, 5.0, 3.0, 1.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.41796875, -4.26458740234375, -4.1112060546875, -3.95782470703125, -3.804443359375, -3.65106201171875, -3.4976806640625, -3.34429931640625, -3.19091796875, -3.03753662109375, -2.8841552734375, -2.73077392578125, -2.577392578125, -2.42401123046875, -2.2706298828125, -2.11724853515625, -1.9638671875, -1.81048583984375, -1.6571044921875, -1.50372314453125, -1.350341796875, -1.19696044921875, -1.0435791015625, -0.89019775390625, -0.73681640625, -0.58343505859375, -0.4300537109375, -0.27667236328125, -0.123291015625, 0.03009033203125, 0.1834716796875, 0.33685302734375, 0.490234375, 0.64361572265625, 0.7969970703125, 0.95037841796875, 1.103759765625, 1.25714111328125, 1.4105224609375, 1.56390380859375, 1.71728515625, 1.87066650390625, 2.0240478515625, 2.17742919921875, 2.330810546875, 2.48419189453125, 2.6375732421875, 2.79095458984375, 2.9443359375, 3.09771728515625, 3.2510986328125, 3.40447998046875, 3.557861328125, 3.71124267578125, 3.8646240234375, 4.01800537109375, 4.17138671875, 4.32476806640625, 4.4781494140625, 4.63153076171875, 4.784912109375, 4.93829345703125, 5.0916748046875, 5.24505615234375, 5.3984375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 6.0, 2.0, 7.0, 5.0, 4.0, 17.0, 19.0, 21.0, 23.0, 35.0, 52.0, 62.0, 79.0, 114.0, 126.0, 182.0, 300.0, 427.0, 650.0, 1016.0, 1704.0, 3141.0, 6775.0, 18952.0, 82652.0, 714700.0, 2570509.0, 680126.0, 79884.0, 18459.0, 6399.0, 3143.0, 1602.0, 1012.0, 639.0, 405.0, 261.0, 187.0, 150.0, 100.0, 110.0, 66.0, 49.0, 34.0, 26.0, 15.0, 21.0, 10.0, 2.0, 6.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-12.046875, -11.664306640625, -11.28173828125, -10.899169921875, -10.5166015625, -10.134033203125, -9.75146484375, -9.368896484375, -8.986328125, -8.603759765625, -8.22119140625, -7.838623046875, -7.4560546875, -7.073486328125, -6.69091796875, -6.308349609375, -5.92578125, -5.543212890625, -5.16064453125, -4.778076171875, -4.3955078125, -4.012939453125, -3.63037109375, -3.247802734375, -2.865234375, -2.482666015625, -2.10009765625, -1.717529296875, -1.3349609375, -0.952392578125, -0.56982421875, -0.187255859375, 0.1953125, 0.577880859375, 0.96044921875, 1.343017578125, 1.7255859375, 2.108154296875, 2.49072265625, 2.873291015625, 3.255859375, 3.638427734375, 4.02099609375, 4.403564453125, 4.7861328125, 5.168701171875, 5.55126953125, 5.933837890625, 6.31640625, 6.698974609375, 7.08154296875, 7.464111328125, 7.8466796875, 8.229248046875, 8.61181640625, 8.994384765625, 9.376953125, 9.759521484375, 10.14208984375, 10.524658203125, 10.9072265625, 11.289794921875, 11.67236328125, 12.054931640625, 12.4375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 7.0, 17.0, 10.0, 26.0, 31.0, 45.0, 76.0, 130.0, 194.0, 311.0, 544.0, 758.0, 757.0, 482.0, 277.0, 155.0, 87.0, 57.0, 38.0, 19.0, 21.0, 15.0, 8.0, 8.0, 3.0, 3.0, 4.0, 3.0], "bins": [-35.25, -34.5142822265625, -33.778564453125, -33.0428466796875, -32.30712890625, -31.5714111328125, -30.835693359375, -30.0999755859375, -29.3642578125, -28.6285400390625, -27.892822265625, -27.1571044921875, -26.42138671875, -25.6856689453125, -24.949951171875, -24.2142333984375, -23.478515625, -22.7427978515625, -22.007080078125, -21.2713623046875, -20.53564453125, -19.7999267578125, -19.064208984375, -18.3284912109375, -17.5927734375, -16.8570556640625, -16.121337890625, -15.3856201171875, -14.64990234375, -13.9141845703125, -13.178466796875, -12.4427490234375, -11.70703125, -10.9713134765625, -10.235595703125, -9.4998779296875, -8.76416015625, -8.0284423828125, -7.292724609375, -6.5570068359375, -5.8212890625, -5.0855712890625, -4.349853515625, -3.6141357421875, -2.87841796875, -2.1427001953125, -1.406982421875, -0.6712646484375, 0.064453125, 0.8001708984375, 1.535888671875, 2.2716064453125, 3.00732421875, 3.7430419921875, 4.478759765625, 5.2144775390625, 5.9501953125, 6.6859130859375, 7.421630859375, 8.1573486328125, 8.89306640625, 9.6287841796875, 10.364501953125, 11.1002197265625, 11.8359375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 8.0, 6.0, 16.0, 29.0, 59.0, 96.0, 167.0, 347.0, 729.0, 1995.0, 57056.0, 4121536.0, 9740.0, 1366.0, 546.0, 271.0, 143.0, 82.0, 35.0, 28.0, 19.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-113.625, -110.4990234375, -107.373046875, -104.2470703125, -101.12109375, -97.9951171875, -94.869140625, -91.7431640625, -88.6171875, -85.4912109375, -82.365234375, -79.2392578125, -76.11328125, -72.9873046875, -69.861328125, -66.7353515625, -63.609375, -60.4833984375, -57.357421875, -54.2314453125, -51.10546875, -47.9794921875, -44.853515625, -41.7275390625, -38.6015625, -35.4755859375, -32.349609375, -29.2236328125, -26.09765625, -22.9716796875, -19.845703125, -16.7197265625, -13.59375, -10.4677734375, -7.341796875, -4.2158203125, -1.08984375, 2.0361328125, 5.162109375, 8.2880859375, 11.4140625, 14.5400390625, 17.666015625, 20.7919921875, 23.91796875, 27.0439453125, 30.169921875, 33.2958984375, 36.421875, 39.5478515625, 42.673828125, 45.7998046875, 48.92578125, 52.0517578125, 55.177734375, 58.3037109375, 61.4296875, 64.5556640625, 67.681640625, 70.8076171875, 73.93359375, 77.0595703125, 80.185546875, 83.3115234375, 86.4375]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [10.0, 72.0, 411.0, 437.0, 82.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.2867488861084, -11.723611831665039, -6.160475730895996, -0.5973396301269531, 4.965797424316406, 10.528934478759766, 16.092069625854492, 21.65520668029785, 27.21834373474121, 32.78147888183594, 38.3446159362793, 43.907752990722656, 49.470890045166016, 55.034027099609375, 60.59716033935547, 66.1603012084961, 71.72343444824219, 77.28656768798828, 82.8497085571289, 88.412841796875, 93.97598266601562, 99.53911590576172, 105.10224914550781, 110.66539001464844, 116.22853088378906, 121.79166412353516, 127.35480499267578, 132.91793823242188, 138.4810791015625, 144.04421997070312, 149.6073455810547, 155.1704864501953, 160.73362731933594, 166.29676818847656, 171.85989379882812, 177.42303466796875, 182.98617553710938, 188.54931640625, 194.11244201660156, 199.6755828857422, 205.2387237548828, 210.80186462402344, 216.364990234375, 221.92813110351562, 227.49127197265625, 233.05441284179688, 238.61753845214844, 244.18067932128906, 249.74380493164062, 255.30694580078125, 260.8700866699219, 266.4332275390625, 271.996337890625, 277.5594787597656, 283.12261962890625, 288.6857604980469, 294.2489013671875, 299.8120422363281, 305.37518310546875, 310.9383239746094, 316.5014343261719, 322.0645751953125, 327.6277160644531, 333.19085693359375, 338.7539978027344]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 3.0, 5.0, 7.0, 11.0, 11.0, 10.0, 10.0, 11.0, 10.0, 17.0, 22.0, 22.0, 23.0, 37.0, 37.0, 37.0, 32.0, 45.0, 40.0, 40.0, 49.0, 45.0, 50.0, 36.0, 39.0, 33.0, 46.0, 35.0, 37.0, 30.0, 25.0, 26.0, 22.0, 14.0, 23.0, 13.0, 17.0, 8.0, 4.0, 4.0, 7.0, 5.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-53.744384765625, -52.04072189331055, -50.337059020996094, -48.63339614868164, -46.92973327636719, -45.22606658935547, -43.522403717041016, -41.81874084472656, -40.11507797241211, -38.411415100097656, -36.7077522277832, -35.00408935546875, -33.30042266845703, -31.59676170349121, -29.893096923828125, -28.189434051513672, -26.48577117919922, -24.782108306884766, -23.078445434570312, -21.374780654907227, -19.671117782592773, -17.96745491027832, -16.263790130615234, -14.560127258300781, -12.856464385986328, -11.152801513671875, -9.449137687683105, -7.745474338531494, -6.041810989379883, -4.33814811706543, -2.63448429107666, -0.9308204650878906, 0.7728424072265625, 2.476505756378174, 4.180169105529785, 5.8838324546813965, 7.587495803833008, 9.291158676147461, 10.99482250213623, 12.698486328125, 14.402149200439453, 16.105812072753906, 17.80947494506836, 19.513139724731445, 21.2168025970459, 22.92046546936035, 24.624130249023438, 26.32779312133789, 28.031455993652344, 29.735118865966797, 31.43878173828125, 33.1424446105957, 34.846107482910156, 36.549774169921875, 38.25343704223633, 39.95709991455078, 41.660762786865234, 43.36442565917969, 45.06808853149414, 46.771751403808594, 48.47541809082031, 50.1790771484375, 51.88274383544922, 53.58640670776367, 55.290069580078125]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 2.0, 9.0, 8.0, 9.0, 12.0, 10.0, 19.0, 21.0, 23.0, 30.0, 24.0, 30.0, 45.0, 37.0, 49.0, 69.0, 52.0, 61.0, 44.0, 51.0, 52.0, 48.0, 39.0, 32.0, 40.0, 29.0, 30.0, 28.0, 21.0, 18.0, 15.0, 6.0, 8.0, 12.0, 9.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.28125, -5.093017578125, -4.90478515625, -4.716552734375, -4.5283203125, -4.340087890625, -4.15185546875, -3.963623046875, -3.775390625, -3.587158203125, -3.39892578125, -3.210693359375, -3.0224609375, -2.834228515625, -2.64599609375, -2.457763671875, -2.26953125, -2.081298828125, -1.89306640625, -1.704833984375, -1.5166015625, -1.328369140625, -1.14013671875, -0.951904296875, -0.763671875, -0.575439453125, -0.38720703125, -0.198974609375, -0.0107421875, 0.177490234375, 0.36572265625, 0.553955078125, 0.7421875, 0.930419921875, 1.11865234375, 1.306884765625, 1.4951171875, 1.683349609375, 1.87158203125, 2.059814453125, 2.248046875, 2.436279296875, 2.62451171875, 2.812744140625, 3.0009765625, 3.189208984375, 3.37744140625, 3.565673828125, 3.75390625, 3.942138671875, 4.13037109375, 4.318603515625, 4.5068359375, 4.695068359375, 4.88330078125, 5.071533203125, 5.259765625, 5.447998046875, 5.63623046875, 5.824462890625, 6.0126953125, 6.200927734375, 6.38916015625, 6.577392578125, 6.765625]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 7.0, 15.0, 14.0, 25.0, 35.0, 72.0, 98.0, 135.0, 248.0, 385.0, 639.0, 1028.0, 1801.0, 3118.0, 5346.0, 9367.0, 16470.0, 29983.0, 56010.0, 118732.0, 335691.0, 260666.0, 98912.0, 48813.0, 26418.0, 14706.0, 8275.0, 4763.0, 2734.0, 1586.0, 924.0, 583.0, 349.0, 217.0, 122.0, 87.0, 63.0, 42.0, 23.0, 16.0, 11.0, 9.0, 6.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0], "bins": [-1.5263671875, -1.4838409423828125, -1.441314697265625, -1.3987884521484375, -1.35626220703125, -1.3137359619140625, -1.271209716796875, -1.2286834716796875, -1.1861572265625, -1.1436309814453125, -1.101104736328125, -1.0585784912109375, -1.01605224609375, -0.9735260009765625, -0.930999755859375, -0.8884735107421875, -0.845947265625, -0.8034210205078125, -0.760894775390625, -0.7183685302734375, -0.67584228515625, -0.6333160400390625, -0.590789794921875, -0.5482635498046875, -0.5057373046875, -0.4632110595703125, -0.420684814453125, -0.3781585693359375, -0.33563232421875, -0.2931060791015625, -0.250579833984375, -0.2080535888671875, -0.16552734375, -0.1230010986328125, -0.080474853515625, -0.0379486083984375, 0.00457763671875, 0.0471038818359375, 0.089630126953125, 0.1321563720703125, 0.1746826171875, 0.2172088623046875, 0.259735107421875, 0.3022613525390625, 0.34478759765625, 0.3873138427734375, 0.429840087890625, 0.4723663330078125, 0.514892578125, 0.5574188232421875, 0.599945068359375, 0.6424713134765625, 0.68499755859375, 0.7275238037109375, 0.770050048828125, 0.8125762939453125, 0.8551025390625, 0.8976287841796875, 0.940155029296875, 0.9826812744140625, 1.02520751953125, 1.0677337646484375, 1.110260009765625, 1.1527862548828125, 1.1953125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 2.0, 6.0, 6.0, 7.0, 7.0, 6.0, 10.0, 11.0, 7.0, 10.0, 15.0, 18.0, 22.0, 20.0, 22.0, 29.0, 31.0, 32.0, 32.0, 38.0, 36.0, 34.0, 31.0, 42.0, 1066.0, 32.0, 38.0, 31.0, 24.0, 41.0, 35.0, 34.0, 35.0, 28.0, 31.0, 26.0, 24.0, 12.0, 19.0, 12.0, 17.0, 12.0, 6.0, 7.0, 6.0, 4.0, 6.0, 2.0, 4.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-3.048828125, -2.956817626953125, -2.86480712890625, -2.772796630859375, -2.6807861328125, -2.588775634765625, -2.49676513671875, -2.404754638671875, -2.312744140625, -2.220733642578125, -2.12872314453125, -2.036712646484375, -1.9447021484375, -1.852691650390625, -1.76068115234375, -1.668670654296875, -1.57666015625, -1.484649658203125, -1.39263916015625, -1.300628662109375, -1.2086181640625, -1.116607666015625, -1.02459716796875, -0.932586669921875, -0.840576171875, -0.748565673828125, -0.65655517578125, -0.564544677734375, -0.4725341796875, -0.380523681640625, -0.28851318359375, -0.196502685546875, -0.1044921875, -0.012481689453125, 0.07952880859375, 0.171539306640625, 0.2635498046875, 0.355560302734375, 0.44757080078125, 0.539581298828125, 0.631591796875, 0.723602294921875, 0.81561279296875, 0.907623291015625, 0.9996337890625, 1.091644287109375, 1.18365478515625, 1.275665283203125, 1.36767578125, 1.459686279296875, 1.55169677734375, 1.643707275390625, 1.7357177734375, 1.827728271484375, 1.91973876953125, 2.011749267578125, 2.103759765625, 2.195770263671875, 2.28778076171875, 2.379791259765625, 2.4718017578125, 2.563812255859375, 2.65582275390625, 2.747833251953125, 2.83984375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 5.0, 3.0, 6.0, 3.0, 5.0, 13.0, 26.0, 20.0, 26.0, 42.0, 76.0, 105.0, 140.0, 171.0, 282.0, 368.0, 503.0, 723.0, 1052.0, 1540.0, 2169.0, 2979.0, 4515.0, 6588.0, 9617.0, 14425.0, 22060.0, 34226.0, 54102.0, 87443.0, 159518.0, 1332349.0, 139889.0, 80037.0, 49200.0, 30873.0, 20032.0, 13143.0, 8830.0, 6029.0, 4195.0, 2864.0, 2068.0, 1426.0, 1056.0, 694.0, 510.0, 362.0, 244.0, 173.0, 123.0, 93.0, 66.0, 41.0, 34.0, 23.0, 15.0, 9.0, 7.0, 5.0, 3.0, 4.0, 1.0], "bins": [-0.85693359375, -0.8304901123046875, -0.804046630859375, -0.7776031494140625, -0.75115966796875, -0.7247161865234375, -0.698272705078125, -0.6718292236328125, -0.6453857421875, -0.6189422607421875, -0.592498779296875, -0.5660552978515625, -0.53961181640625, -0.5131683349609375, -0.486724853515625, -0.4602813720703125, -0.433837890625, -0.4073944091796875, -0.380950927734375, -0.3545074462890625, -0.32806396484375, -0.3016204833984375, -0.275177001953125, -0.2487335205078125, -0.2222900390625, -0.1958465576171875, -0.169403076171875, -0.1429595947265625, -0.11651611328125, -0.0900726318359375, -0.063629150390625, -0.0371856689453125, -0.0107421875, 0.0157012939453125, 0.042144775390625, 0.0685882568359375, 0.09503173828125, 0.1214752197265625, 0.147918701171875, 0.1743621826171875, 0.2008056640625, 0.2272491455078125, 0.253692626953125, 0.2801361083984375, 0.30657958984375, 0.3330230712890625, 0.359466552734375, 0.3859100341796875, 0.412353515625, 0.4387969970703125, 0.465240478515625, 0.4916839599609375, 0.51812744140625, 0.5445709228515625, 0.571014404296875, 0.5974578857421875, 0.6239013671875, 0.6503448486328125, 0.676788330078125, 0.7032318115234375, 0.72967529296875, 0.7561187744140625, 0.782562255859375, 0.8090057373046875, 0.83544921875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 6.0, 5.0, 5.0, 4.0, 2.0, 9.0, 10.0, 19.0, 22.0, 20.0, 33.0, 34.0, 39.0, 36.0, 44.0, 46.0, 50.0, 65.0, 69.0, 68.0, 56.0, 56.0, 51.0, 37.0, 31.0, 32.0, 35.0, 13.0, 23.0, 10.0, 16.0, 10.0, 8.0, 11.0, 5.0, 5.0, 8.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.0005397796630859375, -0.0005257166922092438, -0.00051165372133255, -0.0004975907504558563, -0.0004835277795791626, -0.00046946480870246887, -0.00045540183782577515, -0.0004413388669490814, -0.0004272758960723877, -0.00041321292519569397, -0.00039914995431900024, -0.0003850869834423065, -0.0003710240125656128, -0.00035696104168891907, -0.00034289807081222534, -0.0003288350999355316, -0.0003147721290588379, -0.00030070915818214417, -0.00028664618730545044, -0.0002725832164287567, -0.000258520245552063, -0.00024445727467536926, -0.00023039430379867554, -0.0002163313329219818, -0.00020226836204528809, -0.00018820539116859436, -0.00017414242029190063, -0.0001600794494152069, -0.00014601647853851318, -0.00013195350766181946, -0.00011789053678512573, -0.00010382756590843201, -8.976459503173828e-05, -7.570162415504456e-05, -6.163865327835083e-05, -4.7575682401657104e-05, -3.351271152496338e-05, -1.9449740648269653e-05, -5.386769771575928e-06, 8.676201105117798e-06, 2.2739171981811523e-05, 3.680214285850525e-05, 5.0865113735198975e-05, 6.49280846118927e-05, 7.899105548858643e-05, 9.305402636528015e-05, 0.00010711699724197388, 0.0001211799681186676, 0.00013524293899536133, 0.00014930590987205505, 0.00016336888074874878, 0.0001774318516254425, 0.00019149482250213623, 0.00020555779337882996, 0.00021962076425552368, 0.0002336837351322174, 0.00024774670600891113, 0.00026180967688560486, 0.0002758726477622986, 0.0002899356186389923, 0.00030399858951568604, 0.00031806156039237976, 0.0003321245312690735, 0.0003461875021457672, 0.00036025047302246094]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 9.0, 9.0, 14.0, 19.0, 20.0, 21.0, 31.0, 35.0, 49.0, 98.0, 127.0, 194.0, 276.0, 457.0, 729.0, 34886.0, 1009071.0, 950.0, 512.0, 321.0, 215.0, 156.0, 98.0, 71.0, 59.0, 40.0, 28.0, 18.0, 14.0, 9.0, 5.0, 8.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00942230224609375, -0.009061932563781738, -0.008701562881469727, -0.008341193199157715, -0.007980823516845703, -0.007620453834533691, -0.00726008415222168, -0.006899714469909668, -0.006539344787597656, -0.0061789751052856445, -0.005818605422973633, -0.005458235740661621, -0.005097866058349609, -0.004737496376037598, -0.004377126693725586, -0.004016757011413574, -0.0036563873291015625, -0.0032960176467895508, -0.002935647964477539, -0.0025752782821655273, -0.0022149085998535156, -0.001854538917541504, -0.0014941692352294922, -0.0011337995529174805, -0.0007734298706054688, -0.00041306018829345703, -5.269050598144531e-05, 0.0003076791763305664, 0.0006680488586425781, 0.0010284185409545898, 0.0013887882232666016, 0.0017491579055786133, 0.002109527587890625, 0.0024698972702026367, 0.0028302669525146484, 0.00319063663482666, 0.003551006317138672, 0.003911375999450684, 0.004271745681762695, 0.004632115364074707, 0.004992485046386719, 0.0053528547286987305, 0.005713224411010742, 0.006073594093322754, 0.006433963775634766, 0.006794333457946777, 0.007154703140258789, 0.007515072822570801, 0.007875442504882812, 0.008235812187194824, 0.008596181869506836, 0.008956551551818848, 0.00931692123413086, 0.009677290916442871, 0.010037660598754883, 0.010398030281066895, 0.010758399963378906, 0.011118769645690918, 0.01147913932800293, 0.011839509010314941, 0.012199878692626953, 0.012560248374938965, 0.012920618057250977, 0.013280987739562988, 0.013641357421875]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 11.0, 908.0, 97.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002463884884491563, -0.0023885290138423443, -0.0023131731431931257, -0.002237817272543907, -0.0021624614018946886, -0.00208710553124547, -0.002011749893426895, -0.0019363940227776766, -0.001861038152128458, -0.0017856822814792395, -0.001710326410830021, -0.0016349705401808023, -0.0015596147859469056, -0.001484258915297687, -0.0014089030446484685, -0.0013335472904145718, -0.0012581913033500314, -0.0011828354327008128, -0.0011074795620515943, -0.0010321238078176975, -0.000956767937168479, -0.0008814120665192604, -0.0008060561958700418, -0.0007307003834284842, -0.0006553445127792656, -0.0005799886421300471, -0.0005046328296884894, -0.0004292769590392709, -0.0003539211174938828, -0.00027856527594849467, -0.0002032094052992761, -0.00012785359285771847, -5.249772220849991e-05, 2.2858126612845808e-05, 9.821397543419152e-05, 0.00017356983153149486, 0.00024892567307688296, 0.00032428151462227106, 0.0003996373852714896, 0.00047499319771304727, 0.0005503490683622658, 0.0006257049390114844, 0.000701060751453042, 0.0007764166221022606, 0.0008517724927514791, 0.0009271283051930368, 0.0010024842340499163, 0.001077839988283813, 0.0011531958589330316, 0.0012285517295822501, 0.0013039076002314687, 0.0013792633544653654, 0.001454619225114584, 0.0015299750957638025, 0.001605330966413021, 0.0016806868370622396, 0.0017560427077114582, 0.0018313985783606768, 0.0019067544490098953, 0.001982110319659114, 0.0020574661903083324, 0.0021328218281269073, 0.0022081779316067696, 0.0022835335694253445, 0.002358889440074563]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 6.0, 2.0, 6.0, 8.0, 9.0, 9.0, 10.0, 12.0, 15.0, 18.0, 19.0, 21.0, 25.0, 37.0, 17.0, 34.0, 39.0, 34.0, 34.0, 41.0, 38.0, 37.0, 46.0, 42.0, 41.0, 38.0, 42.0, 52.0, 36.0, 32.0, 18.0, 21.0, 32.0, 19.0, 21.0, 15.0, 16.0, 15.0, 15.0, 4.0, 3.0, 9.0, 3.0, 2.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0002180337905883789, -0.0002108132466673851, -0.0002035927027463913, -0.0001963721588253975, -0.0001891516149044037, -0.00018193107098340988, -0.00017471052706241608, -0.00016748998314142227, -0.00016026943922042847, -0.00015304889529943466, -0.00014582835137844086, -0.00013860780745744705, -0.00013138726353645325, -0.00012416671961545944, -0.00011694617569446564, -0.00010972563177347183, -0.00010250508785247803, -9.528454393148422e-05, -8.806400001049042e-05, -8.084345608949661e-05, -7.362291216850281e-05, -6.6402368247509e-05, -5.91818243265152e-05, -5.196128040552139e-05, -4.474073648452759e-05, -3.752019256353378e-05, -3.0299648642539978e-05, -2.3079104721546173e-05, -1.5858560800552368e-05, -8.638016879558563e-06, -1.4174729585647583e-06, 5.803070962429047e-06, 1.3023614883422852e-05, 2.0244158804416656e-05, 2.746470272541046e-05, 3.4685246646404266e-05, 4.190579056739807e-05, 4.9126334488391876e-05, 5.634687840938568e-05, 6.356742233037949e-05, 7.078796625137329e-05, 7.80085101723671e-05, 8.52290540933609e-05, 9.24495980143547e-05, 9.967014193534851e-05, 0.00010689068585634232, 0.00011411122977733612, 0.00012133177369832993, 0.00012855231761932373, 0.00013577286154031754, 0.00014299340546131134, 0.00015021394938230515, 0.00015743449330329895, 0.00016465503722429276, 0.00017187558114528656, 0.00017909612506628036, 0.00018631666898727417, 0.00019353721290826797, 0.00020075775682926178, 0.00020797830075025558, 0.0002151988446712494, 0.0002224193885922432, 0.000229639932513237, 0.0002368604764342308, 0.0002440810203552246]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 2.0, 9.0, 8.0, 9.0, 12.0, 10.0, 19.0, 21.0, 23.0, 30.0, 24.0, 30.0, 45.0, 37.0, 49.0, 69.0, 52.0, 61.0, 44.0, 51.0, 52.0, 48.0, 39.0, 32.0, 40.0, 29.0, 30.0, 28.0, 21.0, 18.0, 15.0, 6.0, 8.0, 12.0, 9.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.28125, -5.093017578125, -4.90478515625, -4.716552734375, -4.5283203125, -4.340087890625, -4.15185546875, -3.963623046875, -3.775390625, -3.587158203125, -3.39892578125, -3.210693359375, -3.0224609375, -2.834228515625, -2.64599609375, -2.457763671875, -2.26953125, -2.081298828125, -1.89306640625, -1.704833984375, -1.5166015625, -1.328369140625, -1.14013671875, -0.951904296875, -0.763671875, -0.575439453125, -0.38720703125, -0.198974609375, -0.0107421875, 0.177490234375, 0.36572265625, 0.553955078125, 0.7421875, 0.930419921875, 1.11865234375, 1.306884765625, 1.4951171875, 1.683349609375, 1.87158203125, 2.059814453125, 2.248046875, 2.436279296875, 2.62451171875, 2.812744140625, 3.0009765625, 3.189208984375, 3.37744140625, 3.565673828125, 3.75390625, 3.942138671875, 4.13037109375, 4.318603515625, 4.5068359375, 4.695068359375, 4.88330078125, 5.071533203125, 5.259765625, 5.447998046875, 5.63623046875, 5.824462890625, 6.0126953125, 6.200927734375, 6.38916015625, 6.577392578125, 6.765625]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 8.0, 7.0, 8.0, 9.0, 14.0, 18.0, 20.0, 34.0, 37.0, 58.0, 86.0, 108.0, 121.0, 159.0, 260.0, 308.0, 481.0, 630.0, 823.0, 1202.0, 1625.0, 2544.0, 4060.0, 7140.0, 15846.0, 95107.0, 843580.0, 44974.0, 12090.0, 5992.0, 3393.0, 2329.0, 1490.0, 1085.0, 752.0, 572.0, 411.0, 278.0, 221.0, 183.0, 115.0, 103.0, 79.0, 49.0, 39.0, 27.0, 23.0, 16.0, 12.0, 7.0, 7.0, 8.0, 3.0, 3.0, 4.0, 3.0, 1.0, 2.0], "bins": [-31.921875, -30.935302734375, -29.94873046875, -28.962158203125, -27.9755859375, -26.989013671875, -26.00244140625, -25.015869140625, -24.029296875, -23.042724609375, -22.05615234375, -21.069580078125, -20.0830078125, -19.096435546875, -18.10986328125, -17.123291015625, -16.13671875, -15.150146484375, -14.16357421875, -13.177001953125, -12.1904296875, -11.203857421875, -10.21728515625, -9.230712890625, -8.244140625, -7.257568359375, -6.27099609375, -5.284423828125, -4.2978515625, -3.311279296875, -2.32470703125, -1.338134765625, -0.3515625, 0.635009765625, 1.62158203125, 2.608154296875, 3.5947265625, 4.581298828125, 5.56787109375, 6.554443359375, 7.541015625, 8.527587890625, 9.51416015625, 10.500732421875, 11.4873046875, 12.473876953125, 13.46044921875, 14.447021484375, 15.43359375, 16.420166015625, 17.40673828125, 18.393310546875, 19.3798828125, 20.366455078125, 21.35302734375, 22.339599609375, 23.326171875, 24.312744140625, 25.29931640625, 26.285888671875, 27.2724609375, 28.259033203125, 29.24560546875, 30.232177734375, 31.21875]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 7.0, 9.0, 12.0, 8.0, 9.0, 24.0, 22.0, 25.0, 29.0, 32.0, 38.0, 34.0, 34.0, 47.0, 42.0, 57.0, 148.0, 1722.0, 291.0, 61.0, 51.0, 43.0, 43.0, 37.0, 43.0, 27.0, 22.0, 26.0, 21.0, 18.0, 18.0, 9.0, 16.0, 9.0, 3.0, 3.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.484375, -16.94873046875, -16.4130859375, -15.87744140625, -15.341796875, -14.80615234375, -14.2705078125, -13.73486328125, -13.19921875, -12.66357421875, -12.1279296875, -11.59228515625, -11.056640625, -10.52099609375, -9.9853515625, -9.44970703125, -8.9140625, -8.37841796875, -7.8427734375, -7.30712890625, -6.771484375, -6.23583984375, -5.7001953125, -5.16455078125, -4.62890625, -4.09326171875, -3.5576171875, -3.02197265625, -2.486328125, -1.95068359375, -1.4150390625, -0.87939453125, -0.34375, 0.19189453125, 0.7275390625, 1.26318359375, 1.798828125, 2.33447265625, 2.8701171875, 3.40576171875, 3.94140625, 4.47705078125, 5.0126953125, 5.54833984375, 6.083984375, 6.61962890625, 7.1552734375, 7.69091796875, 8.2265625, 8.76220703125, 9.2978515625, 9.83349609375, 10.369140625, 10.90478515625, 11.4404296875, 11.97607421875, 12.51171875, 13.04736328125, 13.5830078125, 14.11865234375, 14.654296875, 15.18994140625, 15.7255859375, 16.26123046875, 16.796875]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 7.0, 12.0, 14.0, 10.0, 11.0, 22.0, 28.0, 20.0, 33.0, 35.0, 42.0, 49.0, 75.0, 137.0, 415.0, 3136.0, 3134882.0, 5699.0, 545.0, 138.0, 92.0, 43.0, 40.0, 41.0, 35.0, 20.0, 24.0, 25.0, 17.0, 12.0, 10.0, 9.0, 11.0, 5.0, 7.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.4375, -75.9521484375, -73.466796875, -70.9814453125, -68.49609375, -66.0107421875, -63.525390625, -61.0400390625, -58.5546875, -56.0693359375, -53.583984375, -51.0986328125, -48.61328125, -46.1279296875, -43.642578125, -41.1572265625, -38.671875, -36.1865234375, -33.701171875, -31.2158203125, -28.73046875, -26.2451171875, -23.759765625, -21.2744140625, -18.7890625, -16.3037109375, -13.818359375, -11.3330078125, -8.84765625, -6.3623046875, -3.876953125, -1.3916015625, 1.09375, 3.5791015625, 6.064453125, 8.5498046875, 11.03515625, 13.5205078125, 16.005859375, 18.4912109375, 20.9765625, 23.4619140625, 25.947265625, 28.4326171875, 30.91796875, 33.4033203125, 35.888671875, 38.3740234375, 40.859375, 43.3447265625, 45.830078125, 48.3154296875, 50.80078125, 53.2861328125, 55.771484375, 58.2568359375, 60.7421875, 63.2275390625, 65.712890625, 68.1982421875, 70.68359375, 73.1689453125, 75.654296875, 78.1396484375, 80.625]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 366.0, 642.0, 8.0, 0.0, 3.0, 0.0, 1.0], "bins": [-234.38319396972656, -230.3497772216797, -226.3163604736328, -222.282958984375, -218.24954223632812, -214.21612548828125, -210.18270874023438, -206.1492919921875, -202.11587524414062, -198.08245849609375, -194.04904174804688, -190.015625, -185.9822235107422, -181.9488067626953, -177.91539001464844, -173.88197326660156, -169.84857177734375, -165.81515502929688, -161.78173828125, -157.74832153320312, -153.7149200439453, -149.68150329589844, -145.64808654785156, -141.6146697998047, -137.5812530517578, -133.54783630371094, -129.51441955566406, -125.48101043701172, -121.44759368896484, -117.4141845703125, -113.38076782226562, -109.34735107421875, -105.31393432617188, -101.280517578125, -97.24710845947266, -93.21369171142578, -89.1802749633789, -85.14686584472656, -81.11344909667969, -77.08003234863281, -73.04662322998047, -69.0132064819336, -64.97979736328125, -60.946380615234375, -56.9129638671875, -52.87955093383789, -48.84613800048828, -44.812721252441406, -40.77930450439453, -36.74589157104492, -32.71247482299805, -28.679061889648438, -24.645647048950195, -20.612232208251953, -16.578819274902344, -12.545404434204102, -8.511991500854492, -4.478577136993408, -0.4451627731323242, 3.5882511138916016, 7.621665954589844, 11.655080795288086, 15.688493728637695, 19.721908569335938, 23.75532341003418]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 5.0, 4.0, 4.0, 2.0, 5.0, 9.0, 14.0, 3.0, 10.0, 24.0, 8.0, 14.0, 25.0, 42.0, 28.0, 34.0, 25.0, 25.0, 43.0, 46.0, 43.0, 38.0, 41.0, 44.0, 48.0, 54.0, 35.0, 28.0, 36.0, 40.0, 32.0, 26.0, 29.0, 22.0, 21.0, 19.0, 14.0, 13.0, 8.0, 13.0, 9.0, 12.0, 3.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.21943283081055, -46.74687957763672, -45.27432632446289, -43.80177307128906, -42.32921600341797, -40.85666275024414, -39.38410949707031, -37.911556243896484, -36.439002990722656, -34.96644973754883, -33.493896484375, -32.021339416503906, -30.548786163330078, -29.07623291015625, -27.603679656982422, -26.131126403808594, -24.6585693359375, -23.186016082763672, -21.71346092224121, -20.240907669067383, -18.768352508544922, -17.295799255371094, -15.823246002197266, -14.350691795349121, -12.878137588500977, -11.405583381652832, -9.933029174804688, -8.46047592163086, -6.987921714782715, -5.51536750793457, -4.042814254760742, -2.5702600479125977, -1.0977020263671875, 0.37485194206237793, 1.8474059104919434, 3.3199596405029297, 4.792513847351074, 6.265068054199219, 7.737621307373047, 9.210175514221191, 10.682729721069336, 12.15528392791748, 13.627838134765625, 15.100391387939453, 16.57294464111328, 18.045499801635742, 19.51805305480957, 20.99060821533203, 22.46316146850586, 23.935714721679688, 25.40826988220215, 26.880823135375977, 28.353378295898438, 29.825931549072266, 31.298484802246094, 32.77103805541992, 34.24359130859375, 35.71614456176758, 37.188697814941406, 38.6612548828125, 40.13380813598633, 41.606361389160156, 43.078914642333984, 44.55146789550781, 46.024024963378906]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 2.0, 7.0, 5.0, 13.0, 12.0, 8.0, 9.0, 20.0, 19.0, 25.0, 29.0, 21.0, 36.0, 38.0, 41.0, 52.0, 59.0, 52.0, 53.0, 56.0, 48.0, 56.0, 43.0, 42.0, 29.0, 34.0, 34.0, 29.0, 29.0, 18.0, 19.0, 16.0, 9.0, 9.0, 16.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4375, -5.24395751953125, -5.0504150390625, -4.85687255859375, -4.663330078125, -4.46978759765625, -4.2762451171875, -4.08270263671875, -3.88916015625, -3.69561767578125, -3.5020751953125, -3.30853271484375, -3.114990234375, -2.92144775390625, -2.7279052734375, -2.53436279296875, -2.3408203125, -2.14727783203125, -1.9537353515625, -1.76019287109375, -1.566650390625, -1.37310791015625, -1.1795654296875, -0.98602294921875, -0.79248046875, -0.59893798828125, -0.4053955078125, -0.21185302734375, -0.018310546875, 0.17523193359375, 0.3687744140625, 0.56231689453125, 0.755859375, 0.94940185546875, 1.1429443359375, 1.33648681640625, 1.530029296875, 1.72357177734375, 1.9171142578125, 2.11065673828125, 2.30419921875, 2.49774169921875, 2.6912841796875, 2.88482666015625, 3.078369140625, 3.27191162109375, 3.4654541015625, 3.65899658203125, 3.8525390625, 4.04608154296875, 4.2396240234375, 4.43316650390625, 4.626708984375, 4.82025146484375, 5.0137939453125, 5.20733642578125, 5.40087890625, 5.59442138671875, 5.7879638671875, 5.98150634765625, 6.175048828125, 6.36859130859375, 6.5621337890625, 6.75567626953125, 6.94921875]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [5.0, 0.0, 1.0, 4.0, 1.0, 4.0, 4.0, 2.0, 5.0, 7.0, 3.0, 6.0, 12.0, 19.0, 21.0, 32.0, 37.0, 62.0, 87.0, 127.0, 202.0, 344.0, 542.0, 982.0, 1807.0, 3503.0, 7304.0, 18656.0, 70613.0, 1901012.0, 2082077.0, 72367.0, 18847.0, 7723.0, 3632.0, 1776.0, 969.0, 519.0, 335.0, 209.0, 122.0, 84.0, 65.0, 38.0, 27.0, 29.0, 18.0, 19.0, 13.0, 6.0, 2.0, 5.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-28.421875, -27.474853515625, -26.52783203125, -25.580810546875, -24.6337890625, -23.686767578125, -22.73974609375, -21.792724609375, -20.845703125, -19.898681640625, -18.95166015625, -18.004638671875, -17.0576171875, -16.110595703125, -15.16357421875, -14.216552734375, -13.26953125, -12.322509765625, -11.37548828125, -10.428466796875, -9.4814453125, -8.534423828125, -7.58740234375, -6.640380859375, -5.693359375, -4.746337890625, -3.79931640625, -2.852294921875, -1.9052734375, -0.958251953125, -0.01123046875, 0.935791015625, 1.8828125, 2.829833984375, 3.77685546875, 4.723876953125, 5.6708984375, 6.617919921875, 7.56494140625, 8.511962890625, 9.458984375, 10.406005859375, 11.35302734375, 12.300048828125, 13.2470703125, 14.194091796875, 15.14111328125, 16.088134765625, 17.03515625, 17.982177734375, 18.92919921875, 19.876220703125, 20.8232421875, 21.770263671875, 22.71728515625, 23.664306640625, 24.611328125, 25.558349609375, 26.50537109375, 27.452392578125, 28.3994140625, 29.346435546875, 30.29345703125, 31.240478515625, 32.1875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 6.0, 7.0, 4.0, 15.0, 13.0, 28.0, 55.0, 80.0, 80.0, 128.0, 191.0, 322.0, 536.0, 725.0, 706.0, 439.0, 246.0, 171.0, 107.0, 60.0, 45.0, 29.0, 23.0, 21.0, 15.0, 7.0, 4.0, 5.0, 3.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0], "bins": [-41.75, -40.77392578125, -39.7978515625, -38.82177734375, -37.845703125, -36.86962890625, -35.8935546875, -34.91748046875, -33.94140625, -32.96533203125, -31.9892578125, -31.01318359375, -30.037109375, -29.06103515625, -28.0849609375, -27.10888671875, -26.1328125, -25.15673828125, -24.1806640625, -23.20458984375, -22.228515625, -21.25244140625, -20.2763671875, -19.30029296875, -18.32421875, -17.34814453125, -16.3720703125, -15.39599609375, -14.419921875, -13.44384765625, -12.4677734375, -11.49169921875, -10.515625, -9.53955078125, -8.5634765625, -7.58740234375, -6.611328125, -5.63525390625, -4.6591796875, -3.68310546875, -2.70703125, -1.73095703125, -0.7548828125, 0.22119140625, 1.197265625, 2.17333984375, 3.1494140625, 4.12548828125, 5.1015625, 6.07763671875, 7.0537109375, 8.02978515625, 9.005859375, 9.98193359375, 10.9580078125, 11.93408203125, 12.91015625, 13.88623046875, 14.8623046875, 15.83837890625, 16.814453125, 17.79052734375, 18.7666015625, 19.74267578125, 20.71875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 3.0, 2.0, 6.0, 4.0, 2.0, 14.0, 14.0, 19.0, 24.0, 42.0, 51.0, 90.0, 124.0, 219.0, 437.0, 1867.0, 3995783.0, 193707.0, 927.0, 367.0, 217.0, 120.0, 82.0, 56.0, 36.0, 25.0, 20.0, 11.0, 6.0, 6.0, 6.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.6875, -88.9677734375, -84.248046875, -79.5283203125, -74.80859375, -70.0888671875, -65.369140625, -60.6494140625, -55.9296875, -51.2099609375, -46.490234375, -41.7705078125, -37.05078125, -32.3310546875, -27.611328125, -22.8916015625, -18.171875, -13.4521484375, -8.732421875, -4.0126953125, 0.70703125, 5.4267578125, 10.146484375, 14.8662109375, 19.5859375, 24.3056640625, 29.025390625, 33.7451171875, 38.46484375, 43.1845703125, 47.904296875, 52.6240234375, 57.34375, 62.0634765625, 66.783203125, 71.5029296875, 76.22265625, 80.9423828125, 85.662109375, 90.3818359375, 95.1015625, 99.8212890625, 104.541015625, 109.2607421875, 113.98046875, 118.7001953125, 123.419921875, 128.1396484375, 132.859375, 137.5791015625, 142.298828125, 147.0185546875, 151.73828125, 156.4580078125, 161.177734375, 165.8974609375, 170.6171875, 175.3369140625, 180.056640625, 184.7763671875, 189.49609375, 194.2158203125, 198.935546875, 203.6552734375, 208.375]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 14.0, 39.0, 98.0, 231.0, 279.0, 207.0, 100.0, 28.0, 16.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-151.9634246826172, -148.54812622070312, -145.13282775878906, -141.717529296875, -138.30221557617188, -134.8869171142578, -131.47161865234375, -128.0563201904297, -124.64102172851562, -121.22572326660156, -117.8104248046875, -114.3951187133789, -110.97982025146484, -107.56452178955078, -104.14921569824219, -100.73391723632812, -97.31861877441406, -93.9033203125, -90.48802185058594, -87.07271575927734, -83.65741729736328, -80.24211883544922, -76.82681274414062, -73.41151428222656, -69.9962158203125, -66.58091735839844, -63.16561508178711, -59.75031280517578, -56.33501434326172, -52.919715881347656, -49.50441360473633, -46.089111328125, -42.673805236816406, -39.258506774902344, -35.843204498291016, -32.42790222167969, -29.012603759765625, -25.59730339050293, -22.182003021240234, -18.76670265197754, -15.351402282714844, -11.936101913452148, -8.520801544189453, -5.105501174926758, -1.6902008056640625, 1.7250995635986328, 5.140399932861328, 8.555700302124023, 11.971000671386719, 15.386301040649414, 18.80160140991211, 22.216901779174805, 25.6322021484375, 29.047502517700195, 32.46280288696289, 35.87810516357422, 39.29340362548828, 42.708702087402344, 46.12400436401367, 49.539306640625, 52.95460510253906, 56.369903564453125, 59.78520584106445, 63.20050811767578, 66.61580657958984]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 0.0, 2.0, 5.0, 10.0, 11.0, 12.0, 16.0, 11.0, 17.0, 20.0, 22.0, 26.0, 29.0, 23.0, 38.0, 33.0, 54.0, 41.0, 25.0, 35.0, 40.0, 46.0, 34.0, 37.0, 39.0, 48.0, 37.0, 35.0, 26.0, 35.0, 41.0, 17.0, 23.0, 22.0, 14.0, 13.0, 14.0, 8.0, 11.0, 13.0, 1.0, 6.0, 4.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-75.00352478027344, -72.58134460449219, -70.1591567993164, -67.73697662353516, -65.31478881835938, -62.892608642578125, -60.47042465209961, -58.048240661621094, -55.626060485839844, -53.20387649536133, -50.78169250488281, -48.35951232910156, -45.93732833862305, -43.51514434814453, -41.092960357666016, -38.6707763671875, -36.248592376708984, -33.82640838623047, -31.404226303100586, -28.98204231262207, -26.559860229492188, -24.137676239013672, -21.715492248535156, -19.293310165405273, -16.871126174926758, -14.448943138122559, -12.02676010131836, -9.604576110839844, -7.1823930740356445, -4.760210037231445, -2.3380260467529297, 0.08415603637695312, 2.5063400268554688, 4.928523063659668, 7.350706577301025, 9.772890090942383, 12.195073127746582, 14.617256164550781, 17.039440155029297, 19.46162223815918, 21.883806228637695, 24.30599021911621, 26.728172302246094, 29.15035629272461, 31.572540283203125, 33.994720458984375, 36.416908264160156, 38.839088439941406, 41.26127243041992, 43.68345642089844, 46.10564041137695, 48.52782440185547, 50.95000457763672, 53.372188568115234, 55.79437255859375, 58.216552734375, 60.63874053955078, 63.0609245300293, 65.48310852050781, 67.90528869628906, 70.32747650146484, 72.7496566772461, 75.17184448242188, 77.59402465820312, 80.01620483398438]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 2.0, 5.0, 3.0, 7.0, 6.0, 19.0, 22.0, 11.0, 20.0, 24.0, 30.0, 44.0, 32.0, 43.0, 47.0, 53.0, 55.0, 55.0, 49.0, 52.0, 48.0, 43.0, 48.0, 49.0, 42.0, 33.0, 30.0, 30.0, 19.0, 21.0, 13.0, 10.0, 8.0, 10.0, 9.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.32421875, -5.116455078125, -4.90869140625, -4.700927734375, -4.4931640625, -4.285400390625, -4.07763671875, -3.869873046875, -3.662109375, -3.454345703125, -3.24658203125, -3.038818359375, -2.8310546875, -2.623291015625, -2.41552734375, -2.207763671875, -2.0, -1.792236328125, -1.58447265625, -1.376708984375, -1.1689453125, -0.961181640625, -0.75341796875, -0.545654296875, -0.337890625, -0.130126953125, 0.07763671875, 0.285400390625, 0.4931640625, 0.700927734375, 0.90869140625, 1.116455078125, 1.32421875, 1.531982421875, 1.73974609375, 1.947509765625, 2.1552734375, 2.363037109375, 2.57080078125, 2.778564453125, 2.986328125, 3.194091796875, 3.40185546875, 3.609619140625, 3.8173828125, 4.025146484375, 4.23291015625, 4.440673828125, 4.6484375, 4.856201171875, 5.06396484375, 5.271728515625, 5.4794921875, 5.687255859375, 5.89501953125, 6.102783203125, 6.310546875, 6.518310546875, 6.72607421875, 6.933837890625, 7.1416015625, 7.349365234375, 7.55712890625, 7.764892578125, 7.97265625]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 4.0, 7.0, 7.0, 18.0, 31.0, 36.0, 48.0, 76.0, 143.0, 242.0, 391.0, 629.0, 1219.0, 2020.0, 3859.0, 6958.0, 13468.0, 26319.0, 54455.0, 121746.0, 363655.0, 264614.0, 97236.0, 44825.0, 22020.0, 11161.0, 5991.0, 3178.0, 1741.0, 1018.0, 601.0, 307.0, 186.0, 115.0, 92.0, 48.0, 27.0, 22.0, 15.0, 18.0, 4.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.484375, -1.4346771240234375, -1.384979248046875, -1.3352813720703125, -1.28558349609375, -1.2358856201171875, -1.186187744140625, -1.1364898681640625, -1.0867919921875, -1.0370941162109375, -0.987396240234375, -0.9376983642578125, -0.88800048828125, -0.8383026123046875, -0.788604736328125, -0.7389068603515625, -0.689208984375, -0.6395111083984375, -0.589813232421875, -0.5401153564453125, -0.49041748046875, -0.4407196044921875, -0.391021728515625, -0.3413238525390625, -0.2916259765625, -0.2419281005859375, -0.192230224609375, -0.1425323486328125, -0.09283447265625, -0.0431365966796875, 0.006561279296875, 0.0562591552734375, 0.10595703125, 0.1556549072265625, 0.205352783203125, 0.2550506591796875, 0.30474853515625, 0.3544464111328125, 0.404144287109375, 0.4538421630859375, 0.5035400390625, 0.5532379150390625, 0.602935791015625, 0.6526336669921875, 0.70233154296875, 0.7520294189453125, 0.801727294921875, 0.8514251708984375, 0.901123046875, 0.9508209228515625, 1.000518798828125, 1.0502166748046875, 1.09991455078125, 1.1496124267578125, 1.199310302734375, 1.2490081787109375, 1.2987060546875, 1.3484039306640625, 1.398101806640625, 1.4477996826171875, 1.49749755859375, 1.5471954345703125, 1.596893310546875, 1.6465911865234375, 1.6962890625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 4.0, 0.0, 8.0, 4.0, 7.0, 15.0, 14.0, 15.0, 12.0, 18.0, 20.0, 29.0, 19.0, 34.0, 27.0, 31.0, 41.0, 33.0, 35.0, 35.0, 34.0, 45.0, 1064.0, 47.0, 32.0, 37.0, 38.0, 24.0, 44.0, 40.0, 22.0, 28.0, 30.0, 25.0, 26.0, 19.0, 9.0, 16.0, 13.0, 12.0, 8.0, 6.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-3.36328125, -3.259246826171875, -3.15521240234375, -3.051177978515625, -2.9471435546875, -2.843109130859375, -2.73907470703125, -2.635040283203125, -2.531005859375, -2.426971435546875, -2.32293701171875, -2.218902587890625, -2.1148681640625, -2.010833740234375, -1.90679931640625, -1.802764892578125, -1.69873046875, -1.594696044921875, -1.49066162109375, -1.386627197265625, -1.2825927734375, -1.178558349609375, -1.07452392578125, -0.970489501953125, -0.866455078125, -0.762420654296875, -0.65838623046875, -0.554351806640625, -0.4503173828125, -0.346282958984375, -0.24224853515625, -0.138214111328125, -0.0341796875, 0.069854736328125, 0.17388916015625, 0.277923583984375, 0.3819580078125, 0.485992431640625, 0.59002685546875, 0.694061279296875, 0.798095703125, 0.902130126953125, 1.00616455078125, 1.110198974609375, 1.2142333984375, 1.318267822265625, 1.42230224609375, 1.526336669921875, 1.63037109375, 1.734405517578125, 1.83843994140625, 1.942474365234375, 2.0465087890625, 2.150543212890625, 2.25457763671875, 2.358612060546875, 2.462646484375, 2.566680908203125, 2.67071533203125, 2.774749755859375, 2.8787841796875, 2.982818603515625, 3.08685302734375, 3.190887451171875, 3.294921875]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 5.0, 4.0, 3.0, 4.0, 5.0, 11.0, 22.0, 23.0, 37.0, 42.0, 58.0, 85.0, 122.0, 149.0, 250.0, 359.0, 421.0, 693.0, 1007.0, 1478.0, 2151.0, 3320.0, 4927.0, 7381.0, 11329.0, 17300.0, 27011.0, 43338.0, 69572.0, 118030.0, 1311003.0, 206918.0, 101485.0, 60741.0, 37924.0, 23883.0, 15397.0, 9995.0, 6757.0, 4448.0, 3050.0, 2009.0, 1422.0, 898.0, 585.0, 450.0, 325.0, 244.0, 147.0, 83.0, 75.0, 53.0, 34.0, 19.0, 18.0, 14.0, 13.0, 6.0, 0.0, 3.0, 4.0, 7.0, 1.0], "bins": [-0.9306640625, -0.901458740234375, -0.87225341796875, -0.843048095703125, -0.8138427734375, -0.784637451171875, -0.75543212890625, -0.726226806640625, -0.697021484375, -0.667816162109375, -0.63861083984375, -0.609405517578125, -0.5802001953125, -0.550994873046875, -0.52178955078125, -0.492584228515625, -0.46337890625, -0.434173583984375, -0.40496826171875, -0.375762939453125, -0.3465576171875, -0.317352294921875, -0.28814697265625, -0.258941650390625, -0.229736328125, -0.200531005859375, -0.17132568359375, -0.142120361328125, -0.1129150390625, -0.083709716796875, -0.05450439453125, -0.025299072265625, 0.00390625, 0.033111572265625, 0.06231689453125, 0.091522216796875, 0.1207275390625, 0.149932861328125, 0.17913818359375, 0.208343505859375, 0.237548828125, 0.266754150390625, 0.29595947265625, 0.325164794921875, 0.3543701171875, 0.383575439453125, 0.41278076171875, 0.441986083984375, 0.47119140625, 0.500396728515625, 0.52960205078125, 0.558807373046875, 0.5880126953125, 0.617218017578125, 0.64642333984375, 0.675628662109375, 0.704833984375, 0.734039306640625, 0.76324462890625, 0.792449951171875, 0.8216552734375, 0.850860595703125, 0.88006591796875, 0.909271240234375, 0.9384765625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 6.0, 6.0, 2.0, 4.0, 8.0, 5.0, 12.0, 12.0, 12.0, 21.0, 40.0, 43.0, 65.0, 68.0, 84.0, 110.0, 99.0, 88.0, 76.0, 62.0, 52.0, 28.0, 19.0, 13.0, 13.0, 6.0, 11.0, 10.0, 4.0, 4.0, 6.0, 5.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0007228851318359375, -0.0007003545761108398, -0.0006778240203857422, -0.0006552934646606445, -0.0006327629089355469, -0.0006102323532104492, -0.0005877017974853516, -0.0005651712417602539, -0.0005426406860351562, -0.0005201101303100586, -0.0004975795745849609, -0.0004750490188598633, -0.0004525184631347656, -0.00042998790740966797, -0.0004074573516845703, -0.00038492679595947266, -0.000362396240234375, -0.00033986568450927734, -0.0003173351287841797, -0.00029480457305908203, -0.0002722740173339844, -0.0002497434616088867, -0.00022721290588378906, -0.0002046823501586914, -0.00018215179443359375, -0.0001596212387084961, -0.00013709068298339844, -0.00011456012725830078, -9.202957153320312e-05, -6.949901580810547e-05, -4.696846008300781e-05, -2.4437904357910156e-05, -1.9073486328125e-06, 2.0623207092285156e-05, 4.315376281738281e-05, 6.568431854248047e-05, 8.821487426757812e-05, 0.00011074542999267578, 0.00013327598571777344, 0.0001558065414428711, 0.00017833709716796875, 0.0002008676528930664, 0.00022339820861816406, 0.0002459287643432617, 0.0002684593200683594, 0.00029098987579345703, 0.0003135204315185547, 0.00033605098724365234, 0.00035858154296875, 0.00038111209869384766, 0.0004036426544189453, 0.00042617321014404297, 0.0004487037658691406, 0.0004712343215942383, 0.0004937648773193359, 0.0005162954330444336, 0.0005388259887695312, 0.0005613565444946289, 0.0005838871002197266, 0.0006064176559448242, 0.0006289482116699219, 0.0006514787673950195, 0.0006740093231201172, 0.0006965398788452148, 0.0007190704345703125]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 5.0, 7.0, 6.0, 8.0, 14.0, 20.0, 19.0, 26.0, 36.0, 62.0, 117.0, 154.0, 292.0, 668.0, 102853.0, 942588.0, 794.0, 343.0, 169.0, 114.0, 65.0, 51.0, 37.0, 21.0, 14.0, 14.0, 11.0, 5.0, 5.0, 10.0, 3.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01557159423828125, -0.015070557594299316, -0.014569520950317383, -0.01406848430633545, -0.013567447662353516, -0.013066411018371582, -0.012565374374389648, -0.012064337730407715, -0.011563301086425781, -0.011062264442443848, -0.010561227798461914, -0.01006019115447998, -0.009559154510498047, -0.009058117866516113, -0.00855708122253418, -0.008056044578552246, -0.0075550079345703125, -0.007053971290588379, -0.006552934646606445, -0.006051898002624512, -0.005550861358642578, -0.0050498247146606445, -0.004548788070678711, -0.004047751426696777, -0.0035467147827148438, -0.00304567813873291, -0.0025446414947509766, -0.002043604850769043, -0.0015425682067871094, -0.0010415315628051758, -0.0005404949188232422, -3.9458274841308594e-05, 0.000461578369140625, 0.0009626150131225586, 0.0014636516571044922, 0.0019646883010864258, 0.0024657249450683594, 0.002966761589050293, 0.0034677982330322266, 0.00396883487701416, 0.004469871520996094, 0.004970908164978027, 0.005471944808959961, 0.0059729814529418945, 0.006474018096923828, 0.006975054740905762, 0.007476091384887695, 0.007977128028869629, 0.008478164672851562, 0.008979201316833496, 0.00948023796081543, 0.009981274604797363, 0.010482311248779297, 0.01098334789276123, 0.011484384536743164, 0.011985421180725098, 0.012486457824707031, 0.012987494468688965, 0.013488531112670898, 0.013989567756652832, 0.014490604400634766, 0.0149916410446167, 0.015492677688598633, 0.015993714332580566, 0.0164947509765625]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 39.0, 498.0, 435.0, 40.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005622499738819897, -0.0005189164076000452, -0.0004755828995257616, -0.0004322493332438171, -0.00038891579606570303, -0.000345582258887589, -0.00030224869260564446, -0.0002589151554275304, -0.00021558161824941635, -0.0001722480810713023, -0.000128914529341273, -8.558097761124372e-05, -4.224744043312967e-05, 1.0860967449843884e-06, 4.44196630269289e-05, 8.775320020504296e-05, 0.00013108673738315701, 0.00017442027456127107, 0.00021775382629130036, 0.00026108737802132964, 0.0003044209151994437, 0.00034775445237755775, 0.00039108801865950227, 0.0004344215558376163, 0.0004777550930157304, 0.0005210886592976749, 0.0005644221673719585, 0.000607755733653903, 0.0006510892417281866, 0.0006944228080101311, 0.0007377563742920756, 0.0007810898823663592, 0.0008244235068559647, 0.0008677570731379092, 0.0009110905812121928, 0.0009544241474941373, 0.0009977576555684209, 0.0010410912800580263, 0.00108442478813231, 0.0011277582962065935, 0.0011710918042808771, 0.0012144253123551607, 0.0012577589368447661, 0.0013010924449190497, 0.0013444259529933333, 0.0013877595774829388, 0.0014310930855572224, 0.001474426593631506, 0.0015177602181211114, 0.001561093726195395, 0.0016044273506850004, 0.001647760858759284, 0.0016910943668335676, 0.0017344278749078512, 0.0017777614993974566, 0.0018210950074717402, 0.0018644286319613457, 0.0019077621400356293, 0.0019510957645252347, 0.0019944291561841965, 0.0020377628970891237, 0.0020810964051634073, 0.002124429913237691, 0.0021677634213119745, 0.002211096929386258]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 4.0, 2.0, 2.0, 9.0, 9.0, 15.0, 11.0, 9.0, 18.0, 21.0, 15.0, 16.0, 19.0, 23.0, 31.0, 35.0, 20.0, 24.0, 36.0, 28.0, 31.0, 40.0, 45.0, 35.0, 47.0, 42.0, 29.0, 35.0, 24.0, 22.0, 26.0, 32.0, 35.0, 29.0, 19.0, 23.0, 16.0, 14.0, 22.0, 12.0, 23.0, 13.0, 4.0, 4.0, 9.0, 5.0, 5.0, 4.0, 2.0, 4.0, 2.0, 5.0, 2.0, 0.0, 2.0], "bins": [-0.0002599358558654785, -0.0002520829439163208, -0.0002442300319671631, -0.00023637712001800537, -0.00022852420806884766, -0.00022067129611968994, -0.00021281838417053223, -0.0002049654722213745, -0.0001971125602722168, -0.00018925964832305908, -0.00018140673637390137, -0.00017355382442474365, -0.00016570091247558594, -0.00015784800052642822, -0.0001499950885772705, -0.0001421421766281128, -0.00013428926467895508, -0.00012643635272979736, -0.00011858344078063965, -0.00011073052883148193, -0.00010287761688232422, -9.50247049331665e-05, -8.717179298400879e-05, -7.931888103485107e-05, -7.146596908569336e-05, -6.361305713653564e-05, -5.576014518737793e-05, -4.7907233238220215e-05, -4.00543212890625e-05, -3.2201409339904785e-05, -2.434849739074707e-05, -1.6495585441589355e-05, -8.64267349243164e-06, -7.897615432739258e-07, 7.063150405883789e-06, 1.4916062355041504e-05, 2.276897430419922e-05, 3.0621886253356934e-05, 3.847479820251465e-05, 4.632771015167236e-05, 5.418062210083008e-05, 6.203353404998779e-05, 6.988644599914551e-05, 7.773935794830322e-05, 8.559226989746094e-05, 9.344518184661865e-05, 0.00010129809379577637, 0.00010915100574493408, 0.0001170039176940918, 0.0001248568296432495, 0.00013270974159240723, 0.00014056265354156494, 0.00014841556549072266, 0.00015626847743988037, 0.00016412138938903809, 0.0001719743013381958, 0.00017982721328735352, 0.00018768012523651123, 0.00019553303718566895, 0.00020338594913482666, 0.00021123886108398438, 0.0002190917730331421, 0.0002269446849822998, 0.00023479759693145752, 0.00024265050888061523]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 2.0, 5.0, 3.0, 7.0, 6.0, 19.0, 22.0, 11.0, 20.0, 24.0, 30.0, 44.0, 32.0, 43.0, 47.0, 53.0, 55.0, 55.0, 49.0, 52.0, 48.0, 43.0, 48.0, 49.0, 42.0, 33.0, 30.0, 30.0, 19.0, 21.0, 13.0, 10.0, 8.0, 10.0, 9.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.32421875, -5.116455078125, -4.90869140625, -4.700927734375, -4.4931640625, -4.285400390625, -4.07763671875, -3.869873046875, -3.662109375, -3.454345703125, -3.24658203125, -3.038818359375, -2.8310546875, -2.623291015625, -2.41552734375, -2.207763671875, -2.0, -1.792236328125, -1.58447265625, -1.376708984375, -1.1689453125, -0.961181640625, -0.75341796875, -0.545654296875, -0.337890625, -0.130126953125, 0.07763671875, 0.285400390625, 0.4931640625, 0.700927734375, 0.90869140625, 1.116455078125, 1.32421875, 1.531982421875, 1.73974609375, 1.947509765625, 2.1552734375, 2.363037109375, 2.57080078125, 2.778564453125, 2.986328125, 3.194091796875, 3.40185546875, 3.609619140625, 3.8173828125, 4.025146484375, 4.23291015625, 4.440673828125, 4.6484375, 4.856201171875, 5.06396484375, 5.271728515625, 5.4794921875, 5.687255859375, 5.89501953125, 6.102783203125, 6.310546875, 6.518310546875, 6.72607421875, 6.933837890625, 7.1416015625, 7.349365234375, 7.55712890625, 7.764892578125, 7.97265625]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 8.0, 8.0, 7.0, 16.0, 28.0, 37.0, 57.0, 72.0, 131.0, 186.0, 283.0, 497.0, 910.0, 1935.0, 5170.0, 17664.0, 84783.0, 556543.0, 313093.0, 48808.0, 11377.0, 3615.0, 1508.0, 700.0, 412.0, 248.0, 135.0, 101.0, 85.0, 41.0, 32.0, 22.0, 16.0, 14.0, 1.0, 8.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.83203125, -6.6104736328125, -6.388916015625, -6.1673583984375, -5.94580078125, -5.7242431640625, -5.502685546875, -5.2811279296875, -5.0595703125, -4.8380126953125, -4.616455078125, -4.3948974609375, -4.17333984375, -3.9517822265625, -3.730224609375, -3.5086669921875, -3.287109375, -3.0655517578125, -2.843994140625, -2.6224365234375, -2.40087890625, -2.1793212890625, -1.957763671875, -1.7362060546875, -1.5146484375, -1.2930908203125, -1.071533203125, -0.8499755859375, -0.62841796875, -0.4068603515625, -0.185302734375, 0.0362548828125, 0.2578125, 0.4793701171875, 0.700927734375, 0.9224853515625, 1.14404296875, 1.3656005859375, 1.587158203125, 1.8087158203125, 2.0302734375, 2.2518310546875, 2.473388671875, 2.6949462890625, 2.91650390625, 3.1380615234375, 3.359619140625, 3.5811767578125, 3.802734375, 4.0242919921875, 4.245849609375, 4.4674072265625, 4.68896484375, 4.9105224609375, 5.132080078125, 5.3536376953125, 5.5751953125, 5.7967529296875, 6.018310546875, 6.2398681640625, 6.46142578125, 6.6829833984375, 6.904541015625, 7.1260986328125, 7.34765625]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 3.0, 6.0, 9.0, 9.0, 16.0, 11.0, 17.0, 22.0, 26.0, 26.0, 47.0, 33.0, 47.0, 47.0, 53.0, 63.0, 156.0, 1923.0, 122.0, 51.0, 58.0, 42.0, 38.0, 44.0, 29.0, 26.0, 22.0, 15.0, 22.0, 9.0, 18.0, 8.0, 9.0, 5.0, 15.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.765625, -19.0703125, -18.375, -17.6796875, -16.984375, -16.2890625, -15.59375, -14.8984375, -14.203125, -13.5078125, -12.8125, -12.1171875, -11.421875, -10.7265625, -10.03125, -9.3359375, -8.640625, -7.9453125, -7.25, -6.5546875, -5.859375, -5.1640625, -4.46875, -3.7734375, -3.078125, -2.3828125, -1.6875, -0.9921875, -0.296875, 0.3984375, 1.09375, 1.7890625, 2.484375, 3.1796875, 3.875, 4.5703125, 5.265625, 5.9609375, 6.65625, 7.3515625, 8.046875, 8.7421875, 9.4375, 10.1328125, 10.828125, 11.5234375, 12.21875, 12.9140625, 13.609375, 14.3046875, 15.0, 15.6953125, 16.390625, 17.0859375, 17.78125, 18.4765625, 19.171875, 19.8671875, 20.5625, 21.2578125, 21.953125, 22.6484375, 23.34375, 24.0390625, 24.734375]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 13.0, 6.0, 8.0, 7.0, 21.0, 9.0, 20.0, 13.0, 18.0, 27.0, 31.0, 58.0, 70.0, 86.0, 158.0, 401.0, 1559.0, 3054640.0, 86864.0, 911.0, 285.0, 138.0, 89.0, 49.0, 62.0, 31.0, 26.0, 30.0, 16.0, 12.0, 14.0, 12.0, 11.0, 6.0, 2.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-57.5625, -55.95654296875, -54.3505859375, -52.74462890625, -51.138671875, -49.53271484375, -47.9267578125, -46.32080078125, -44.71484375, -43.10888671875, -41.5029296875, -39.89697265625, -38.291015625, -36.68505859375, -35.0791015625, -33.47314453125, -31.8671875, -30.26123046875, -28.6552734375, -27.04931640625, -25.443359375, -23.83740234375, -22.2314453125, -20.62548828125, -19.01953125, -17.41357421875, -15.8076171875, -14.20166015625, -12.595703125, -10.98974609375, -9.3837890625, -7.77783203125, -6.171875, -4.56591796875, -2.9599609375, -1.35400390625, 0.251953125, 1.85791015625, 3.4638671875, 5.06982421875, 6.67578125, 8.28173828125, 9.8876953125, 11.49365234375, 13.099609375, 14.70556640625, 16.3115234375, 17.91748046875, 19.5234375, 21.12939453125, 22.7353515625, 24.34130859375, 25.947265625, 27.55322265625, 29.1591796875, 30.76513671875, 32.37109375, 33.97705078125, 35.5830078125, 37.18896484375, 38.794921875, 40.40087890625, 42.0068359375, 43.61279296875, 45.21875]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 23.0, 272.0, 547.0, 159.0, 10.0, 4.0, 3.0], "bins": [-83.44695281982422, -82.04154205322266, -80.6361312866211, -79.23072052001953, -77.82530975341797, -76.4198989868164, -75.01448822021484, -73.60906982421875, -72.20365905761719, -70.79824829101562, -69.39283752441406, -67.9874267578125, -66.58201599121094, -65.17660522460938, -63.77119064331055, -62.365779876708984, -60.96037292480469, -59.554962158203125, -58.14955139160156, -56.744140625, -55.33872985839844, -53.93331527709961, -52.52790451049805, -51.122493743896484, -49.71708297729492, -48.31167221069336, -46.9062614440918, -45.500850677490234, -44.095436096191406, -42.690025329589844, -41.28461456298828, -39.87920379638672, -38.473793029785156, -37.068382263183594, -35.66297149658203, -34.25756072998047, -32.852149963378906, -31.44673728942871, -30.041324615478516, -28.635913848876953, -27.230504989624023, -25.82509422302246, -24.419681549072266, -23.014270782470703, -21.60886001586914, -20.203449249267578, -18.798038482666016, -17.39262580871582, -15.987215042114258, -14.581804275512695, -13.176392555236816, -11.770980834960938, -10.365570068359375, -8.960159301757812, -7.554747581481934, -6.149335861206055, -4.743925094604492, -3.3385138511657715, -1.9331026077270508, -0.5276913642883301, 0.8777198791503906, 2.2831311225891113, 3.688542366027832, 5.093954086303711, 6.499364852905273]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 4.0, 3.0, 9.0, 5.0, 6.0, 9.0, 20.0, 6.0, 18.0, 16.0, 15.0, 15.0, 19.0, 21.0, 30.0, 21.0, 24.0, 30.0, 23.0, 33.0, 40.0, 32.0, 38.0, 39.0, 47.0, 37.0, 36.0, 37.0, 30.0, 33.0, 38.0, 34.0, 30.0, 23.0, 18.0, 26.0, 23.0, 9.0, 12.0, 18.0, 15.0, 14.0, 10.0, 5.0, 8.0, 4.0, 5.0, 8.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-50.20411682128906, -48.70069122314453, -47.197265625, -45.69384002685547, -44.19041442871094, -42.68699264526367, -41.18356704711914, -39.68014144897461, -38.17671585083008, -36.67329025268555, -35.169864654541016, -33.666439056396484, -32.16301727294922, -30.659589767456055, -29.156166076660156, -27.652740478515625, -26.149314880371094, -24.645889282226562, -23.14246368408203, -21.639039993286133, -20.1356143951416, -18.63218879699707, -17.128765106201172, -15.62533950805664, -14.12191390991211, -12.618488311767578, -11.115063667297363, -9.611639022827148, -8.108213424682617, -6.604788303375244, -5.101363182067871, -3.5979385375976562, -2.0945167541503906, -0.5910916328430176, 0.9123334884643555, 2.4157586097717285, 3.9191837310791016, 5.422608852386475, 6.926033973693848, 8.429458618164062, 9.932884216308594, 11.436309814453125, 12.93973445892334, 14.443159103393555, 15.946584701538086, 17.450010299682617, 18.953433990478516, 20.456859588623047, 21.960285186767578, 23.46371078491211, 24.96713638305664, 26.47056007385254, 27.97398567199707, 29.4774112701416, 30.9808349609375, 32.48426055908203, 33.98768615722656, 35.491111755371094, 36.994537353515625, 38.497962951660156, 40.00138854980469, 41.50481033325195, 43.008235931396484, 44.511661529541016, 46.01508712768555]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 3.0, 1.0, 8.0, 12.0, 17.0, 11.0, 21.0, 12.0, 29.0, 28.0, 45.0, 28.0, 52.0, 44.0, 57.0, 57.0, 57.0, 49.0, 37.0, 62.0, 44.0, 52.0, 50.0, 35.0, 35.0, 35.0, 24.0, 18.0, 16.0, 15.0, 9.0, 12.0, 9.0, 6.0, 5.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.51953125, -5.30352783203125, -5.0875244140625, -4.87152099609375, -4.655517578125, -4.43951416015625, -4.2235107421875, -4.00750732421875, -3.79150390625, -3.57550048828125, -3.3594970703125, -3.14349365234375, -2.927490234375, -2.71148681640625, -2.4954833984375, -2.27947998046875, -2.0634765625, -1.84747314453125, -1.6314697265625, -1.41546630859375, -1.199462890625, -0.98345947265625, -0.7674560546875, -0.55145263671875, -0.33544921875, -0.11944580078125, 0.0965576171875, 0.31256103515625, 0.528564453125, 0.74456787109375, 0.9605712890625, 1.17657470703125, 1.392578125, 1.60858154296875, 1.8245849609375, 2.04058837890625, 2.256591796875, 2.47259521484375, 2.6885986328125, 2.90460205078125, 3.12060546875, 3.33660888671875, 3.5526123046875, 3.76861572265625, 3.984619140625, 4.20062255859375, 4.4166259765625, 4.63262939453125, 4.8486328125, 5.06463623046875, 5.2806396484375, 5.49664306640625, 5.712646484375, 5.92864990234375, 6.1446533203125, 6.36065673828125, 6.57666015625, 6.79266357421875, 7.0086669921875, 7.22467041015625, 7.440673828125, 7.65667724609375, 7.8726806640625, 8.08868408203125, 8.3046875]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [4.0, 5.0, 3.0, 3.0, 5.0, 4.0, 6.0, 9.0, 14.0, 14.0, 17.0, 23.0, 29.0, 37.0, 53.0, 59.0, 80.0, 151.0, 186.0, 358.0, 1003.0, 5358.0, 55784.0, 1275761.0, 2686306.0, 155490.0, 10618.0, 1604.0, 528.0, 235.0, 144.0, 86.0, 73.0, 53.0, 52.0, 30.0, 23.0, 23.0, 19.0, 12.0, 8.0, 5.0, 6.0, 8.0, 0.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3984375, -13.8028564453125, -13.207275390625, -12.6116943359375, -12.01611328125, -11.4205322265625, -10.824951171875, -10.2293701171875, -9.6337890625, -9.0382080078125, -8.442626953125, -7.8470458984375, -7.25146484375, -6.6558837890625, -6.060302734375, -5.4647216796875, -4.869140625, -4.2735595703125, -3.677978515625, -3.0823974609375, -2.48681640625, -1.8912353515625, -1.295654296875, -0.7000732421875, -0.1044921875, 0.4910888671875, 1.086669921875, 1.6822509765625, 2.27783203125, 2.8734130859375, 3.468994140625, 4.0645751953125, 4.66015625, 5.2557373046875, 5.851318359375, 6.4468994140625, 7.04248046875, 7.6380615234375, 8.233642578125, 8.8292236328125, 9.4248046875, 10.0203857421875, 10.615966796875, 11.2115478515625, 11.80712890625, 12.4027099609375, 12.998291015625, 13.5938720703125, 14.189453125, 14.7850341796875, 15.380615234375, 15.9761962890625, 16.57177734375, 17.1673583984375, 17.762939453125, 18.3585205078125, 18.9541015625, 19.5496826171875, 20.145263671875, 20.7408447265625, 21.33642578125, 21.9320068359375, 22.527587890625, 23.1231689453125, 23.71875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 10.0, 4.0, 11.0, 19.0, 33.0, 35.0, 56.0, 107.0, 146.0, 200.0, 332.0, 453.0, 702.0, 673.0, 446.0, 311.0, 189.0, 123.0, 80.0, 42.0, 38.0, 19.0, 13.0, 13.0, 13.0, 2.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.390625, -29.543212890625, -28.69580078125, -27.848388671875, -27.0009765625, -26.153564453125, -25.30615234375, -24.458740234375, -23.611328125, -22.763916015625, -21.91650390625, -21.069091796875, -20.2216796875, -19.374267578125, -18.52685546875, -17.679443359375, -16.83203125, -15.984619140625, -15.13720703125, -14.289794921875, -13.4423828125, -12.594970703125, -11.74755859375, -10.900146484375, -10.052734375, -9.205322265625, -8.35791015625, -7.510498046875, -6.6630859375, -5.815673828125, -4.96826171875, -4.120849609375, -3.2734375, -2.426025390625, -1.57861328125, -0.731201171875, 0.1162109375, 0.963623046875, 1.81103515625, 2.658447265625, 3.505859375, 4.353271484375, 5.20068359375, 6.048095703125, 6.8955078125, 7.742919921875, 8.59033203125, 9.437744140625, 10.28515625, 11.132568359375, 11.97998046875, 12.827392578125, 13.6748046875, 14.522216796875, 15.36962890625, 16.217041015625, 17.064453125, 17.911865234375, 18.75927734375, 19.606689453125, 20.4541015625, 21.301513671875, 22.14892578125, 22.996337890625, 23.84375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 7.0, 2.0, 6.0, 11.0, 15.0, 27.0, 26.0, 49.0, 86.0, 100.0, 157.0, 273.0, 506.0, 3405.0, 2774772.0, 1411047.0, 2550.0, 510.0, 276.0, 154.0, 115.0, 60.0, 39.0, 27.0, 29.0, 7.0, 7.0, 7.0, 7.0, 8.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.3125, -71.4501953125, -68.587890625, -65.7255859375, -62.86328125, -60.0009765625, -57.138671875, -54.2763671875, -51.4140625, -48.5517578125, -45.689453125, -42.8271484375, -39.96484375, -37.1025390625, -34.240234375, -31.3779296875, -28.515625, -25.6533203125, -22.791015625, -19.9287109375, -17.06640625, -14.2041015625, -11.341796875, -8.4794921875, -5.6171875, -2.7548828125, 0.107421875, 2.9697265625, 5.83203125, 8.6943359375, 11.556640625, 14.4189453125, 17.28125, 20.1435546875, 23.005859375, 25.8681640625, 28.73046875, 31.5927734375, 34.455078125, 37.3173828125, 40.1796875, 43.0419921875, 45.904296875, 48.7666015625, 51.62890625, 54.4912109375, 57.353515625, 60.2158203125, 63.078125, 65.9404296875, 68.802734375, 71.6650390625, 74.52734375, 77.3896484375, 80.251953125, 83.1142578125, 85.9765625, 88.8388671875, 91.701171875, 94.5634765625, 97.42578125, 100.2880859375, 103.150390625, 106.0126953125, 108.875]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 9.0, 30.0, 88.0, 180.0, 288.0, 227.0, 140.0, 38.0, 14.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.565298080444336, -26.61611557006836, -22.666933059692383, -18.717750549316406, -14.768567085266113, -10.81938362121582, -6.870201110839844, -2.921018600463867, 1.0281639099121094, 4.977346420288086, 8.926528930664062, 12.875712394714355, 16.824893951416016, 20.774078369140625, 24.7232608795166, 28.672443389892578, 32.62162780761719, 36.5708122253418, 40.51999282836914, 44.46917724609375, 48.418357849121094, 52.3675422668457, 56.31672668457031, 60.265907287597656, 64.215087890625, 68.16426849365234, 72.11345672607422, 76.06263732910156, 80.0118179321289, 83.96099853515625, 87.91018676757812, 91.85936737060547, 95.80855560302734, 99.75773620605469, 103.70692443847656, 107.6561050415039, 111.60528564453125, 115.55447387695312, 119.50365447998047, 123.45283508300781, 127.40201568603516, 131.3511962890625, 135.30038452148438, 139.2495574951172, 143.19874572753906, 147.14793395996094, 151.09710693359375, 155.04629516601562, 158.9954833984375, 162.94467163085938, 166.8938446044922, 170.84303283691406, 174.79222106933594, 178.74139404296875, 182.69058227539062, 186.6397705078125, 190.5889434814453, 194.5381317138672, 198.4873046875, 202.43649291992188, 206.38568115234375, 210.33485412597656, 214.28404235839844, 218.23321533203125, 222.18240356445312]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 0.0, 4.0, 7.0, 4.0, 11.0, 10.0, 14.0, 13.0, 18.0, 16.0, 12.0, 18.0, 32.0, 34.0, 31.0, 21.0, 47.0, 37.0, 48.0, 46.0, 39.0, 38.0, 36.0, 47.0, 36.0, 44.0, 53.0, 38.0, 37.0, 29.0, 24.0, 26.0, 24.0, 21.0, 20.0, 16.0, 10.0, 16.0, 8.0, 5.0, 3.0, 6.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-68.73452758789062, -66.69884490966797, -64.66316223144531, -62.62747573852539, -60.59178924560547, -58.55610656738281, -56.520423889160156, -54.484737396240234, -52.44905090332031, -50.413368225097656, -48.377681732177734, -46.34199905395508, -44.306312561035156, -42.2706298828125, -40.234947204589844, -38.19926071166992, -36.163578033447266, -34.12789535522461, -32.09220886230469, -30.05652618408203, -28.02083969116211, -25.985157012939453, -23.949472427368164, -21.913787841796875, -19.878103256225586, -17.842418670654297, -15.806734085083008, -13.771050453186035, -11.735365867614746, -9.699681282043457, -7.663997650146484, -5.628313064575195, -3.5926284790039062, -1.5569441318511963, 0.47874021530151367, 2.5144243240356445, 4.550108909606934, 6.585793495178223, 8.621477127075195, 10.657161712646484, 12.692846298217773, 14.728530883789062, 16.76421546936035, 18.79990005493164, 20.835582733154297, 22.87126922607422, 24.906951904296875, 26.942636489868164, 28.978321075439453, 31.014005661010742, 33.04969024658203, 35.08537292480469, 37.12105941772461, 39.156742095947266, 41.19242858886719, 43.228111267089844, 45.2637939453125, 47.299476623535156, 49.33516311645508, 51.370845794677734, 53.406532287597656, 55.44221496582031, 57.47789764404297, 59.51358413696289, 61.54927062988281]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 6.0, 7.0, 13.0, 7.0, 14.0, 16.0, 20.0, 23.0, 34.0, 45.0, 37.0, 33.0, 52.0, 53.0, 61.0, 48.0, 57.0, 61.0, 62.0, 44.0, 54.0, 34.0, 40.0, 33.0, 33.0, 28.0, 18.0, 14.0, 15.0, 12.0, 9.0, 7.0, 4.0, 3.0, 6.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.86328125, -5.63385009765625, -5.4044189453125, -5.17498779296875, -4.945556640625, -4.71612548828125, -4.4866943359375, -4.25726318359375, -4.02783203125, -3.79840087890625, -3.5689697265625, -3.33953857421875, -3.110107421875, -2.88067626953125, -2.6512451171875, -2.42181396484375, -2.1923828125, -1.96295166015625, -1.7335205078125, -1.50408935546875, -1.274658203125, -1.04522705078125, -0.8157958984375, -0.58636474609375, -0.35693359375, -0.12750244140625, 0.1019287109375, 0.33135986328125, 0.560791015625, 0.79022216796875, 1.0196533203125, 1.24908447265625, 1.478515625, 1.70794677734375, 1.9373779296875, 2.16680908203125, 2.396240234375, 2.62567138671875, 2.8551025390625, 3.08453369140625, 3.31396484375, 3.54339599609375, 3.7728271484375, 4.00225830078125, 4.231689453125, 4.46112060546875, 4.6905517578125, 4.91998291015625, 5.1494140625, 5.37884521484375, 5.6082763671875, 5.83770751953125, 6.067138671875, 6.29656982421875, 6.5260009765625, 6.75543212890625, 6.98486328125, 7.21429443359375, 7.4437255859375, 7.67315673828125, 7.902587890625, 8.13201904296875, 8.3614501953125, 8.59088134765625, 8.8203125]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 5.0, 11.0, 8.0, 13.0, 26.0, 34.0, 51.0, 82.0, 156.0, 245.0, 499.0, 831.0, 1574.0, 2902.0, 5565.0, 10765.0, 22057.0, 46289.0, 108495.0, 382727.0, 292566.0, 92841.0, 40864.0, 19507.0, 9670.0, 4940.0, 2684.0, 1373.0, 758.0, 414.0, 246.0, 133.0, 71.0, 60.0, 37.0, 16.0, 11.0, 10.0, 8.0, 0.0, 7.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8701171875, -1.8115234375, -1.7529296875, -1.6943359375, -1.6357421875, -1.5771484375, -1.5185546875, -1.4599609375, -1.4013671875, -1.3427734375, -1.2841796875, -1.2255859375, -1.1669921875, -1.1083984375, -1.0498046875, -0.9912109375, -0.9326171875, -0.8740234375, -0.8154296875, -0.7568359375, -0.6982421875, -0.6396484375, -0.5810546875, -0.5224609375, -0.4638671875, -0.4052734375, -0.3466796875, -0.2880859375, -0.2294921875, -0.1708984375, -0.1123046875, -0.0537109375, 0.0048828125, 0.0634765625, 0.1220703125, 0.1806640625, 0.2392578125, 0.2978515625, 0.3564453125, 0.4150390625, 0.4736328125, 0.5322265625, 0.5908203125, 0.6494140625, 0.7080078125, 0.7666015625, 0.8251953125, 0.8837890625, 0.9423828125, 1.0009765625, 1.0595703125, 1.1181640625, 1.1767578125, 1.2353515625, 1.2939453125, 1.3525390625, 1.4111328125, 1.4697265625, 1.5283203125, 1.5869140625, 1.6455078125, 1.7041015625, 1.7626953125, 1.8212890625, 1.8798828125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 7.0, 9.0, 8.0, 2.0, 9.0, 9.0, 14.0, 21.0, 19.0, 14.0, 14.0, 26.0, 26.0, 33.0, 35.0, 36.0, 44.0, 35.0, 37.0, 51.0, 1068.0, 52.0, 56.0, 32.0, 43.0, 34.0, 53.0, 36.0, 30.0, 30.0, 19.0, 15.0, 22.0, 10.0, 16.0, 11.0, 11.0, 12.0, 13.0, 7.0, 4.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-4.2578125, -4.13885498046875, -4.0198974609375, -3.90093994140625, -3.781982421875, -3.66302490234375, -3.5440673828125, -3.42510986328125, -3.30615234375, -3.18719482421875, -3.0682373046875, -2.94927978515625, -2.830322265625, -2.71136474609375, -2.5924072265625, -2.47344970703125, -2.3544921875, -2.23553466796875, -2.1165771484375, -1.99761962890625, -1.878662109375, -1.75970458984375, -1.6407470703125, -1.52178955078125, -1.40283203125, -1.28387451171875, -1.1649169921875, -1.04595947265625, -0.927001953125, -0.80804443359375, -0.6890869140625, -0.57012939453125, -0.451171875, -0.33221435546875, -0.2132568359375, -0.09429931640625, 0.024658203125, 0.14361572265625, 0.2625732421875, 0.38153076171875, 0.50048828125, 0.61944580078125, 0.7384033203125, 0.85736083984375, 0.976318359375, 1.09527587890625, 1.2142333984375, 1.33319091796875, 1.4521484375, 1.57110595703125, 1.6900634765625, 1.80902099609375, 1.927978515625, 2.04693603515625, 2.1658935546875, 2.28485107421875, 2.40380859375, 2.52276611328125, 2.6417236328125, 2.76068115234375, 2.879638671875, 2.99859619140625, 3.1175537109375, 3.23651123046875, 3.35546875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 1.0, 8.0, 6.0, 8.0, 7.0, 6.0, 16.0, 20.0, 30.0, 41.0, 88.0, 97.0, 154.0, 212.0, 321.0, 531.0, 766.0, 1177.0, 1732.0, 2731.0, 4157.0, 6355.0, 9660.0, 15437.0, 25256.0, 43443.0, 76951.0, 154355.0, 1399073.0, 160879.0, 78836.0, 44544.0, 25973.0, 15746.0, 9907.0, 6347.0, 4201.0, 2771.0, 1724.0, 1115.0, 780.0, 528.0, 392.0, 216.0, 180.0, 115.0, 74.0, 57.0, 45.0, 28.0, 13.0, 11.0, 7.0, 9.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1826171875, -1.1462554931640625, -1.109893798828125, -1.0735321044921875, -1.03717041015625, -1.0008087158203125, -0.964447021484375, -0.9280853271484375, -0.8917236328125, -0.8553619384765625, -0.819000244140625, -0.7826385498046875, -0.74627685546875, -0.7099151611328125, -0.673553466796875, -0.6371917724609375, -0.600830078125, -0.5644683837890625, -0.528106689453125, -0.4917449951171875, -0.45538330078125, -0.4190216064453125, -0.382659912109375, -0.3462982177734375, -0.3099365234375, -0.2735748291015625, -0.237213134765625, -0.2008514404296875, -0.16448974609375, -0.1281280517578125, -0.091766357421875, -0.0554046630859375, -0.01904296875, 0.0173187255859375, 0.053680419921875, 0.0900421142578125, 0.12640380859375, 0.1627655029296875, 0.199127197265625, 0.2354888916015625, 0.2718505859375, 0.3082122802734375, 0.344573974609375, 0.3809356689453125, 0.41729736328125, 0.4536590576171875, 0.490020751953125, 0.5263824462890625, 0.562744140625, 0.5991058349609375, 0.635467529296875, 0.6718292236328125, 0.70819091796875, 0.7445526123046875, 0.780914306640625, 0.8172760009765625, 0.8536376953125, 0.8899993896484375, 0.926361083984375, 0.9627227783203125, 0.99908447265625, 1.0354461669921875, 1.071807861328125, 1.1081695556640625, 1.14453125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 4.0, 10.0, 10.0, 16.0, 18.0, 28.0, 32.0, 32.0, 44.0, 61.0, 88.0, 90.0, 86.0, 80.0, 88.0, 76.0, 58.0, 47.0, 38.0, 21.0, 20.0, 7.0, 16.0, 4.0, 10.0, 4.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004775524139404297, -0.0004595629870891571, -0.0004415735602378845, -0.00042358413338661194, -0.00040559470653533936, -0.00038760527968406677, -0.0003696158528327942, -0.0003516264259815216, -0.000333636999130249, -0.00031564757227897644, -0.00029765814542770386, -0.0002796687185764313, -0.0002616792917251587, -0.0002436898648738861, -0.00022570043802261353, -0.00020771101117134094, -0.00018972158432006836, -0.00017173215746879578, -0.0001537427306175232, -0.0001357533037662506, -0.00011776387691497803, -9.977445006370544e-05, -8.178502321243286e-05, -6.379559636116028e-05, -4.5806169509887695e-05, -2.7816742658615112e-05, -9.82731580734253e-06, 8.162111043930054e-06, 2.6151537895202637e-05, 4.414096474647522e-05, 6.21303915977478e-05, 8.011981844902039e-05, 9.810924530029297e-05, 0.00011609867215156555, 0.00013408809900283813, 0.00015207752585411072, 0.0001700669527053833, 0.00018805637955665588, 0.00020604580640792847, 0.00022403523325920105, 0.00024202466011047363, 0.0002600140869617462, 0.0002780035138130188, 0.0002959929406642914, 0.00031398236751556396, 0.00033197179436683655, 0.00034996122121810913, 0.0003679506480693817, 0.0003859400749206543, 0.0004039295017719269, 0.00042191892862319946, 0.00043990835547447205, 0.00045789778232574463, 0.0004758872091770172, 0.0004938766360282898, 0.0005118660628795624, 0.000529855489730835, 0.0005478449165821075, 0.0005658343434333801, 0.0005838237702846527, 0.0006018131971359253, 0.0006198026239871979, 0.0006377920508384705, 0.000655781477689743, 0.0006737709045410156]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 7.0, 4.0, 9.0, 13.0, 5.0, 3.0, 9.0, 28.0, 17.0, 41.0, 51.0, 92.0, 204.0, 370.0, 1346.0, 1043122.0, 2380.0, 389.0, 173.0, 104.0, 54.0, 42.0, 22.0, 12.0, 16.0, 14.0, 7.0, 7.0, 1.0, 4.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0177154541015625, -0.01724386215209961, -0.01677227020263672, -0.016300678253173828, -0.015829086303710938, -0.015357494354248047, -0.014885902404785156, -0.014414310455322266, -0.013942718505859375, -0.013471126556396484, -0.012999534606933594, -0.012527942657470703, -0.012056350708007812, -0.011584758758544922, -0.011113166809082031, -0.01064157485961914, -0.01016998291015625, -0.00969839096069336, -0.009226799011230469, -0.008755207061767578, -0.008283615112304688, -0.007812023162841797, -0.007340431213378906, -0.006868839263916016, -0.006397247314453125, -0.005925655364990234, -0.005454063415527344, -0.004982471466064453, -0.0045108795166015625, -0.004039287567138672, -0.0035676956176757812, -0.0030961036682128906, -0.00262451171875, -0.0021529197692871094, -0.0016813278198242188, -0.0012097358703613281, -0.0007381439208984375, -0.0002665519714355469, 0.00020503997802734375, 0.0006766319274902344, 0.001148223876953125, 0.0016198158264160156, 0.0020914077758789062, 0.002562999725341797, 0.0030345916748046875, 0.003506183624267578, 0.003977775573730469, 0.004449367523193359, 0.00492095947265625, 0.005392551422119141, 0.005864143371582031, 0.006335735321044922, 0.0068073272705078125, 0.007278919219970703, 0.007750511169433594, 0.008222103118896484, 0.008693695068359375, 0.009165287017822266, 0.009636878967285156, 0.010108470916748047, 0.010580062866210938, 0.011051654815673828, 0.011523246765136719, 0.01199483871459961, 0.0124664306640625]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 45.0, 323.0, 511.0, 122.0, 9.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001843601348809898, -0.0018089509103447199, -0.0017743004718795419, -0.0017396500334143639, -0.0017049995949491858, -0.0016703491564840078, -0.0016356987180188298, -0.0016010482795536518, -0.0015663978410884738, -0.0015317474026232958, -0.0014970969641581178, -0.0014624465256929398, -0.0014277960872277617, -0.0013931456487625837, -0.0013584952102974057, -0.0013238447718322277, -0.0012891942169517279, -0.0012545437784865499, -0.0012198933400213718, -0.0011852429015561938, -0.0011505924630910158, -0.0011159420246258378, -0.0010812915861606598, -0.0010466411476954818, -0.0010119907092303038, -0.0009773402707651258, -0.0009426898322999477, -0.0009080393938347697, -0.0008733889553695917, -0.0008387385169044137, -0.0008040880784392357, -0.0007694376399740577, -0.0007347872015088797, -0.0007001367630437016, -0.0006654863245785236, -0.0006308358861133456, -0.0005961854476481676, -0.0005615350091829896, -0.0005268845707178116, -0.0004922341322526336, -0.00045758363557979465, -0.00042293319711461663, -0.0003882827586494386, -0.0003536323201842606, -0.0003189818817190826, -0.0002843314432539046, -0.0002496809756848961, -0.0002150305372197181, -0.00018038009875454009, -0.00014572966028936207, -0.00011107921454822645, -7.642876880709082e-05, -4.1778330341912806e-05, -7.127891876734793e-06, 2.7522561140358448e-05, 6.217299960553646e-05, 9.682343807071447e-05, 0.0001314738765358925, 0.0001661243150010705, 0.00020077476801816374, 0.00023542520648334175, 0.00027007563039660454, 0.000304726097965613, 0.000339376536430791, 0.00037402697489596903]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 5.0, 6.0, 4.0, 11.0, 13.0, 10.0, 12.0, 20.0, 17.0, 15.0, 30.0, 31.0, 19.0, 28.0, 37.0, 36.0, 37.0, 41.0, 44.0, 31.0, 44.0, 42.0, 41.0, 32.0, 32.0, 35.0, 35.0, 33.0, 27.0, 32.0, 25.0, 22.0, 30.0, 25.0, 14.0, 10.0, 10.0, 7.0, 5.0, 8.0, 14.0, 8.0, 8.0, 3.0, 4.0, 2.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018525123596191406, -0.0001787003129720688, -0.0001721493899822235, -0.00016559846699237823, -0.00015904754400253296, -0.00015249662101268768, -0.0001459456980228424, -0.00013939477503299713, -0.00013284385204315186, -0.00012629292905330658, -0.0001197420060634613, -0.00011319108307361603, -0.00010664016008377075, -0.00010008923709392548, -9.35383141040802e-05, -8.698739111423492e-05, -8.043646812438965e-05, -7.388554513454437e-05, -6.73346221446991e-05, -6.078369915485382e-05, -5.4232776165008545e-05, -4.768185317516327e-05, -4.113093018531799e-05, -3.458000719547272e-05, -2.802908420562744e-05, -2.1478161215782166e-05, -1.492723822593689e-05, -8.376315236091614e-06, -1.8253922462463379e-06, 4.725530743598938e-06, 1.1276453733444214e-05, 1.782737672328949e-05, 2.4378299713134766e-05, 3.092922270298004e-05, 3.748014569282532e-05, 4.403106868267059e-05, 5.058199167251587e-05, 5.7132914662361145e-05, 6.368383765220642e-05, 7.02347606420517e-05, 7.678568363189697e-05, 8.333660662174225e-05, 8.988752961158752e-05, 9.64384526014328e-05, 0.00010298937559127808, 0.00010954029858112335, 0.00011609122157096863, 0.0001226421445608139, 0.00012919306755065918, 0.00013574399054050446, 0.00014229491353034973, 0.000148845836520195, 0.00015539675951004028, 0.00016194768249988556, 0.00016849860548973083, 0.0001750495284795761, 0.0001816004514694214, 0.00018815137445926666, 0.00019470229744911194, 0.00020125322043895721, 0.0002078041434288025, 0.00021435506641864777, 0.00022090598940849304, 0.00022745691239833832, 0.0002340078353881836]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 6.0, 7.0, 13.0, 7.0, 14.0, 16.0, 20.0, 23.0, 34.0, 45.0, 37.0, 33.0, 52.0, 53.0, 61.0, 48.0, 57.0, 61.0, 62.0, 44.0, 54.0, 34.0, 40.0, 33.0, 33.0, 28.0, 18.0, 14.0, 15.0, 12.0, 9.0, 7.0, 4.0, 3.0, 6.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.86328125, -5.63385009765625, -5.4044189453125, -5.17498779296875, -4.945556640625, -4.71612548828125, -4.4866943359375, -4.25726318359375, -4.02783203125, -3.79840087890625, -3.5689697265625, -3.33953857421875, -3.110107421875, -2.88067626953125, -2.6512451171875, -2.42181396484375, -2.1923828125, -1.96295166015625, -1.7335205078125, -1.50408935546875, -1.274658203125, -1.04522705078125, -0.8157958984375, -0.58636474609375, -0.35693359375, -0.12750244140625, 0.1019287109375, 0.33135986328125, 0.560791015625, 0.79022216796875, 1.0196533203125, 1.24908447265625, 1.478515625, 1.70794677734375, 1.9373779296875, 2.16680908203125, 2.396240234375, 2.62567138671875, 2.8551025390625, 3.08453369140625, 3.31396484375, 3.54339599609375, 3.7728271484375, 4.00225830078125, 4.231689453125, 4.46112060546875, 4.6905517578125, 4.91998291015625, 5.1494140625, 5.37884521484375, 5.6082763671875, 5.83770751953125, 6.067138671875, 6.29656982421875, 6.5260009765625, 6.75543212890625, 6.98486328125, 7.21429443359375, 7.4437255859375, 7.67315673828125, 7.902587890625, 8.13201904296875, 8.3614501953125, 8.59088134765625, 8.8203125]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 13.0, 13.0, 15.0, 26.0, 39.0, 67.0, 115.0, 174.0, 265.0, 480.0, 788.0, 1410.0, 2739.0, 5427.0, 12391.0, 32807.0, 112905.0, 519850.0, 261101.0, 60781.0, 20234.0, 8370.0, 3880.0, 2011.0, 1074.0, 644.0, 389.0, 214.0, 111.0, 77.0, 53.0, 35.0, 24.0, 13.0, 7.0, 8.0, 4.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.896484375, -3.745269775390625, -3.59405517578125, -3.442840576171875, -3.2916259765625, -3.140411376953125, -2.98919677734375, -2.837982177734375, -2.686767578125, -2.535552978515625, -2.38433837890625, -2.233123779296875, -2.0819091796875, -1.930694580078125, -1.77947998046875, -1.628265380859375, -1.47705078125, -1.325836181640625, -1.17462158203125, -1.023406982421875, -0.8721923828125, -0.720977783203125, -0.56976318359375, -0.418548583984375, -0.267333984375, -0.116119384765625, 0.03509521484375, 0.186309814453125, 0.3375244140625, 0.488739013671875, 0.63995361328125, 0.791168212890625, 0.9423828125, 1.093597412109375, 1.24481201171875, 1.396026611328125, 1.5472412109375, 1.698455810546875, 1.84967041015625, 2.000885009765625, 2.152099609375, 2.303314208984375, 2.45452880859375, 2.605743408203125, 2.7569580078125, 2.908172607421875, 3.05938720703125, 3.210601806640625, 3.36181640625, 3.513031005859375, 3.66424560546875, 3.815460205078125, 3.9666748046875, 4.117889404296875, 4.26910400390625, 4.420318603515625, 4.571533203125, 4.722747802734375, 4.87396240234375, 5.025177001953125, 5.1763916015625, 5.327606201171875, 5.47882080078125, 5.630035400390625, 5.78125]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 7.0, 10.0, 8.0, 14.0, 14.0, 22.0, 19.0, 29.0, 36.0, 30.0, 29.0, 44.0, 38.0, 41.0, 57.0, 47.0, 130.0, 1915.0, 123.0, 64.0, 50.0, 45.0, 41.0, 41.0, 34.0, 31.0, 22.0, 16.0, 16.0, 18.0, 14.0, 7.0, 8.0, 9.0, 2.0, 2.0, 2.0, 8.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-26.875, -26.158935546875, -25.44287109375, -24.726806640625, -24.0107421875, -23.294677734375, -22.57861328125, -21.862548828125, -21.146484375, -20.430419921875, -19.71435546875, -18.998291015625, -18.2822265625, -17.566162109375, -16.85009765625, -16.134033203125, -15.41796875, -14.701904296875, -13.98583984375, -13.269775390625, -12.5537109375, -11.837646484375, -11.12158203125, -10.405517578125, -9.689453125, -8.973388671875, -8.25732421875, -7.541259765625, -6.8251953125, -6.109130859375, -5.39306640625, -4.677001953125, -3.9609375, -3.244873046875, -2.52880859375, -1.812744140625, -1.0966796875, -0.380615234375, 0.33544921875, 1.051513671875, 1.767578125, 2.483642578125, 3.19970703125, 3.915771484375, 4.6318359375, 5.347900390625, 6.06396484375, 6.780029296875, 7.49609375, 8.212158203125, 8.92822265625, 9.644287109375, 10.3603515625, 11.076416015625, 11.79248046875, 12.508544921875, 13.224609375, 13.940673828125, 14.65673828125, 15.372802734375, 16.0888671875, 16.804931640625, 17.52099609375, 18.237060546875, 18.953125]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 4.0, 2.0, 2.0, 9.0, 6.0, 7.0, 12.0, 16.0, 13.0, 17.0, 31.0, 26.0, 39.0, 50.0, 78.0, 127.0, 222.0, 598.0, 2546.0, 898669.0, 2238971.0, 2838.0, 626.0, 257.0, 165.0, 78.0, 57.0, 39.0, 34.0, 42.0, 23.0, 23.0, 20.0, 10.0, 12.0, 14.0, 8.0, 6.0, 3.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.40625, -31.20703125, -30.0078125, -28.80859375, -27.609375, -26.41015625, -25.2109375, -24.01171875, -22.8125, -21.61328125, -20.4140625, -19.21484375, -18.015625, -16.81640625, -15.6171875, -14.41796875, -13.21875, -12.01953125, -10.8203125, -9.62109375, -8.421875, -7.22265625, -6.0234375, -4.82421875, -3.625, -2.42578125, -1.2265625, -0.02734375, 1.171875, 2.37109375, 3.5703125, 4.76953125, 5.96875, 7.16796875, 8.3671875, 9.56640625, 10.765625, 11.96484375, 13.1640625, 14.36328125, 15.5625, 16.76171875, 17.9609375, 19.16015625, 20.359375, 21.55859375, 22.7578125, 23.95703125, 25.15625, 26.35546875, 27.5546875, 28.75390625, 29.953125, 31.15234375, 32.3515625, 33.55078125, 34.75, 35.94921875, 37.1484375, 38.34765625, 39.546875, 40.74609375, 41.9453125, 43.14453125, 44.34375]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 12.0, 238.0, 599.0, 148.0, 17.0], "bins": [-154.3876953125, -151.8712921142578, -149.35488891601562, -146.83848571777344, -144.32208251953125, -141.8056640625, -139.2892608642578, -136.77285766601562, -134.25645446777344, -131.74005126953125, -129.22364807128906, -126.70723724365234, -124.19083404541016, -121.67443084716797, -119.15802764892578, -116.64161682128906, -114.12521362304688, -111.60881042480469, -109.0924072265625, -106.57599639892578, -104.0595932006836, -101.5431900024414, -99.02678680419922, -96.5103759765625, -93.99398040771484, -91.47757720947266, -88.96117401123047, -86.44476318359375, -83.92835998535156, -81.41195678710938, -78.89555358886719, -76.379150390625, -73.86274719238281, -71.34634399414062, -68.82994079589844, -66.31352996826172, -63.79712677001953, -61.280723571777344, -58.764320373535156, -56.2479133605957, -53.73150634765625, -51.21510314941406, -48.69869613647461, -46.18229293823242, -43.66588592529297, -41.14948272705078, -38.633079528808594, -36.11667251586914, -33.60026550292969, -31.083860397338867, -28.567455291748047, -26.05105209350586, -23.534645080566406, -21.01824188232422, -18.5018367767334, -15.985431671142578, -13.469026565551758, -10.952621459960938, -8.436216354370117, -5.919812202453613, -3.403407096862793, -0.8870019912719727, 1.6294021606445312, 4.145807266235352, 6.662211894989014]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 6.0, 8.0, 12.0, 7.0, 8.0, 13.0, 32.0, 26.0, 23.0, 23.0, 35.0, 23.0, 25.0, 33.0, 33.0, 42.0, 46.0, 34.0, 45.0, 46.0, 34.0, 36.0, 38.0, 30.0, 41.0, 27.0, 37.0, 33.0, 34.0, 21.0, 13.0, 22.0, 16.0, 16.0, 19.0, 10.0, 5.0, 10.0, 5.0, 4.0, 6.0, 6.0, 5.0, 1.0, 5.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-60.764896392822266, -58.82918930053711, -56.89348602294922, -54.95777893066406, -53.022071838378906, -51.086368560791016, -49.15066146850586, -47.21495819091797, -45.27925109863281, -43.343544006347656, -41.407840728759766, -39.47213363647461, -37.53643035888672, -35.60072326660156, -33.665016174316406, -31.729310989379883, -29.79360580444336, -27.857900619506836, -25.922195434570312, -23.986488342285156, -22.050783157348633, -20.11507797241211, -18.179370880126953, -16.24366569519043, -14.307960510253906, -12.372255325317383, -10.436549186706543, -8.500843048095703, -6.56513786315918, -4.629432678222656, -2.6937265396118164, -0.7580204010009766, 1.1776847839355469, 3.1133904457092285, 5.04909610748291, 6.984801769256592, 8.920507431030273, 10.856212615966797, 12.791918754577637, 14.727624893188477, 16.663330078125, 18.599035263061523, 20.534740447998047, 22.470447540283203, 24.406152725219727, 26.34185791015625, 28.277565002441406, 30.21327018737793, 32.14897537231445, 34.08468246459961, 36.0203857421875, 37.956092834472656, 39.89179992675781, 41.8275032043457, 43.76321029663086, 45.69891357421875, 47.634620666503906, 49.57032775878906, 51.50603103637695, 53.44173812866211, 55.37744140625, 57.313148498535156, 59.24885559082031, 61.18456268310547, 63.12026596069336]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 8.0, 4.0, 11.0, 10.0, 13.0, 14.0, 20.0, 25.0, 29.0, 36.0, 42.0, 39.0, 41.0, 64.0, 52.0, 47.0, 49.0, 58.0, 58.0, 62.0, 39.0, 43.0, 43.0, 27.0, 39.0, 27.0, 22.0, 15.0, 19.0, 11.0, 11.0, 10.0, 4.0, 6.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.80078125, -5.56793212890625, -5.3350830078125, -5.10223388671875, -4.869384765625, -4.63653564453125, -4.4036865234375, -4.17083740234375, -3.93798828125, -3.70513916015625, -3.4722900390625, -3.23944091796875, -3.006591796875, -2.77374267578125, -2.5408935546875, -2.30804443359375, -2.0751953125, -1.84234619140625, -1.6094970703125, -1.37664794921875, -1.143798828125, -0.91094970703125, -0.6781005859375, -0.44525146484375, -0.21240234375, 0.02044677734375, 0.2532958984375, 0.48614501953125, 0.718994140625, 0.95184326171875, 1.1846923828125, 1.41754150390625, 1.650390625, 1.88323974609375, 2.1160888671875, 2.34893798828125, 2.581787109375, 2.81463623046875, 3.0474853515625, 3.28033447265625, 3.51318359375, 3.74603271484375, 3.9788818359375, 4.21173095703125, 4.444580078125, 4.67742919921875, 4.9102783203125, 5.14312744140625, 5.3759765625, 5.60882568359375, 5.8416748046875, 6.07452392578125, 6.307373046875, 6.54022216796875, 6.7730712890625, 7.00592041015625, 7.23876953125, 7.47161865234375, 7.7044677734375, 7.93731689453125, 8.170166015625, 8.40301513671875, 8.6358642578125, 8.86871337890625, 9.1015625]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 10.0, 9.0, 7.0, 10.0, 16.0, 15.0, 20.0, 20.0, 28.0, 37.0, 49.0, 37.0, 47.0, 88.0, 323.0, 5576.0, 2864937.0, 1319603.0, 2864.0, 226.0, 72.0, 55.0, 37.0, 36.0, 36.0, 27.0, 12.0, 18.0, 13.0, 14.0, 14.0, 11.0, 7.0, 8.0, 2.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.125, -35.69287109375, -34.2607421875, -32.82861328125, -31.396484375, -29.96435546875, -28.5322265625, -27.10009765625, -25.66796875, -24.23583984375, -22.8037109375, -21.37158203125, -19.939453125, -18.50732421875, -17.0751953125, -15.64306640625, -14.2109375, -12.77880859375, -11.3466796875, -9.91455078125, -8.482421875, -7.05029296875, -5.6181640625, -4.18603515625, -2.75390625, -1.32177734375, 0.1103515625, 1.54248046875, 2.974609375, 4.40673828125, 5.8388671875, 7.27099609375, 8.703125, 10.13525390625, 11.5673828125, 12.99951171875, 14.431640625, 15.86376953125, 17.2958984375, 18.72802734375, 20.16015625, 21.59228515625, 23.0244140625, 24.45654296875, 25.888671875, 27.32080078125, 28.7529296875, 30.18505859375, 31.6171875, 33.04931640625, 34.4814453125, 35.91357421875, 37.345703125, 38.77783203125, 40.2099609375, 41.64208984375, 43.07421875, 44.50634765625, 45.9384765625, 47.37060546875, 48.802734375, 50.23486328125, 51.6669921875, 53.09912109375, 54.53125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 5.0, 11.0, 22.0, 30.0, 42.0, 72.0, 118.0, 201.0, 327.0, 568.0, 843.0, 789.0, 443.0, 250.0, 134.0, 98.0, 56.0, 34.0, 22.0, 3.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.3125, -35.39697265625, -34.4814453125, -33.56591796875, -32.650390625, -31.73486328125, -30.8193359375, -29.90380859375, -28.98828125, -28.07275390625, -27.1572265625, -26.24169921875, -25.326171875, -24.41064453125, -23.4951171875, -22.57958984375, -21.6640625, -20.74853515625, -19.8330078125, -18.91748046875, -18.001953125, -17.08642578125, -16.1708984375, -15.25537109375, -14.33984375, -13.42431640625, -12.5087890625, -11.59326171875, -10.677734375, -9.76220703125, -8.8466796875, -7.93115234375, -7.015625, -6.10009765625, -5.1845703125, -4.26904296875, -3.353515625, -2.43798828125, -1.5224609375, -0.60693359375, 0.30859375, 1.22412109375, 2.1396484375, 3.05517578125, 3.970703125, 4.88623046875, 5.8017578125, 6.71728515625, 7.6328125, 8.54833984375, 9.4638671875, 10.37939453125, 11.294921875, 12.21044921875, 13.1259765625, 14.04150390625, 14.95703125, 15.87255859375, 16.7880859375, 17.70361328125, 18.619140625, 19.53466796875, 20.4501953125, 21.36572265625, 22.28125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 4.0, 6.0, 10.0, 21.0, 47.0, 65.0, 89.0, 107.0, 183.0, 324.0, 700.0, 5428.0, 4013674.0, 171043.0, 1468.0, 465.0, 218.0, 138.0, 93.0, 61.0, 34.0, 38.0, 27.0, 20.0, 8.0, 5.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.8125, -85.7255859375, -82.638671875, -79.5517578125, -76.46484375, -73.3779296875, -70.291015625, -67.2041015625, -64.1171875, -61.0302734375, -57.943359375, -54.8564453125, -51.76953125, -48.6826171875, -45.595703125, -42.5087890625, -39.421875, -36.3349609375, -33.248046875, -30.1611328125, -27.07421875, -23.9873046875, -20.900390625, -17.8134765625, -14.7265625, -11.6396484375, -8.552734375, -5.4658203125, -2.37890625, 0.7080078125, 3.794921875, 6.8818359375, 9.96875, 13.0556640625, 16.142578125, 19.2294921875, 22.31640625, 25.4033203125, 28.490234375, 31.5771484375, 34.6640625, 37.7509765625, 40.837890625, 43.9248046875, 47.01171875, 50.0986328125, 53.185546875, 56.2724609375, 59.359375, 62.4462890625, 65.533203125, 68.6201171875, 71.70703125, 74.7939453125, 77.880859375, 80.9677734375, 84.0546875, 87.1416015625, 90.228515625, 93.3154296875, 96.40234375, 99.4892578125, 102.576171875, 105.6630859375, 108.75]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 11.0, 29.0, 45.0, 87.0, 172.0, 161.0, 181.0, 146.0, 95.0, 50.0, 16.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.82491302490234, -70.96292114257812, -68.1009292602539, -65.23893737792969, -62.376953125, -59.51496124267578, -56.65296936035156, -53.790977478027344, -50.92898941040039, -48.06699752807617, -45.20500946044922, -42.343017578125, -39.48102569580078, -36.61903762817383, -33.75704574584961, -30.895055770874023, -28.033065795898438, -25.17107582092285, -22.309085845947266, -19.447093963623047, -16.58510398864746, -13.723114013671875, -10.861122131347656, -7.99913215637207, -5.137142181396484, -2.2751517295837402, 0.5868387222290039, 3.4488296508789062, 6.310819625854492, 9.172809600830078, 12.034801483154297, 14.896791458129883, 17.75878143310547, 20.620771408081055, 23.48276138305664, 26.34475326538086, 29.206743240356445, 32.06873321533203, 34.93072509765625, 37.79271697998047, 40.65470504760742, 43.51669692993164, 46.378684997558594, 49.24067687988281, 52.10266876220703, 54.964656829833984, 57.8266487121582, 60.688636779785156, 63.550628662109375, 66.4126205444336, 69.27461242675781, 72.1365966796875, 74.99858856201172, 77.86058044433594, 80.72257232666016, 83.58456420898438, 86.44654846191406, 89.30854034423828, 92.1705322265625, 95.03251647949219, 97.8945083618164, 100.75650024414062, 103.61849212646484, 106.48048400878906, 109.34247589111328]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 7.0, 3.0, 4.0, 6.0, 6.0, 11.0, 15.0, 19.0, 16.0, 14.0, 23.0, 26.0, 29.0, 35.0, 31.0, 33.0, 36.0, 30.0, 31.0, 33.0, 37.0, 30.0, 43.0, 47.0, 48.0, 35.0, 43.0, 36.0, 36.0, 26.0, 30.0, 19.0, 23.0, 15.0, 22.0, 21.0, 18.0, 19.0, 11.0, 10.0, 10.0, 4.0, 6.0, 4.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-58.76618957519531, -57.00148010253906, -55.23677062988281, -53.47206115722656, -51.70735168457031, -49.94264221191406, -48.17793655395508, -46.41322708129883, -44.64851760864258, -42.88380813598633, -41.11909866333008, -39.35438919067383, -37.589683532714844, -35.824974060058594, -34.060264587402344, -32.295555114746094, -30.530845642089844, -28.766136169433594, -27.001426696777344, -25.236719131469727, -23.472009658813477, -21.707300186157227, -19.94259262084961, -18.17788314819336, -16.41317367553711, -14.64846420288086, -12.883755683898926, -11.119047164916992, -9.354337692260742, -7.589628219604492, -5.824919700622559, -4.060211181640625, -2.295501708984375, -0.5307927131652832, 1.2339162826538086, 2.9986252784729004, 4.763334274291992, 6.528043746948242, 8.292752265930176, 10.05746078491211, 11.82217025756836, 13.58687973022461, 15.351588249206543, 17.116296768188477, 18.881006240844727, 20.645715713500977, 22.410423278808594, 24.175132751464844, 25.939842224121094, 27.704551696777344, 29.469261169433594, 31.23396873474121, 32.998680114746094, 34.763389587402344, 36.52809524536133, 38.29280471801758, 40.05751419067383, 41.82222366333008, 43.58693313598633, 45.35164260864258, 47.11634826660156, 48.88105773925781, 50.64576721191406, 52.41047668457031, 54.17518615722656]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 14.0, 11.0, 13.0, 10.0, 22.0, 17.0, 25.0, 33.0, 36.0, 43.0, 52.0, 55.0, 58.0, 51.0, 55.0, 54.0, 48.0, 43.0, 51.0, 62.0, 38.0, 49.0, 25.0, 26.0, 22.0, 22.0, 17.0, 11.0, 13.0, 13.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.578125, -6.33642578125, -6.0947265625, -5.85302734375, -5.611328125, -5.36962890625, -5.1279296875, -4.88623046875, -4.64453125, -4.40283203125, -4.1611328125, -3.91943359375, -3.677734375, -3.43603515625, -3.1943359375, -2.95263671875, -2.7109375, -2.46923828125, -2.2275390625, -1.98583984375, -1.744140625, -1.50244140625, -1.2607421875, -1.01904296875, -0.77734375, -0.53564453125, -0.2939453125, -0.05224609375, 0.189453125, 0.43115234375, 0.6728515625, 0.91455078125, 1.15625, 1.39794921875, 1.6396484375, 1.88134765625, 2.123046875, 2.36474609375, 2.6064453125, 2.84814453125, 3.08984375, 3.33154296875, 3.5732421875, 3.81494140625, 4.056640625, 4.29833984375, 4.5400390625, 4.78173828125, 5.0234375, 5.26513671875, 5.5068359375, 5.74853515625, 5.990234375, 6.23193359375, 6.4736328125, 6.71533203125, 6.95703125, 7.19873046875, 7.4404296875, 7.68212890625, 7.923828125, 8.16552734375, 8.4072265625, 8.64892578125, 8.890625]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 8.0, 6.0, 3.0, 10.0, 9.0, 18.0, 27.0, 37.0, 43.0, 73.0, 119.0, 185.0, 266.0, 452.0, 736.0, 1250.0, 1995.0, 3315.0, 5540.0, 9569.0, 16791.0, 30733.0, 60585.0, 130427.0, 352279.0, 234638.0, 95739.0, 46347.0, 24503.0, 13438.0, 7729.0, 4667.0, 2640.0, 1656.0, 1023.0, 607.0, 394.0, 240.0, 150.0, 96.0, 61.0, 39.0, 37.0, 21.0, 18.0, 12.0, 5.0, 9.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-1.517578125, -1.46832275390625, -1.4190673828125, -1.36981201171875, -1.320556640625, -1.27130126953125, -1.2220458984375, -1.17279052734375, -1.12353515625, -1.07427978515625, -1.0250244140625, -0.97576904296875, -0.926513671875, -0.87725830078125, -0.8280029296875, -0.77874755859375, -0.7294921875, -0.68023681640625, -0.6309814453125, -0.58172607421875, -0.532470703125, -0.48321533203125, -0.4339599609375, -0.38470458984375, -0.33544921875, -0.28619384765625, -0.2369384765625, -0.18768310546875, -0.138427734375, -0.08917236328125, -0.0399169921875, 0.00933837890625, 0.05859375, 0.10784912109375, 0.1571044921875, 0.20635986328125, 0.255615234375, 0.30487060546875, 0.3541259765625, 0.40338134765625, 0.45263671875, 0.50189208984375, 0.5511474609375, 0.60040283203125, 0.649658203125, 0.69891357421875, 0.7481689453125, 0.79742431640625, 0.8466796875, 0.89593505859375, 0.9451904296875, 0.99444580078125, 1.043701171875, 1.09295654296875, 1.1422119140625, 1.19146728515625, 1.24072265625, 1.28997802734375, 1.3392333984375, 1.38848876953125, 1.437744140625, 1.48699951171875, 1.5362548828125, 1.58551025390625, 1.634765625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 8.0, 10.0, 9.0, 8.0, 10.0, 10.0, 11.0, 9.0, 15.0, 11.0, 19.0, 24.0, 27.0, 27.0, 39.0, 34.0, 36.0, 42.0, 40.0, 29.0, 40.0, 31.0, 1067.0, 35.0, 39.0, 31.0, 31.0, 29.0, 34.0, 29.0, 21.0, 40.0, 29.0, 18.0, 15.0, 15.0, 17.0, 9.0, 11.0, 12.0, 8.0, 6.0, 8.0, 11.0, 4.0, 7.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.505859375, -3.39508056640625, -3.2843017578125, -3.17352294921875, -3.062744140625, -2.95196533203125, -2.8411865234375, -2.73040771484375, -2.61962890625, -2.50885009765625, -2.3980712890625, -2.28729248046875, -2.176513671875, -2.06573486328125, -1.9549560546875, -1.84417724609375, -1.7333984375, -1.62261962890625, -1.5118408203125, -1.40106201171875, -1.290283203125, -1.17950439453125, -1.0687255859375, -0.95794677734375, -0.84716796875, -0.73638916015625, -0.6256103515625, -0.51483154296875, -0.404052734375, -0.29327392578125, -0.1824951171875, -0.07171630859375, 0.0390625, 0.14984130859375, 0.2606201171875, 0.37139892578125, 0.482177734375, 0.59295654296875, 0.7037353515625, 0.81451416015625, 0.92529296875, 1.03607177734375, 1.1468505859375, 1.25762939453125, 1.368408203125, 1.47918701171875, 1.5899658203125, 1.70074462890625, 1.8115234375, 1.92230224609375, 2.0330810546875, 2.14385986328125, 2.254638671875, 2.36541748046875, 2.4761962890625, 2.58697509765625, 2.69775390625, 2.80853271484375, 2.9193115234375, 3.03009033203125, 3.140869140625, 3.25164794921875, 3.3624267578125, 3.47320556640625, 3.583984375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [5.0, 7.0, 3.0, 13.0, 9.0, 13.0, 19.0, 33.0, 36.0, 56.0, 87.0, 104.0, 168.0, 203.0, 298.0, 440.0, 582.0, 838.0, 1144.0, 1582.0, 2255.0, 3218.0, 4434.0, 6294.0, 8935.0, 13213.0, 19828.0, 30285.0, 47059.0, 75228.0, 129871.0, 1325561.0, 169406.0, 91320.0, 55593.0, 35365.0, 23133.0, 15158.0, 10421.0, 7089.0, 5132.0, 3663.0, 2597.0, 1831.0, 1331.0, 944.0, 693.0, 504.0, 321.0, 244.0, 167.0, 133.0, 99.0, 63.0, 42.0, 23.0, 18.0, 15.0, 11.0, 4.0, 3.0, 3.0, 4.0, 1.0], "bins": [-0.99365234375, -0.9622879028320312, -0.9309234619140625, -0.8995590209960938, -0.868194580078125, -0.8368301391601562, -0.8054656982421875, -0.7741012573242188, -0.74273681640625, -0.7113723754882812, -0.6800079345703125, -0.6486434936523438, -0.617279052734375, -0.5859146118164062, -0.5545501708984375, -0.5231857299804688, -0.4918212890625, -0.46045684814453125, -0.4290924072265625, -0.39772796630859375, -0.366363525390625, -0.33499908447265625, -0.3036346435546875, -0.27227020263671875, -0.24090576171875, -0.20954132080078125, -0.1781768798828125, -0.14681243896484375, -0.115447998046875, -0.08408355712890625, -0.0527191162109375, -0.02135467529296875, 0.010009765625, 0.04137420654296875, 0.0727386474609375, 0.10410308837890625, 0.135467529296875, 0.16683197021484375, 0.1981964111328125, 0.22956085205078125, 0.26092529296875, 0.29228973388671875, 0.3236541748046875, 0.35501861572265625, 0.386383056640625, 0.41774749755859375, 0.4491119384765625, 0.48047637939453125, 0.5118408203125, 0.5432052612304688, 0.5745697021484375, 0.6059341430664062, 0.637298583984375, 0.6686630249023438, 0.7000274658203125, 0.7313919067382812, 0.76275634765625, 0.7941207885742188, 0.8254852294921875, 0.8568496704101562, 0.888214111328125, 0.9195785522460938, 0.9509429931640625, 0.9823074340820312, 1.013671875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 5.0, 2.0, 2.0, 1.0, 4.0, 6.0, 6.0, 10.0, 13.0, 6.0, 15.0, 21.0, 32.0, 31.0, 55.0, 51.0, 73.0, 69.0, 79.0, 92.0, 64.0, 73.0, 64.0, 39.0, 41.0, 30.0, 19.0, 17.0, 17.0, 12.0, 13.0, 11.0, 9.0, 4.0, 3.0, 1.0, 3.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007805824279785156, -0.0007577091455459595, -0.0007348358631134033, -0.0007119625806808472, -0.000689089298248291, -0.0006662160158157349, -0.0006433427333831787, -0.0006204694509506226, -0.0005975961685180664, -0.0005747228860855103, -0.0005518496036529541, -0.000528976321220398, -0.0005061030387878418, -0.00048322975635528564, -0.0004603564739227295, -0.00043748319149017334, -0.0004146099090576172, -0.00039173662662506104, -0.0003688633441925049, -0.00034599006175994873, -0.0003231167793273926, -0.0003002434968948364, -0.0002773702144622803, -0.0002544969320297241, -0.00023162364959716797, -0.00020875036716461182, -0.00018587708473205566, -0.0001630038022994995, -0.00014013051986694336, -0.00011725723743438721, -9.438395500183105e-05, -7.15106725692749e-05, -4.863739013671875e-05, -2.5764107704162598e-05, -2.8908252716064453e-06, 1.9982457160949707e-05, 4.285573959350586e-05, 6.572902202606201e-05, 8.860230445861816e-05, 0.00011147558689117432, 0.00013434886932373047, 0.00015722215175628662, 0.00018009543418884277, 0.00020296871662139893, 0.00022584199905395508, 0.00024871528148651123, 0.0002715885639190674, 0.00029446184635162354, 0.0003173351287841797, 0.00034020841121673584, 0.000363081693649292, 0.00038595497608184814, 0.0004088282585144043, 0.00043170154094696045, 0.0004545748233795166, 0.00047744810581207275, 0.0005003213882446289, 0.0005231946706771851, 0.0005460679531097412, 0.0005689412355422974, 0.0005918145179748535, 0.0006146878004074097, 0.0006375610828399658, 0.000660434365272522, 0.0006833076477050781]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 6.0, 8.0, 9.0, 11.0, 11.0, 16.0, 10.0, 36.0, 46.0, 71.0, 112.0, 220.0, 399.0, 1419.0, 1039656.0, 5402.0, 501.0, 234.0, 129.0, 81.0, 53.0, 23.0, 29.0, 17.0, 15.0, 7.0, 6.0, 7.0, 1.0, 6.0, 3.0, 2.0, 0.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0162353515625, -0.015625715255737305, -0.01501607894897461, -0.014406442642211914, -0.013796806335449219, -0.013187170028686523, -0.012577533721923828, -0.011967897415161133, -0.011358261108398438, -0.010748624801635742, -0.010138988494873047, -0.009529352188110352, -0.008919715881347656, -0.008310079574584961, -0.007700443267822266, -0.00709080696105957, -0.006481170654296875, -0.00587153434753418, -0.005261898040771484, -0.004652261734008789, -0.004042625427246094, -0.0034329891204833984, -0.002823352813720703, -0.002213716506958008, -0.0016040802001953125, -0.0009944438934326172, -0.0003848075866699219, 0.00022482872009277344, 0.0008344650268554688, 0.001444101333618164, 0.0020537376403808594, 0.0026633739471435547, 0.00327301025390625, 0.0038826465606689453, 0.004492282867431641, 0.005101919174194336, 0.005711555480957031, 0.0063211917877197266, 0.006930828094482422, 0.007540464401245117, 0.008150100708007812, 0.008759737014770508, 0.009369373321533203, 0.009979009628295898, 0.010588645935058594, 0.011198282241821289, 0.011807918548583984, 0.01241755485534668, 0.013027191162109375, 0.01363682746887207, 0.014246463775634766, 0.014856100082397461, 0.015465736389160156, 0.01607537269592285, 0.016685009002685547, 0.017294645309448242, 0.017904281616210938, 0.018513917922973633, 0.019123554229736328, 0.019733190536499023, 0.02034282684326172, 0.020952463150024414, 0.02156209945678711, 0.022171735763549805, 0.0227813720703125]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 74.0, 669.0, 257.0, 12.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0031098618637770414, -0.00304033188149333, -0.002970801666378975, -0.00290127145126462, -0.0028317414689809084, -0.002762211486697197, -0.002692681271582842, -0.002623151056468487, -0.0025536210741847754, -0.002484091091901064, -0.002414560876786709, -0.0023450306616723537, -0.0022755006793886423, -0.002205970697104931, -0.002136440481990576, -0.0020669102668762207, -0.0019973802845925093, -0.001927850185893476, -0.0018583200871944427, -0.0017887899884954095, -0.0017192598897963762, -0.001649729791097343, -0.0015801996923983097, -0.0015106695936992764, -0.0014411394950002432, -0.00137160939630121, -0.0013020792976021767, -0.0012325491989031434, -0.0011630191002041101, -0.0010934890015050769, -0.0010239589028060436, -0.0009544288041070104, -0.0008848987054079771, -0.0008153686067089438, -0.0007458385080099106, -0.0006763084093108773, -0.0006067783106118441, -0.0005372482119128108, -0.00046771811321377754, -0.0003981880145147443, -0.000328657915815711, -0.00025912781711667776, -0.0001895977184176445, -0.00012006761971861124, -5.053752101957798e-05, 1.899257767945528e-05, 8.852267637848854e-05, 0.0001580527750775218, 0.00022758287377655506, 0.0002971129724755883, 0.0003666430711746216, 0.00043617316987365484, 0.0005057032685726881, 0.0005752333672717214, 0.0006447634659707546, 0.0007142935646697879, 0.0007838236633688211, 0.0008533537620678544, 0.0009228838607668877, 0.000992413959465921, 0.0010619440581649542, 0.0011314741568639874, 0.0012010042555630207, 0.001270534354262054, 0.0013400644529610872]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 1.0, 5.0, 4.0, 4.0, 8.0, 3.0, 6.0, 7.0, 14.0, 12.0, 12.0, 13.0, 22.0, 17.0, 26.0, 26.0, 21.0, 21.0, 28.0, 45.0, 42.0, 30.0, 29.0, 30.0, 44.0, 33.0, 31.0, 41.0, 35.0, 25.0, 30.0, 36.0, 33.0, 26.0, 33.0, 24.0, 20.0, 19.0, 31.0, 23.0, 14.0, 14.0, 11.0, 16.0, 12.0, 7.0, 7.0, 2.0, 2.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003173351287841797, -0.000307643786072731, -0.00029795244336128235, -0.0002882611006498337, -0.000278569757938385, -0.00026887841522693634, -0.00025918707251548767, -0.000249495729804039, -0.00023980438709259033, -0.00023011304438114166, -0.000220421701669693, -0.00021073035895824432, -0.00020103901624679565, -0.00019134767353534698, -0.00018165633082389832, -0.00017196498811244965, -0.00016227364540100098, -0.0001525823026895523, -0.00014289095997810364, -0.00013319961726665497, -0.0001235082745552063, -0.00011381693184375763, -0.00010412558913230896, -9.443424642086029e-05, -8.474290370941162e-05, -7.505156099796295e-05, -6.536021828651428e-05, -5.566887557506561e-05, -4.597753286361694e-05, -3.6286190152168274e-05, -2.6594847440719604e-05, -1.6903504729270935e-05, -7.212162017822266e-06, 2.479180693626404e-06, 1.2170523405075073e-05, 2.1861866116523743e-05, 3.155320882797241e-05, 4.124455153942108e-05, 5.093589425086975e-05, 6.062723696231842e-05, 7.031857967376709e-05, 8.000992238521576e-05, 8.970126509666443e-05, 9.93926078081131e-05, 0.00010908395051956177, 0.00011877529323101044, 0.0001284666359424591, 0.00013815797865390778, 0.00014784932136535645, 0.00015754066407680511, 0.00016723200678825378, 0.00017692334949970245, 0.00018661469221115112, 0.0001963060349225998, 0.00020599737763404846, 0.00021568872034549713, 0.0002253800630569458, 0.00023507140576839447, 0.00024476274847984314, 0.0002544540911912918, 0.0002641454339027405, 0.00027383677661418915, 0.0002835281193256378, 0.0002932194620370865, 0.00030291080474853516]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 14.0, 11.0, 13.0, 10.0, 22.0, 17.0, 25.0, 33.0, 36.0, 43.0, 52.0, 55.0, 58.0, 51.0, 55.0, 54.0, 48.0, 43.0, 51.0, 62.0, 38.0, 49.0, 25.0, 26.0, 22.0, 22.0, 17.0, 11.0, 13.0, 13.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.578125, -6.33642578125, -6.0947265625, -5.85302734375, -5.611328125, -5.36962890625, -5.1279296875, -4.88623046875, -4.64453125, -4.40283203125, -4.1611328125, -3.91943359375, -3.677734375, -3.43603515625, -3.1943359375, -2.95263671875, -2.7109375, -2.46923828125, -2.2275390625, -1.98583984375, -1.744140625, -1.50244140625, -1.2607421875, -1.01904296875, -0.77734375, -0.53564453125, -0.2939453125, -0.05224609375, 0.189453125, 0.43115234375, 0.6728515625, 0.91455078125, 1.15625, 1.39794921875, 1.6396484375, 1.88134765625, 2.123046875, 2.36474609375, 2.6064453125, 2.84814453125, 3.08984375, 3.33154296875, 3.5732421875, 3.81494140625, 4.056640625, 4.29833984375, 4.5400390625, 4.78173828125, 5.0234375, 5.26513671875, 5.5068359375, 5.74853515625, 5.990234375, 6.23193359375, 6.4736328125, 6.71533203125, 6.95703125, 7.19873046875, 7.4404296875, 7.68212890625, 7.923828125, 8.16552734375, 8.4072265625, 8.64892578125, 8.890625]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 7.0, 2.0, 7.0, 9.0, 9.0, 9.0, 29.0, 25.0, 51.0, 59.0, 113.0, 163.0, 220.0, 347.0, 511.0, 850.0, 1352.0, 2563.0, 5228.0, 12490.0, 36839.0, 162991.0, 589000.0, 172510.0, 38644.0, 12717.0, 5337.0, 2621.0, 1411.0, 893.0, 530.0, 340.0, 232.0, 164.0, 98.0, 52.0, 38.0, 36.0, 21.0, 16.0, 14.0, 4.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0390625, -3.89227294921875, -3.7454833984375, -3.59869384765625, -3.451904296875, -3.30511474609375, -3.1583251953125, -3.01153564453125, -2.86474609375, -2.71795654296875, -2.5711669921875, -2.42437744140625, -2.277587890625, -2.13079833984375, -1.9840087890625, -1.83721923828125, -1.6904296875, -1.54364013671875, -1.3968505859375, -1.25006103515625, -1.103271484375, -0.95648193359375, -0.8096923828125, -0.66290283203125, -0.51611328125, -0.36932373046875, -0.2225341796875, -0.07574462890625, 0.071044921875, 0.21783447265625, 0.3646240234375, 0.51141357421875, 0.658203125, 0.80499267578125, 0.9517822265625, 1.09857177734375, 1.245361328125, 1.39215087890625, 1.5389404296875, 1.68572998046875, 1.83251953125, 1.97930908203125, 2.1260986328125, 2.27288818359375, 2.419677734375, 2.56646728515625, 2.7132568359375, 2.86004638671875, 3.0068359375, 3.15362548828125, 3.3004150390625, 3.44720458984375, 3.593994140625, 3.74078369140625, 3.8875732421875, 4.03436279296875, 4.18115234375, 4.32794189453125, 4.4747314453125, 4.62152099609375, 4.768310546875, 4.91510009765625, 5.0618896484375, 5.20867919921875, 5.35546875]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 4.0, 4.0, 6.0, 6.0, 12.0, 10.0, 10.0, 12.0, 14.0, 12.0, 14.0, 18.0, 18.0, 35.0, 17.0, 22.0, 39.0, 37.0, 44.0, 33.0, 32.0, 44.0, 150.0, 1841.0, 136.0, 59.0, 42.0, 45.0, 26.0, 17.0, 29.0, 34.0, 23.0, 27.0, 27.0, 16.0, 20.0, 23.0, 11.0, 12.0, 12.0, 11.0, 9.0, 4.0, 5.0, 4.0, 8.0, 3.0, 6.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.109375, -15.562744140625, -15.01611328125, -14.469482421875, -13.9228515625, -13.376220703125, -12.82958984375, -12.282958984375, -11.736328125, -11.189697265625, -10.64306640625, -10.096435546875, -9.5498046875, -9.003173828125, -8.45654296875, -7.909912109375, -7.36328125, -6.816650390625, -6.27001953125, -5.723388671875, -5.1767578125, -4.630126953125, -4.08349609375, -3.536865234375, -2.990234375, -2.443603515625, -1.89697265625, -1.350341796875, -0.8037109375, -0.257080078125, 0.28955078125, 0.836181640625, 1.3828125, 1.929443359375, 2.47607421875, 3.022705078125, 3.5693359375, 4.115966796875, 4.66259765625, 5.209228515625, 5.755859375, 6.302490234375, 6.84912109375, 7.395751953125, 7.9423828125, 8.489013671875, 9.03564453125, 9.582275390625, 10.12890625, 10.675537109375, 11.22216796875, 11.768798828125, 12.3154296875, 12.862060546875, 13.40869140625, 13.955322265625, 14.501953125, 15.048583984375, 15.59521484375, 16.141845703125, 16.6884765625, 17.235107421875, 17.78173828125, 18.328369140625, 18.875]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 4.0, 6.0, 6.0, 5.0, 8.0, 3.0, 4.0, 12.0, 13.0, 10.0, 17.0, 17.0, 16.0, 18.0, 31.0, 31.0, 37.0, 61.0, 75.0, 92.0, 152.0, 236.0, 423.0, 1080.0, 11133.0, 3073677.0, 55294.0, 1787.0, 537.0, 266.0, 165.0, 121.0, 88.0, 53.0, 36.0, 33.0, 28.0, 19.0, 18.0, 16.0, 12.0, 13.0, 8.0, 12.0, 12.0, 4.0, 8.0, 3.0, 4.0, 7.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-31.03125, -30.109375, -29.1875, -28.265625, -27.34375, -26.421875, -25.5, -24.578125, -23.65625, -22.734375, -21.8125, -20.890625, -19.96875, -19.046875, -18.125, -17.203125, -16.28125, -15.359375, -14.4375, -13.515625, -12.59375, -11.671875, -10.75, -9.828125, -8.90625, -7.984375, -7.0625, -6.140625, -5.21875, -4.296875, -3.375, -2.453125, -1.53125, -0.609375, 0.3125, 1.234375, 2.15625, 3.078125, 4.0, 4.921875, 5.84375, 6.765625, 7.6875, 8.609375, 9.53125, 10.453125, 11.375, 12.296875, 13.21875, 14.140625, 15.0625, 15.984375, 16.90625, 17.828125, 18.75, 19.671875, 20.59375, 21.515625, 22.4375, 23.359375, 24.28125, 25.203125, 26.125, 27.046875, 27.96875]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 30.0, 54.0, 113.0, 194.0, 231.0, 187.0, 112.0, 58.0, 17.0, 7.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-34.9527473449707, -34.24595260620117, -33.539154052734375, -32.832359313964844, -32.12556076049805, -31.418766021728516, -30.71196937561035, -30.005172729492188, -29.298376083374023, -28.59157943725586, -27.884782791137695, -27.17798614501953, -26.47119140625, -25.764394760131836, -25.057598114013672, -24.350801467895508, -23.644004821777344, -22.93720817565918, -22.230411529541016, -21.523616790771484, -20.81682014465332, -20.110023498535156, -19.403226852416992, -18.696430206298828, -17.989635467529297, -17.282838821411133, -16.57604217529297, -15.869246482849121, -15.162449836730957, -14.45565414428711, -13.748857498168945, -13.042060852050781, -12.335264205932617, -11.628467559814453, -10.921671867370605, -10.214875221252441, -9.508078575134277, -8.80128288269043, -8.094486236572266, -7.387689590454102, -6.680893421173096, -5.97409725189209, -5.267300605773926, -4.56050443649292, -3.853708028793335, -3.14691162109375, -2.440115451812744, -1.73331880569458, -1.0265226364135742, -0.31972628831863403, 0.38707005977630615, 1.0938663482666016, 1.8006627559661865, 2.5074591636657715, 3.2142553329467773, 3.9210519790649414, 4.627848148345947, 5.334644317626953, 6.041440963745117, 6.748237133026123, 7.455033302307129, 8.161829948425293, 8.86862564086914, 9.575422286987305, 10.282218933105469]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 2.0, 2.0, 6.0, 11.0, 16.0, 9.0, 11.0, 20.0, 12.0, 16.0, 21.0, 35.0, 30.0, 28.0, 30.0, 47.0, 33.0, 34.0, 44.0, 43.0, 44.0, 49.0, 41.0, 34.0, 39.0, 46.0, 41.0, 26.0, 30.0, 26.0, 23.0, 24.0, 20.0, 14.0, 13.0, 10.0, 10.0, 10.0, 16.0, 8.0, 7.0, 5.0, 8.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0], "bins": [-62.84747314453125, -60.8697509765625, -58.892024993896484, -56.914302825927734, -54.936580657958984, -52.95885467529297, -50.98113250732422, -49.00341033935547, -47.02568817138672, -45.04796600341797, -43.07024002075195, -41.0925178527832, -39.11479568481445, -37.13706970214844, -35.15934753417969, -33.18162536621094, -31.203899383544922, -29.22617530822754, -27.24845314025879, -25.270729064941406, -23.293006896972656, -21.315282821655273, -19.33755874633789, -17.35983657836914, -15.382112503051758, -13.404389381408691, -11.426666259765625, -9.448942184448242, -7.471219062805176, -5.493495941162109, -3.5157718658447266, -1.5380487442016602, 0.4396781921386719, 2.4174015522003174, 4.395124912261963, 6.3728485107421875, 8.350571632385254, 10.32829475402832, 12.306018829345703, 14.28374195098877, 16.261465072631836, 18.23918914794922, 20.21691131591797, 22.19463539123535, 24.172359466552734, 26.150081634521484, 28.127805709838867, 30.10552978515625, 32.083251953125, 34.06097412109375, 36.038700103759766, 38.016422271728516, 39.994144439697266, 41.97187042236328, 43.94959259033203, 45.92731475830078, 47.90503692626953, 49.88275909423828, 51.8604850769043, 53.83820724487305, 55.8159294128418, 57.79365539550781, 59.77137756347656, 61.74909973144531, 63.72682571411133]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 9.0, 11.0, 12.0, 14.0, 12.0, 22.0, 22.0, 27.0, 40.0, 30.0, 52.0, 62.0, 38.0, 61.0, 50.0, 58.0, 48.0, 58.0, 45.0, 52.0, 46.0, 41.0, 34.0, 36.0, 25.0, 20.0, 18.0, 12.0, 16.0, 8.0, 8.0, 4.0, 6.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.71484375, -6.47271728515625, -6.2305908203125, -5.98846435546875, -5.746337890625, -5.50421142578125, -5.2620849609375, -5.01995849609375, -4.77783203125, -4.53570556640625, -4.2935791015625, -4.05145263671875, -3.809326171875, -3.56719970703125, -3.3250732421875, -3.08294677734375, -2.8408203125, -2.59869384765625, -2.3565673828125, -2.11444091796875, -1.872314453125, -1.63018798828125, -1.3880615234375, -1.14593505859375, -0.90380859375, -0.66168212890625, -0.4195556640625, -0.17742919921875, 0.064697265625, 0.30682373046875, 0.5489501953125, 0.79107666015625, 1.033203125, 1.27532958984375, 1.5174560546875, 1.75958251953125, 2.001708984375, 2.24383544921875, 2.4859619140625, 2.72808837890625, 2.97021484375, 3.21234130859375, 3.4544677734375, 3.69659423828125, 3.938720703125, 4.18084716796875, 4.4229736328125, 4.66510009765625, 4.9072265625, 5.14935302734375, 5.3914794921875, 5.63360595703125, 5.875732421875, 6.11785888671875, 6.3599853515625, 6.60211181640625, 6.84423828125, 7.08636474609375, 7.3284912109375, 7.57061767578125, 7.812744140625, 8.05487060546875, 8.2969970703125, 8.53912353515625, 8.78125]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 6.0, 4.0, 5.0, 15.0, 9.0, 21.0, 20.0, 38.0, 43.0, 53.0, 105.0, 155.0, 384.0, 988.0, 3468.0, 16770.0, 130084.0, 1333955.0, 2338937.0, 326879.0, 33467.0, 6077.0, 1621.0, 564.0, 248.0, 109.0, 79.0, 52.0, 36.0, 18.0, 19.0, 13.0, 11.0, 12.0, 8.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.84375, -11.408203125, -10.97265625, -10.537109375, -10.1015625, -9.666015625, -9.23046875, -8.794921875, -8.359375, -7.923828125, -7.48828125, -7.052734375, -6.6171875, -6.181640625, -5.74609375, -5.310546875, -4.875, -4.439453125, -4.00390625, -3.568359375, -3.1328125, -2.697265625, -2.26171875, -1.826171875, -1.390625, -0.955078125, -0.51953125, -0.083984375, 0.3515625, 0.787109375, 1.22265625, 1.658203125, 2.09375, 2.529296875, 2.96484375, 3.400390625, 3.8359375, 4.271484375, 4.70703125, 5.142578125, 5.578125, 6.013671875, 6.44921875, 6.884765625, 7.3203125, 7.755859375, 8.19140625, 8.626953125, 9.0625, 9.498046875, 9.93359375, 10.369140625, 10.8046875, 11.240234375, 11.67578125, 12.111328125, 12.546875, 12.982421875, 13.41796875, 13.853515625, 14.2890625, 14.724609375, 15.16015625, 15.595703125, 16.03125]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 6.0, 6.0, 9.0, 12.0, 11.0, 11.0, 18.0, 32.0, 33.0, 31.0, 60.0, 89.0, 96.0, 134.0, 195.0, 229.0, 314.0, 415.0, 445.0, 413.0, 369.0, 288.0, 181.0, 165.0, 132.0, 87.0, 67.0, 55.0, 33.0, 36.0, 23.0, 18.0, 15.0, 11.0, 9.0, 4.0, 8.0, 6.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-17.734375, -17.251708984375, -16.76904296875, -16.286376953125, -15.8037109375, -15.321044921875, -14.83837890625, -14.355712890625, -13.873046875, -13.390380859375, -12.90771484375, -12.425048828125, -11.9423828125, -11.459716796875, -10.97705078125, -10.494384765625, -10.01171875, -9.529052734375, -9.04638671875, -8.563720703125, -8.0810546875, -7.598388671875, -7.11572265625, -6.633056640625, -6.150390625, -5.667724609375, -5.18505859375, -4.702392578125, -4.2197265625, -3.737060546875, -3.25439453125, -2.771728515625, -2.2890625, -1.806396484375, -1.32373046875, -0.841064453125, -0.3583984375, 0.124267578125, 0.60693359375, 1.089599609375, 1.572265625, 2.054931640625, 2.53759765625, 3.020263671875, 3.5029296875, 3.985595703125, 4.46826171875, 4.950927734375, 5.43359375, 5.916259765625, 6.39892578125, 6.881591796875, 7.3642578125, 7.846923828125, 8.32958984375, 8.812255859375, 9.294921875, 9.777587890625, 10.26025390625, 10.742919921875, 11.2255859375, 11.708251953125, 12.19091796875, 12.673583984375, 13.15625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 6.0, 4.0, 8.0, 11.0, 20.0, 27.0, 33.0, 59.0, 59.0, 93.0, 125.0, 202.0, 339.0, 807.0, 17193.0, 4067243.0, 105476.0, 1494.0, 392.0, 204.0, 142.0, 89.0, 62.0, 46.0, 38.0, 32.0, 17.0, 16.0, 9.0, 10.0, 7.0, 8.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.25, -61.7451171875, -59.240234375, -56.7353515625, -54.23046875, -51.7255859375, -49.220703125, -46.7158203125, -44.2109375, -41.7060546875, -39.201171875, -36.6962890625, -34.19140625, -31.6865234375, -29.181640625, -26.6767578125, -24.171875, -21.6669921875, -19.162109375, -16.6572265625, -14.15234375, -11.6474609375, -9.142578125, -6.6376953125, -4.1328125, -1.6279296875, 0.876953125, 3.3818359375, 5.88671875, 8.3916015625, 10.896484375, 13.4013671875, 15.90625, 18.4111328125, 20.916015625, 23.4208984375, 25.92578125, 28.4306640625, 30.935546875, 33.4404296875, 35.9453125, 38.4501953125, 40.955078125, 43.4599609375, 45.96484375, 48.4697265625, 50.974609375, 53.4794921875, 55.984375, 58.4892578125, 60.994140625, 63.4990234375, 66.00390625, 68.5087890625, 71.013671875, 73.5185546875, 76.0234375, 78.5283203125, 81.033203125, 83.5380859375, 86.04296875, 88.5478515625, 91.052734375, 93.5576171875, 96.0625]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [2.0, 4.0, 35.0, 187.0, 404.0, 276.0, 99.0, 12.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.736621856689453, -23.39528465270996, -17.05394744873047, -10.71261215209961, -4.371274948120117, 1.970062255859375, 8.311397552490234, 14.65273666381836, 20.99407196044922, 27.33540916442871, 33.6767463684082, 40.01808166503906, 46.35942077636719, 52.70075607299805, 59.042091369628906, 65.38343048095703, 71.72476196289062, 78.06610107421875, 84.40743255615234, 90.74877166748047, 97.0901107788086, 103.43144226074219, 109.77278137207031, 116.11412048339844, 122.45545959472656, 128.7967987060547, 135.1381378173828, 141.47946166992188, 147.82080078125, 154.16213989257812, 160.50347900390625, 166.84481811523438, 173.18614196777344, 179.52748107910156, 185.8688201904297, 192.21014404296875, 198.55148315429688, 204.892822265625, 211.23416137695312, 217.57550048828125, 223.91683959960938, 230.2581787109375, 236.59951782226562, 242.94085693359375, 249.2821807861328, 255.62351989746094, 261.96484375, 268.30621337890625, 274.64752197265625, 280.9888610839844, 287.3302001953125, 293.6715393066406, 300.01287841796875, 306.3542175292969, 312.695556640625, 319.036865234375, 325.37823486328125, 331.7195739746094, 338.0609130859375, 344.4022521972656, 350.74359130859375, 357.0849304199219, 363.42626953125, 369.767578125, 376.1089172363281]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 3.0, 2.0, 4.0, 3.0, 8.0, 3.0, 5.0, 11.0, 11.0, 15.0, 11.0, 14.0, 16.0, 12.0, 17.0, 18.0, 28.0, 40.0, 30.0, 46.0, 25.0, 39.0, 29.0, 35.0, 41.0, 31.0, 33.0, 40.0, 43.0, 29.0, 50.0, 29.0, 34.0, 35.0, 28.0, 17.0, 23.0, 20.0, 18.0, 12.0, 16.0, 16.0, 21.0, 13.0, 5.0, 13.0, 4.0, 5.0, 0.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-48.63189697265625, -47.01860427856445, -45.405311584472656, -43.79201889038086, -42.17872619628906, -40.56543731689453, -38.952144622802734, -37.33885192871094, -35.72555923461914, -34.112266540527344, -32.49897384643555, -30.885683059692383, -29.272390365600586, -27.65909767150879, -26.045806884765625, -24.432514190673828, -22.81922149658203, -21.205928802490234, -19.592636108398438, -17.979345321655273, -16.366052627563477, -14.75275993347168, -13.1394681930542, -11.526176452636719, -9.912883758544922, -8.299591064453125, -6.6862993240356445, -5.073007106781006, -3.459714889526367, -1.8464221954345703, -0.23313045501708984, 1.3801612854003906, 2.9934539794921875, 4.606746196746826, 6.220038414001465, 7.8333306312561035, 9.446622848510742, 11.059915542602539, 12.67320728302002, 14.2864990234375, 15.899791717529297, 17.513084411621094, 19.12637710571289, 20.739667892456055, 22.35296058654785, 23.96625328063965, 25.579544067382812, 27.19283676147461, 28.806129455566406, 30.419422149658203, 32.03271484375, 33.6460075378418, 35.259300231933594, 36.872589111328125, 38.48588180541992, 40.09917449951172, 41.712467193603516, 43.32575988769531, 44.93905258178711, 46.552345275878906, 48.16563415527344, 49.7789306640625, 51.39221954345703, 53.00551223754883, 54.618804931640625]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 10.0, 14.0, 12.0, 14.0, 17.0, 23.0, 28.0, 34.0, 39.0, 44.0, 51.0, 48.0, 61.0, 50.0, 48.0, 47.0, 39.0, 53.0, 51.0, 51.0, 46.0, 34.0, 39.0, 29.0, 21.0, 20.0, 17.0, 15.0, 13.0, 6.0, 8.0, 8.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.98828125, -6.74896240234375, -6.5096435546875, -6.27032470703125, -6.031005859375, -5.79168701171875, -5.5523681640625, -5.31304931640625, -5.07373046875, -4.83441162109375, -4.5950927734375, -4.35577392578125, -4.116455078125, -3.87713623046875, -3.6378173828125, -3.39849853515625, -3.1591796875, -2.91986083984375, -2.6805419921875, -2.44122314453125, -2.201904296875, -1.96258544921875, -1.7232666015625, -1.48394775390625, -1.24462890625, -1.00531005859375, -0.7659912109375, -0.52667236328125, -0.287353515625, -0.04803466796875, 0.1912841796875, 0.43060302734375, 0.669921875, 0.90924072265625, 1.1485595703125, 1.38787841796875, 1.627197265625, 1.86651611328125, 2.1058349609375, 2.34515380859375, 2.58447265625, 2.82379150390625, 3.0631103515625, 3.30242919921875, 3.541748046875, 3.78106689453125, 4.0203857421875, 4.25970458984375, 4.4990234375, 4.73834228515625, 4.9776611328125, 5.21697998046875, 5.456298828125, 5.69561767578125, 5.9349365234375, 6.17425537109375, 6.41357421875, 6.65289306640625, 6.8922119140625, 7.13153076171875, 7.370849609375, 7.61016845703125, 7.8494873046875, 8.08880615234375, 8.328125]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 5.0, 3.0, 4.0, 9.0, 10.0, 15.0, 16.0, 28.0, 35.0, 63.0, 83.0, 123.0, 163.0, 298.0, 460.0, 681.0, 1087.0, 1662.0, 2710.0, 4253.0, 6971.0, 11049.0, 18459.0, 31801.0, 57978.0, 113699.0, 257519.0, 274422.0, 120616.0, 60967.0, 33334.0, 19221.0, 11679.0, 6973.0, 4519.0, 2770.0, 1701.0, 1103.0, 753.0, 438.0, 271.0, 195.0, 141.0, 77.0, 59.0, 45.0, 26.0, 21.0, 14.0, 10.0, 9.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-1.37109375, -1.3269195556640625, -1.282745361328125, -1.2385711669921875, -1.19439697265625, -1.1502227783203125, -1.106048583984375, -1.0618743896484375, -1.0177001953125, -0.9735260009765625, -0.929351806640625, -0.8851776123046875, -0.84100341796875, -0.7968292236328125, -0.752655029296875, -0.7084808349609375, -0.664306640625, -0.6201324462890625, -0.575958251953125, -0.5317840576171875, -0.48760986328125, -0.4434356689453125, -0.399261474609375, -0.3550872802734375, -0.3109130859375, -0.2667388916015625, -0.222564697265625, -0.1783905029296875, -0.13421630859375, -0.0900421142578125, -0.045867919921875, -0.0016937255859375, 0.04248046875, 0.0866546630859375, 0.130828857421875, 0.1750030517578125, 0.21917724609375, 0.2633514404296875, 0.307525634765625, 0.3516998291015625, 0.3958740234375, 0.4400482177734375, 0.484222412109375, 0.5283966064453125, 0.57257080078125, 0.6167449951171875, 0.660919189453125, 0.7050933837890625, 0.749267578125, 0.7934417724609375, 0.837615966796875, 0.8817901611328125, 0.92596435546875, 0.9701385498046875, 1.014312744140625, 1.0584869384765625, 1.1026611328125, 1.1468353271484375, 1.191009521484375, 1.2351837158203125, 1.27935791015625, 1.3235321044921875, 1.367706298828125, 1.4118804931640625, 1.4560546875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 4.0, 6.0, 11.0, 15.0, 9.0, 14.0, 13.0, 18.0, 19.0, 19.0, 20.0, 28.0, 35.0, 34.0, 33.0, 35.0, 36.0, 41.0, 39.0, 45.0, 1057.0, 35.0, 38.0, 41.0, 38.0, 45.0, 24.0, 28.0, 29.0, 19.0, 25.0, 32.0, 15.0, 19.0, 18.0, 17.0, 13.0, 10.0, 12.0, 7.0, 8.0, 6.0, 8.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.41796875, -3.30548095703125, -3.1929931640625, -3.08050537109375, -2.968017578125, -2.85552978515625, -2.7430419921875, -2.63055419921875, -2.51806640625, -2.40557861328125, -2.2930908203125, -2.18060302734375, -2.068115234375, -1.95562744140625, -1.8431396484375, -1.73065185546875, -1.6181640625, -1.50567626953125, -1.3931884765625, -1.28070068359375, -1.168212890625, -1.05572509765625, -0.9432373046875, -0.83074951171875, -0.71826171875, -0.60577392578125, -0.4932861328125, -0.38079833984375, -0.268310546875, -0.15582275390625, -0.0433349609375, 0.06915283203125, 0.181640625, 0.29412841796875, 0.4066162109375, 0.51910400390625, 0.631591796875, 0.74407958984375, 0.8565673828125, 0.96905517578125, 1.08154296875, 1.19403076171875, 1.3065185546875, 1.41900634765625, 1.531494140625, 1.64398193359375, 1.7564697265625, 1.86895751953125, 1.9814453125, 2.09393310546875, 2.2064208984375, 2.31890869140625, 2.431396484375, 2.54388427734375, 2.6563720703125, 2.76885986328125, 2.88134765625, 2.99383544921875, 3.1063232421875, 3.21881103515625, 3.331298828125, 3.44378662109375, 3.5562744140625, 3.66876220703125, 3.78125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 7.0, 2.0, 6.0, 11.0, 11.0, 16.0, 28.0, 30.0, 47.0, 63.0, 84.0, 121.0, 176.0, 278.0, 373.0, 580.0, 856.0, 1159.0, 1695.0, 2632.0, 3699.0, 5556.0, 8286.0, 12188.0, 18595.0, 28645.0, 45748.0, 75078.0, 136509.0, 1340858.0, 174582.0, 89314.0, 53259.0, 33099.0, 21323.0, 13566.0, 9069.0, 6204.0, 4164.0, 2874.0, 1961.0, 1322.0, 929.0, 658.0, 428.0, 330.0, 218.0, 161.0, 99.0, 88.0, 62.0, 36.0, 8.0, 15.0, 20.0, 6.0, 6.0, 3.0, 2.0, 3.0, 1.0, 3.0], "bins": [-1.0361328125, -1.0034027099609375, -0.970672607421875, -0.9379425048828125, -0.90521240234375, -0.8724822998046875, -0.839752197265625, -0.8070220947265625, -0.7742919921875, -0.7415618896484375, -0.708831787109375, -0.6761016845703125, -0.64337158203125, -0.6106414794921875, -0.577911376953125, -0.5451812744140625, -0.512451171875, -0.4797210693359375, -0.446990966796875, -0.4142608642578125, -0.38153076171875, -0.3488006591796875, -0.316070556640625, -0.2833404541015625, -0.2506103515625, -0.2178802490234375, -0.185150146484375, -0.1524200439453125, -0.11968994140625, -0.0869598388671875, -0.054229736328125, -0.0214996337890625, 0.01123046875, 0.0439605712890625, 0.076690673828125, 0.1094207763671875, 0.14215087890625, 0.1748809814453125, 0.207611083984375, 0.2403411865234375, 0.2730712890625, 0.3058013916015625, 0.338531494140625, 0.3712615966796875, 0.40399169921875, 0.4367218017578125, 0.469451904296875, 0.5021820068359375, 0.534912109375, 0.5676422119140625, 0.600372314453125, 0.6331024169921875, 0.66583251953125, 0.6985626220703125, 0.731292724609375, 0.7640228271484375, 0.7967529296875, 0.8294830322265625, 0.862213134765625, 0.8949432373046875, 0.92767333984375, 0.9604034423828125, 0.993133544921875, 1.0258636474609375, 1.05859375]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 5.0, 7.0, 8.0, 12.0, 14.0, 12.0, 20.0, 29.0, 39.0, 58.0, 69.0, 88.0, 82.0, 102.0, 106.0, 73.0, 60.0, 48.0, 52.0, 26.0, 22.0, 13.0, 14.0, 7.0, 8.0, 8.0, 6.0, 5.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.0008983612060546875, -0.0008749961853027344, -0.0008516311645507812, -0.0008282661437988281, -0.000804901123046875, -0.0007815361022949219, -0.0007581710815429688, -0.0007348060607910156, -0.0007114410400390625, -0.0006880760192871094, -0.0006647109985351562, -0.0006413459777832031, -0.00061798095703125, -0.0005946159362792969, -0.0005712509155273438, -0.0005478858947753906, -0.0005245208740234375, -0.0005011558532714844, -0.00047779083251953125, -0.0004544258117675781, -0.000431060791015625, -0.0004076957702636719, -0.00038433074951171875, -0.0003609657287597656, -0.0003376007080078125, -0.0003142356872558594, -0.00029087066650390625, -0.0002675056457519531, -0.000244140625, -0.00022077560424804688, -0.00019741058349609375, -0.00017404556274414062, -0.0001506805419921875, -0.00012731552124023438, -0.00010395050048828125, -8.058547973632812e-05, -5.7220458984375e-05, -3.3855438232421875e-05, -1.049041748046875e-05, 1.2874603271484375e-05, 3.62396240234375e-05, 5.9604644775390625e-05, 8.296966552734375e-05, 0.00010633468627929688, 0.00012969970703125, 0.00015306472778320312, 0.00017642974853515625, 0.00019979476928710938, 0.0002231597900390625, 0.0002465248107910156, 0.00026988983154296875, 0.0002932548522949219, 0.000316619873046875, 0.0003399848937988281, 0.00036334991455078125, 0.0003867149353027344, 0.0004100799560546875, 0.0004334449768066406, 0.00045680999755859375, 0.0004801750183105469, 0.0005035400390625, 0.0005269050598144531, 0.0005502700805664062, 0.0005736351013183594, 0.0005970001220703125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 8.0, 10.0, 7.0, 17.0, 15.0, 24.0, 36.0, 40.0, 71.0, 112.0, 233.0, 503.0, 3098.0, 1040164.0, 3126.0, 517.0, 208.0, 122.0, 84.0, 44.0, 31.0, 20.0, 14.0, 11.0, 9.0, 7.0, 2.0, 1.0, 6.0, 4.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01375579833984375, -0.013216376304626465, -0.01267695426940918, -0.012137532234191895, -0.01159811019897461, -0.011058688163757324, -0.010519266128540039, -0.009979844093322754, -0.009440422058105469, -0.008901000022888184, -0.008361577987670898, -0.007822155952453613, -0.007282733917236328, -0.006743311882019043, -0.006203889846801758, -0.005664467811584473, -0.0051250457763671875, -0.004585623741149902, -0.004046201705932617, -0.003506779670715332, -0.002967357635498047, -0.0024279356002807617, -0.0018885135650634766, -0.0013490915298461914, -0.0008096694946289062, -0.0002702474594116211, 0.00026917457580566406, 0.0008085966110229492, 0.0013480186462402344, 0.0018874406814575195, 0.0024268627166748047, 0.00296628475189209, 0.003505706787109375, 0.00404512882232666, 0.004584550857543945, 0.0051239728927612305, 0.005663394927978516, 0.006202816963195801, 0.006742238998413086, 0.007281661033630371, 0.007821083068847656, 0.008360505104064941, 0.008899927139282227, 0.009439349174499512, 0.009978771209716797, 0.010518193244934082, 0.011057615280151367, 0.011597037315368652, 0.012136459350585938, 0.012675881385803223, 0.013215303421020508, 0.013754725456237793, 0.014294147491455078, 0.014833569526672363, 0.015372991561889648, 0.015912413597106934, 0.01645183563232422, 0.016991257667541504, 0.01753067970275879, 0.018070101737976074, 0.01860952377319336, 0.019148945808410645, 0.01968836784362793, 0.020227789878845215, 0.0207672119140625]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 11.0, 36.0, 181.0, 360.0, 256.0, 125.0, 31.0, 9.0, 4.0], "bins": [-0.0018274596659466624, -0.001796373981051147, -0.0017652882961556315, -0.001734202727675438, -0.0017031170427799225, -0.001672031357884407, -0.0016409456729888916, -0.0016098599880933762, -0.0015787743031978607, -0.0015476886183023453, -0.0015166029334068298, -0.0014855173649266362, -0.0014544316800311208, -0.0014233459951356053, -0.00139226031024009, -0.0013611746253445745, -0.0013300890568643808, -0.0012990033719688654, -0.00126791768707335, -0.0012368321185931563, -0.001205746433697641, -0.0011746607488021255, -0.00114357506390661, -0.0011124893790110946, -0.001081403810530901, -0.0010503181256353855, -0.00101923244073987, -0.0009881468722596765, -0.000957061187364161, -0.0009259755024686456, -0.0008948898175731301, -0.0008638041326776147, -0.0008327183313667774, -0.000801632646471262, -0.0007705470197834074, -0.000739461334887892, -0.0007083757082000375, -0.000677290023304522, -0.0006462043384090066, -0.0006151186535134912, -0.0005840330850332975, -0.0005529474001377821, -0.0005218617734499276, -0.0004907760885544121, -0.00045969043276272714, -0.00042860477697104216, -0.0003975190920755267, -0.00036643343628384173, -0.0003353477513883263, -0.0003042620955966413, -0.00027317641070112586, -0.00024209075490944088, -0.0002110050991177559, -0.0001799194433260709, -0.0001488337729824707, -0.00011774810263887048, -8.666244684718549e-05, -5.557678377954289e-05, -2.4491120711900294e-05, 6.5945423557423055e-06, 3.7680205423384905e-05, 6.876586121506989e-05, 9.98515315586701e-05, 0.00013093720190227032, 0.0001620228576939553]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 3.0, 2.0, 5.0, 3.0, 5.0, 3.0, 4.0, 4.0, 12.0, 5.0, 17.0, 17.0, 23.0, 20.0, 26.0, 26.0, 30.0, 32.0, 36.0, 42.0, 28.0, 35.0, 45.0, 39.0, 44.0, 37.0, 51.0, 45.0, 33.0, 44.0, 41.0, 34.0, 33.0, 29.0, 20.0, 22.0, 29.0, 12.0, 22.0, 8.0, 12.0, 4.0, 7.0, 5.0, 3.0, 4.0, 3.0, 4.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00026863813400268555, -0.00025929044932127, -0.00024994276463985443, -0.00024059507995843887, -0.00023124739527702332, -0.00022189971059560776, -0.0002125520259141922, -0.00020320434123277664, -0.00019385665655136108, -0.00018450897186994553, -0.00017516128718852997, -0.0001658136025071144, -0.00015646591782569885, -0.0001471182331442833, -0.00013777054846286774, -0.00012842286378145218, -0.00011907517910003662, -0.00010972749441862106, -0.0001003798097372055, -9.103212505578995e-05, -8.168444037437439e-05, -7.233675569295883e-05, -6.298907101154327e-05, -5.3641386330127716e-05, -4.429370164871216e-05, -3.49460169672966e-05, -2.5598332285881042e-05, -1.6250647604465485e-05, -6.902962923049927e-06, 2.444721758365631e-06, 1.1792406439781189e-05, 2.1140091121196747e-05, 3.0487775802612305e-05, 3.983546048402786e-05, 4.918314516544342e-05, 5.853082984685898e-05, 6.787851452827454e-05, 7.72261992096901e-05, 8.657388389110565e-05, 9.592156857252121e-05, 0.00010526925325393677, 0.00011461693793535233, 0.00012396462261676788, 0.00013331230729818344, 0.000142659991979599, 0.00015200767666101456, 0.00016135536134243011, 0.00017070304602384567, 0.00018005073070526123, 0.0001893984153866768, 0.00019874610006809235, 0.0002080937847495079, 0.00021744146943092346, 0.00022678915411233902, 0.00023613683879375458, 0.00024548452347517014, 0.0002548322081565857, 0.00026417989283800125, 0.0002735275775194168, 0.00028287526220083237, 0.0002922229468822479, 0.0003015706315636635, 0.00031091831624507904, 0.0003202660009264946, 0.00032961368560791016]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 10.0, 14.0, 12.0, 14.0, 17.0, 23.0, 28.0, 34.0, 39.0, 44.0, 51.0, 48.0, 61.0, 50.0, 48.0, 47.0, 39.0, 53.0, 51.0, 51.0, 46.0, 34.0, 39.0, 29.0, 21.0, 20.0, 17.0, 15.0, 13.0, 6.0, 8.0, 8.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.98828125, -6.74896240234375, -6.5096435546875, -6.27032470703125, -6.031005859375, -5.79168701171875, -5.5523681640625, -5.31304931640625, -5.07373046875, -4.83441162109375, -4.5950927734375, -4.35577392578125, -4.116455078125, -3.87713623046875, -3.6378173828125, -3.39849853515625, -3.1591796875, -2.91986083984375, -2.6805419921875, -2.44122314453125, -2.201904296875, -1.96258544921875, -1.7232666015625, -1.48394775390625, -1.24462890625, -1.00531005859375, -0.7659912109375, -0.52667236328125, -0.287353515625, -0.04803466796875, 0.1912841796875, 0.43060302734375, 0.669921875, 0.90924072265625, 1.1485595703125, 1.38787841796875, 1.627197265625, 1.86651611328125, 2.1058349609375, 2.34515380859375, 2.58447265625, 2.82379150390625, 3.0631103515625, 3.30242919921875, 3.541748046875, 3.78106689453125, 4.0203857421875, 4.25970458984375, 4.4990234375, 4.73834228515625, 4.9776611328125, 5.21697998046875, 5.456298828125, 5.69561767578125, 5.9349365234375, 6.17425537109375, 6.41357421875, 6.65289306640625, 6.8922119140625, 7.13153076171875, 7.370849609375, 7.61016845703125, 7.8494873046875, 8.08880615234375, 8.328125]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 6.0, 6.0, 19.0, 27.0, 27.0, 62.0, 116.0, 160.0, 293.0, 550.0, 892.0, 1762.0, 3564.0, 7703.0, 19266.0, 59402.0, 249970.0, 502785.0, 139724.0, 37413.0, 13317.0, 5708.0, 2726.0, 1286.0, 720.0, 441.0, 230.0, 165.0, 89.0, 58.0, 27.0, 12.0, 11.0, 10.0, 6.0, 1.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.296875, -4.1502685546875, -4.003662109375, -3.8570556640625, -3.71044921875, -3.5638427734375, -3.417236328125, -3.2706298828125, -3.1240234375, -2.9774169921875, -2.830810546875, -2.6842041015625, -2.53759765625, -2.3909912109375, -2.244384765625, -2.0977783203125, -1.951171875, -1.8045654296875, -1.657958984375, -1.5113525390625, -1.36474609375, -1.2181396484375, -1.071533203125, -0.9249267578125, -0.7783203125, -0.6317138671875, -0.485107421875, -0.3385009765625, -0.19189453125, -0.0452880859375, 0.101318359375, 0.2479248046875, 0.39453125, 0.5411376953125, 0.687744140625, 0.8343505859375, 0.98095703125, 1.1275634765625, 1.274169921875, 1.4207763671875, 1.5673828125, 1.7139892578125, 1.860595703125, 2.0072021484375, 2.15380859375, 2.3004150390625, 2.447021484375, 2.5936279296875, 2.740234375, 2.8868408203125, 3.033447265625, 3.1800537109375, 3.32666015625, 3.4732666015625, 3.619873046875, 3.7664794921875, 3.9130859375, 4.0596923828125, 4.206298828125, 4.3529052734375, 4.49951171875, 4.6461181640625, 4.792724609375, 4.9393310546875, 5.0859375]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 5.0, 5.0, 4.0, 8.0, 11.0, 12.0, 16.0, 14.0, 13.0, 20.0, 26.0, 30.0, 28.0, 36.0, 30.0, 41.0, 42.0, 51.0, 75.0, 1553.0, 512.0, 70.0, 55.0, 32.0, 44.0, 41.0, 39.0, 29.0, 34.0, 24.0, 21.0, 16.0, 17.0, 20.0, 14.0, 11.0, 4.0, 8.0, 9.0, 6.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-18.140625, -17.46826171875, -16.7958984375, -16.12353515625, -15.451171875, -14.77880859375, -14.1064453125, -13.43408203125, -12.76171875, -12.08935546875, -11.4169921875, -10.74462890625, -10.072265625, -9.39990234375, -8.7275390625, -8.05517578125, -7.3828125, -6.71044921875, -6.0380859375, -5.36572265625, -4.693359375, -4.02099609375, -3.3486328125, -2.67626953125, -2.00390625, -1.33154296875, -0.6591796875, 0.01318359375, 0.685546875, 1.35791015625, 2.0302734375, 2.70263671875, 3.375, 4.04736328125, 4.7197265625, 5.39208984375, 6.064453125, 6.73681640625, 7.4091796875, 8.08154296875, 8.75390625, 9.42626953125, 10.0986328125, 10.77099609375, 11.443359375, 12.11572265625, 12.7880859375, 13.46044921875, 14.1328125, 14.80517578125, 15.4775390625, 16.14990234375, 16.822265625, 17.49462890625, 18.1669921875, 18.83935546875, 19.51171875, 20.18408203125, 20.8564453125, 21.52880859375, 22.201171875, 22.87353515625, 23.5458984375, 24.21826171875, 24.890625]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 7.0, 3.0, 9.0, 8.0, 7.0, 5.0, 18.0, 15.0, 20.0, 29.0, 19.0, 37.0, 45.0, 53.0, 79.0, 117.0, 167.0, 277.0, 561.0, 2015.0, 543358.0, 2594755.0, 2598.0, 603.0, 288.0, 167.0, 118.0, 79.0, 52.0, 42.0, 31.0, 17.0, 14.0, 13.0, 20.0, 11.0, 10.0, 6.0, 6.0, 5.0, 3.0, 8.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-42.40625, -41.261962890625, -40.11767578125, -38.973388671875, -37.8291015625, -36.684814453125, -35.54052734375, -34.396240234375, -33.251953125, -32.107666015625, -30.96337890625, -29.819091796875, -28.6748046875, -27.530517578125, -26.38623046875, -25.241943359375, -24.09765625, -22.953369140625, -21.80908203125, -20.664794921875, -19.5205078125, -18.376220703125, -17.23193359375, -16.087646484375, -14.943359375, -13.799072265625, -12.65478515625, -11.510498046875, -10.3662109375, -9.221923828125, -8.07763671875, -6.933349609375, -5.7890625, -4.644775390625, -3.50048828125, -2.356201171875, -1.2119140625, -0.067626953125, 1.07666015625, 2.220947265625, 3.365234375, 4.509521484375, 5.65380859375, 6.798095703125, 7.9423828125, 9.086669921875, 10.23095703125, 11.375244140625, 12.51953125, 13.663818359375, 14.80810546875, 15.952392578125, 17.0966796875, 18.240966796875, 19.38525390625, 20.529541015625, 21.673828125, 22.818115234375, 23.96240234375, 25.106689453125, 26.2509765625, 27.395263671875, 28.53955078125, 29.683837890625, 30.828125]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 5.0, 28.0, 90.0, 196.0, 258.0, 211.0, 142.0, 58.0, 16.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.856503963470459, -4.860631942749023, -3.864760160446167, -2.8688883781433105, -1.873016357421875, -0.8771443367004395, 0.11872720718383789, 1.1145992279052734, 2.110471248626709, 3.1063432693481445, 4.102214813232422, 5.098086833953857, 6.093958854675293, 7.0898308753967285, 8.085702896118164, 9.081574440002441, 10.077445983886719, 11.073317527770996, 12.06919002532959, 13.065061569213867, 14.060934066772461, 15.056805610656738, 16.052677154541016, 17.04854965209961, 18.044422149658203, 19.040294647216797, 20.036165237426758, 21.03203773498535, 22.027910232543945, 23.023780822753906, 24.0196533203125, 25.015525817871094, 26.011398315429688, 27.00727081298828, 28.003141403198242, 28.999013900756836, 29.99488639831543, 30.99075698852539, 31.986629486083984, 32.98250198364258, 33.97837448120117, 34.974246978759766, 35.97011947631836, 36.96598815917969, 37.96186065673828, 38.957733154296875, 39.95360565185547, 40.94947814941406, 41.945350646972656, 42.94122314453125, 43.937095642089844, 44.93296813964844, 45.928836822509766, 46.92470932006836, 47.92058181762695, 48.91645431518555, 49.912322998046875, 50.90819549560547, 51.90406799316406, 52.899940490722656, 53.895809173583984, 54.89168167114258, 55.88755416870117, 56.883426666259766, 57.87929916381836]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 7.0, 5.0, 5.0, 8.0, 7.0, 10.0, 16.0, 12.0, 10.0, 18.0, 18.0, 22.0, 31.0, 24.0, 25.0, 24.0, 27.0, 26.0, 35.0, 30.0, 46.0, 35.0, 44.0, 41.0, 34.0, 27.0, 31.0, 48.0, 40.0, 24.0, 39.0, 32.0, 32.0, 26.0, 19.0, 20.0, 14.0, 18.0, 9.0, 11.0, 10.0, 12.0, 12.0, 4.0, 8.0, 6.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-65.90167999267578, -63.87305450439453, -61.844425201416016, -59.815799713134766, -57.78717041015625, -55.758544921875, -53.72991943359375, -51.7012939453125, -49.672664642333984, -47.644039154052734, -45.61540985107422, -43.58678436279297, -41.55815887451172, -39.5295295715332, -37.50090408325195, -35.47227478027344, -33.44364929199219, -31.415021896362305, -29.386394500732422, -27.357769012451172, -25.32914161682129, -23.300514221191406, -21.271888732910156, -19.243261337280273, -17.21463394165039, -15.186006546020508, -13.157380104064941, -11.128753662109375, -9.100126266479492, -7.071498870849609, -5.042872428894043, -3.0142459869384766, -0.9856109619140625, 1.043015956878662, 3.0716428756713867, 5.100269794464111, 7.128896713256836, 9.157524108886719, 11.186150550842285, 13.214776992797852, 15.243404388427734, 17.272031784057617, 19.3006591796875, 21.32928466796875, 23.357912063598633, 25.386539459228516, 27.415164947509766, 29.44379234313965, 31.47241973876953, 33.50104522705078, 35.5296745300293, 37.55830001831055, 39.58692932128906, 41.61555480957031, 43.64418029785156, 45.67280578613281, 47.70143508911133, 49.73006057739258, 51.758689880371094, 53.787315368652344, 55.815940856933594, 57.84457015991211, 59.87319564819336, 61.901824951171875, 63.930450439453125]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 4.0, 6.0, 12.0, 13.0, 10.0, 19.0, 14.0, 18.0, 31.0, 42.0, 34.0, 53.0, 48.0, 49.0, 52.0, 52.0, 52.0, 45.0, 55.0, 50.0, 44.0, 56.0, 44.0, 30.0, 31.0, 36.0, 21.0, 18.0, 16.0, 14.0, 13.0, 5.0, 10.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.109375, -6.8643798828125, -6.619384765625, -6.3743896484375, -6.12939453125, -5.8843994140625, -5.639404296875, -5.3944091796875, -5.1494140625, -4.9044189453125, -4.659423828125, -4.4144287109375, -4.16943359375, -3.9244384765625, -3.679443359375, -3.4344482421875, -3.189453125, -2.9444580078125, -2.699462890625, -2.4544677734375, -2.20947265625, -1.9644775390625, -1.719482421875, -1.4744873046875, -1.2294921875, -0.9844970703125, -0.739501953125, -0.4945068359375, -0.24951171875, -0.0045166015625, 0.240478515625, 0.4854736328125, 0.73046875, 0.9754638671875, 1.220458984375, 1.4654541015625, 1.71044921875, 1.9554443359375, 2.200439453125, 2.4454345703125, 2.6904296875, 2.9354248046875, 3.180419921875, 3.4254150390625, 3.67041015625, 3.9154052734375, 4.160400390625, 4.4053955078125, 4.650390625, 4.8953857421875, 5.140380859375, 5.3853759765625, 5.63037109375, 5.8753662109375, 6.120361328125, 6.3653564453125, 6.6103515625, 6.8553466796875, 7.100341796875, 7.3453369140625, 7.59033203125, 7.8353271484375, 8.080322265625, 8.3253173828125, 8.5703125]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 6.0, 11.0, 13.0, 10.0, 17.0, 25.0, 26.0, 35.0, 51.0, 93.0, 132.0, 236.0, 916.0, 6605.0, 149383.0, 3359691.0, 657115.0, 17200.0, 1805.0, 402.0, 183.0, 83.0, 58.0, 38.0, 34.0, 30.0, 25.0, 14.0, 14.0, 8.0, 5.0, 7.0, 7.0, 1.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.53125, -20.780517578125, -20.02978515625, -19.279052734375, -18.5283203125, -17.777587890625, -17.02685546875, -16.276123046875, -15.525390625, -14.774658203125, -14.02392578125, -13.273193359375, -12.5224609375, -11.771728515625, -11.02099609375, -10.270263671875, -9.51953125, -8.768798828125, -8.01806640625, -7.267333984375, -6.5166015625, -5.765869140625, -5.01513671875, -4.264404296875, -3.513671875, -2.762939453125, -2.01220703125, -1.261474609375, -0.5107421875, 0.239990234375, 0.99072265625, 1.741455078125, 2.4921875, 3.242919921875, 3.99365234375, 4.744384765625, 5.4951171875, 6.245849609375, 6.99658203125, 7.747314453125, 8.498046875, 9.248779296875, 9.99951171875, 10.750244140625, 11.5009765625, 12.251708984375, 13.00244140625, 13.753173828125, 14.50390625, 15.254638671875, 16.00537109375, 16.756103515625, 17.5068359375, 18.257568359375, 19.00830078125, 19.759033203125, 20.509765625, 21.260498046875, 22.01123046875, 22.761962890625, 23.5126953125, 24.263427734375, 25.01416015625, 25.764892578125, 26.515625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 6.0, 6.0, 6.0, 5.0, 13.0, 23.0, 22.0, 42.0, 60.0, 68.0, 79.0, 101.0, 153.0, 189.0, 299.0, 369.0, 472.0, 430.0, 423.0, 346.0, 270.0, 198.0, 117.0, 95.0, 71.0, 51.0, 46.0, 34.0, 22.0, 24.0, 6.0, 12.0, 10.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-20.84375, -20.313232421875, -19.78271484375, -19.252197265625, -18.7216796875, -18.191162109375, -17.66064453125, -17.130126953125, -16.599609375, -16.069091796875, -15.53857421875, -15.008056640625, -14.4775390625, -13.947021484375, -13.41650390625, -12.885986328125, -12.35546875, -11.824951171875, -11.29443359375, -10.763916015625, -10.2333984375, -9.702880859375, -9.17236328125, -8.641845703125, -8.111328125, -7.580810546875, -7.05029296875, -6.519775390625, -5.9892578125, -5.458740234375, -4.92822265625, -4.397705078125, -3.8671875, -3.336669921875, -2.80615234375, -2.275634765625, -1.7451171875, -1.214599609375, -0.68408203125, -0.153564453125, 0.376953125, 0.907470703125, 1.43798828125, 1.968505859375, 2.4990234375, 3.029541015625, 3.56005859375, 4.090576171875, 4.62109375, 5.151611328125, 5.68212890625, 6.212646484375, 6.7431640625, 7.273681640625, 7.80419921875, 8.334716796875, 8.865234375, 9.395751953125, 9.92626953125, 10.456787109375, 10.9873046875, 11.517822265625, 12.04833984375, 12.578857421875, 13.109375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 13.0, 20.0, 9.0, 29.0, 34.0, 44.0, 74.0, 93.0, 152.0, 209.0, 351.0, 751.0, 8333.0, 3971930.0, 209361.0, 1592.0, 433.0, 266.0, 192.0, 123.0, 67.0, 58.0, 44.0, 34.0, 26.0, 15.0, 13.0, 5.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.5625, -66.0, -63.4375, -60.875, -58.3125, -55.75, -53.1875, -50.625, -48.0625, -45.5, -42.9375, -40.375, -37.8125, -35.25, -32.6875, -30.125, -27.5625, -25.0, -22.4375, -19.875, -17.3125, -14.75, -12.1875, -9.625, -7.0625, -4.5, -1.9375, 0.625, 3.1875, 5.75, 8.3125, 10.875, 13.4375, 16.0, 18.5625, 21.125, 23.6875, 26.25, 28.8125, 31.375, 33.9375, 36.5, 39.0625, 41.625, 44.1875, 46.75, 49.3125, 51.875, 54.4375, 57.0, 59.5625, 62.125, 64.6875, 67.25, 69.8125, 72.375, 74.9375, 77.5, 80.0625, 82.625, 85.1875, 87.75, 90.3125, 92.875, 95.4375]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 9.0, 46.0, 146.0, 315.0, 310.0, 129.0, 41.0, 13.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-128.89718627929688, -123.5195083618164, -118.14183044433594, -112.76414489746094, -107.386474609375, -102.0087890625, -96.63111114501953, -91.25343322753906, -85.8757553100586, -80.49807739257812, -75.12039947509766, -69.74272155761719, -64.36503601074219, -58.987361907958984, -53.60968017578125, -48.23200225830078, -42.85432434082031, -37.476646423339844, -32.098968505859375, -26.72128677368164, -21.343608856201172, -15.965930938720703, -10.588249206542969, -5.2105712890625, 0.16710662841796875, 5.544785499572754, 10.922464370727539, 16.30014419555664, 21.67782211303711, 27.055500030517578, 32.43318176269531, 37.81085968017578, 43.18852233886719, 48.566200256347656, 53.943878173828125, 59.32155990600586, 64.69923400878906, 70.07691955566406, 75.45459747314453, 80.832275390625, 86.20995330810547, 91.58763122558594, 96.9653091430664, 102.34298706054688, 107.72067260742188, 113.09834289550781, 118.47602844238281, 123.85370635986328, 129.23138427734375, 134.60906982421875, 139.9867401123047, 145.3644256591797, 150.74209594726562, 156.11978149414062, 161.49746704101562, 166.87513732910156, 172.2528076171875, 177.6304931640625, 183.00816345214844, 188.38584899902344, 193.76351928710938, 199.14120483398438, 204.51889038085938, 209.8965606689453, 215.2742462158203]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 0.0, 4.0, 6.0, 9.0, 11.0, 10.0, 11.0, 21.0, 14.0, 18.0, 15.0, 28.0, 34.0, 20.0, 27.0, 34.0, 40.0, 46.0, 23.0, 33.0, 39.0, 46.0, 45.0, 33.0, 40.0, 22.0, 39.0, 30.0, 31.0, 44.0, 33.0, 27.0, 28.0, 19.0, 19.0, 21.0, 13.0, 10.0, 10.0, 13.0, 4.0, 9.0, 3.0, 8.0, 3.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0], "bins": [-54.411285400390625, -52.87126922607422, -51.33125305175781, -49.79123306274414, -48.251216888427734, -46.71120071411133, -45.171180725097656, -43.63116455078125, -42.091148376464844, -40.55113220214844, -39.01111602783203, -37.47109603881836, -35.93107986450195, -34.39106369018555, -32.851043701171875, -31.31102752685547, -29.771011352539062, -28.230995178222656, -26.690977096557617, -25.150959014892578, -23.610942840576172, -22.070926666259766, -20.530908584594727, -18.990890502929688, -17.45087432861328, -15.910857200622559, -14.370840072631836, -12.830822944641113, -11.29080581665039, -9.750788688659668, -8.210771560668945, -6.670754432678223, -5.1307373046875, -3.5907201766967773, -2.0507030487060547, -0.510685920715332, 1.0293312072753906, 2.5693483352661133, 4.109365463256836, 5.649382591247559, 7.189399719238281, 8.729416847229004, 10.269433975219727, 11.80945110321045, 13.349468231201172, 14.889485359191895, 16.429502487182617, 17.969520568847656, 19.509536743164062, 21.04955291748047, 22.589570999145508, 24.129589080810547, 25.669605255126953, 27.20962142944336, 28.7496395111084, 30.289657592773438, 31.829673767089844, 33.36968994140625, 34.909706115722656, 36.44972610473633, 37.989742279052734, 39.52975845336914, 41.06977844238281, 42.60979461669922, 44.149810791015625]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 8.0, 10.0, 7.0, 7.0, 18.0, 7.0, 21.0, 25.0, 27.0, 38.0, 42.0, 35.0, 52.0, 46.0, 56.0, 51.0, 44.0, 45.0, 47.0, 47.0, 54.0, 42.0, 53.0, 51.0, 26.0, 29.0, 21.0, 19.0, 14.0, 18.0, 14.0, 5.0, 9.0, 6.0, 8.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.52734375, -6.28887939453125, -6.0504150390625, -5.81195068359375, -5.573486328125, -5.33502197265625, -5.0965576171875, -4.85809326171875, -4.61962890625, -4.38116455078125, -4.1427001953125, -3.90423583984375, -3.665771484375, -3.42730712890625, -3.1888427734375, -2.95037841796875, -2.7119140625, -2.47344970703125, -2.2349853515625, -1.99652099609375, -1.758056640625, -1.51959228515625, -1.2811279296875, -1.04266357421875, -0.80419921875, -0.56573486328125, -0.3272705078125, -0.08880615234375, 0.149658203125, 0.38812255859375, 0.6265869140625, 0.86505126953125, 1.103515625, 1.34197998046875, 1.5804443359375, 1.81890869140625, 2.057373046875, 2.29583740234375, 2.5343017578125, 2.77276611328125, 3.01123046875, 3.24969482421875, 3.4881591796875, 3.72662353515625, 3.965087890625, 4.20355224609375, 4.4420166015625, 4.68048095703125, 4.9189453125, 5.15740966796875, 5.3958740234375, 5.63433837890625, 5.872802734375, 6.11126708984375, 6.3497314453125, 6.58819580078125, 6.82666015625, 7.06512451171875, 7.3035888671875, 7.54205322265625, 7.780517578125, 8.01898193359375, 8.2574462890625, 8.49591064453125, 8.734375]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 2.0, 4.0, 7.0, 10.0, 20.0, 30.0, 38.0, 79.0, 107.0, 153.0, 236.0, 413.0, 683.0, 1105.0, 1972.0, 3104.0, 5496.0, 9727.0, 17631.0, 32146.0, 64208.0, 136390.0, 349026.0, 225522.0, 96522.0, 47405.0, 24866.0, 13465.0, 7452.0, 4342.0, 2476.0, 1543.0, 900.0, 588.0, 330.0, 200.0, 129.0, 81.0, 47.0, 29.0, 20.0, 12.0, 16.0, 9.0, 3.0, 9.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.69921875, -1.645751953125, -1.59228515625, -1.538818359375, -1.4853515625, -1.431884765625, -1.37841796875, -1.324951171875, -1.271484375, -1.218017578125, -1.16455078125, -1.111083984375, -1.0576171875, -1.004150390625, -0.95068359375, -0.897216796875, -0.84375, -0.790283203125, -0.73681640625, -0.683349609375, -0.6298828125, -0.576416015625, -0.52294921875, -0.469482421875, -0.416015625, -0.362548828125, -0.30908203125, -0.255615234375, -0.2021484375, -0.148681640625, -0.09521484375, -0.041748046875, 0.01171875, 0.065185546875, 0.11865234375, 0.172119140625, 0.2255859375, 0.279052734375, 0.33251953125, 0.385986328125, 0.439453125, 0.492919921875, 0.54638671875, 0.599853515625, 0.6533203125, 0.706787109375, 0.76025390625, 0.813720703125, 0.8671875, 0.920654296875, 0.97412109375, 1.027587890625, 1.0810546875, 1.134521484375, 1.18798828125, 1.241455078125, 1.294921875, 1.348388671875, 1.40185546875, 1.455322265625, 1.5087890625, 1.562255859375, 1.61572265625, 1.669189453125, 1.72265625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 6.0, 3.0, 3.0, 2.0, 3.0, 3.0, 9.0, 6.0, 12.0, 8.0, 8.0, 14.0, 11.0, 15.0, 15.0, 26.0, 35.0, 28.0, 21.0, 31.0, 33.0, 17.0, 40.0, 41.0, 40.0, 52.0, 34.0, 1060.0, 35.0, 40.0, 29.0, 18.0, 22.0, 34.0, 27.0, 29.0, 21.0, 34.0, 22.0, 20.0, 18.0, 17.0, 12.0, 13.0, 14.0, 14.0, 11.0, 7.0, 5.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0], "bins": [-3.275390625, -3.170318603515625, -3.06524658203125, -2.960174560546875, -2.8551025390625, -2.750030517578125, -2.64495849609375, -2.539886474609375, -2.434814453125, -2.329742431640625, -2.22467041015625, -2.119598388671875, -2.0145263671875, -1.909454345703125, -1.80438232421875, -1.699310302734375, -1.59423828125, -1.489166259765625, -1.38409423828125, -1.279022216796875, -1.1739501953125, -1.068878173828125, -0.96380615234375, -0.858734130859375, -0.753662109375, -0.648590087890625, -0.54351806640625, -0.438446044921875, -0.3333740234375, -0.228302001953125, -0.12322998046875, -0.018157958984375, 0.0869140625, 0.191986083984375, 0.29705810546875, 0.402130126953125, 0.5072021484375, 0.612274169921875, 0.71734619140625, 0.822418212890625, 0.927490234375, 1.032562255859375, 1.13763427734375, 1.242706298828125, 1.3477783203125, 1.452850341796875, 1.55792236328125, 1.662994384765625, 1.76806640625, 1.873138427734375, 1.97821044921875, 2.083282470703125, 2.1883544921875, 2.293426513671875, 2.39849853515625, 2.503570556640625, 2.608642578125, 2.713714599609375, 2.81878662109375, 2.923858642578125, 3.0289306640625, 3.134002685546875, 3.23907470703125, 3.344146728515625, 3.44921875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 5.0, 12.0, 19.0, 27.0, 27.0, 32.0, 61.0, 78.0, 118.0, 129.0, 220.0, 331.0, 401.0, 574.0, 773.0, 1172.0, 1640.0, 2287.0, 3195.0, 4634.0, 6619.0, 9597.0, 13832.0, 20557.0, 30809.0, 46527.0, 71982.0, 124887.0, 1316716.0, 178314.0, 90302.0, 56313.0, 36934.0, 24512.0, 16377.0, 11054.0, 7757.0, 5352.0, 3702.0, 2676.0, 1856.0, 1366.0, 946.0, 703.0, 476.0, 356.0, 284.0, 184.0, 119.0, 88.0, 67.0, 31.0, 32.0, 22.0, 17.0, 17.0, 11.0, 2.0, 7.0, 4.0, 3.0], "bins": [-0.94921875, -0.9192962646484375, -0.889373779296875, -0.8594512939453125, -0.82952880859375, -0.7996063232421875, -0.769683837890625, -0.7397613525390625, -0.7098388671875, -0.6799163818359375, -0.649993896484375, -0.6200714111328125, -0.59014892578125, -0.5602264404296875, -0.530303955078125, -0.5003814697265625, -0.470458984375, -0.4405364990234375, -0.410614013671875, -0.3806915283203125, -0.35076904296875, -0.3208465576171875, -0.290924072265625, -0.2610015869140625, -0.2310791015625, -0.2011566162109375, -0.171234130859375, -0.1413116455078125, -0.11138916015625, -0.0814666748046875, -0.051544189453125, -0.0216217041015625, 0.00830078125, 0.0382232666015625, 0.068145751953125, 0.0980682373046875, 0.12799072265625, 0.1579132080078125, 0.187835693359375, 0.2177581787109375, 0.2476806640625, 0.2776031494140625, 0.307525634765625, 0.3374481201171875, 0.36737060546875, 0.3972930908203125, 0.427215576171875, 0.4571380615234375, 0.487060546875, 0.5169830322265625, 0.546905517578125, 0.5768280029296875, 0.60675048828125, 0.6366729736328125, 0.666595458984375, 0.6965179443359375, 0.7264404296875, 0.7563629150390625, 0.786285400390625, 0.8162078857421875, 0.84613037109375, 0.8760528564453125, 0.905975341796875, 0.9358978271484375, 0.9658203125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 3.0, 5.0, 4.0, 9.0, 8.0, 8.0, 14.0, 14.0, 11.0, 14.0, 17.0, 25.0, 28.0, 31.0, 39.0, 40.0, 46.0, 50.0, 49.0, 65.0, 56.0, 59.0, 67.0, 50.0, 49.0, 42.0, 25.0, 21.0, 15.0, 21.0, 19.0, 17.0, 12.0, 6.0, 11.0, 13.0, 7.0, 5.0, 7.0, 5.0, 4.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0005207061767578125, -0.0005050599575042725, -0.0004894137382507324, -0.0004737675189971924, -0.00045812129974365234, -0.0004424750804901123, -0.00042682886123657227, -0.0004111826419830322, -0.0003955364227294922, -0.00037989020347595215, -0.0003642439842224121, -0.00034859776496887207, -0.00033295154571533203, -0.000317305326461792, -0.00030165910720825195, -0.0002860128879547119, -0.0002703666687011719, -0.00025472044944763184, -0.0002390742301940918, -0.00022342801094055176, -0.00020778179168701172, -0.00019213557243347168, -0.00017648935317993164, -0.0001608431339263916, -0.00014519691467285156, -0.00012955069541931152, -0.00011390447616577148, -9.825825691223145e-05, -8.26120376586914e-05, -6.696581840515137e-05, -5.131959915161133e-05, -3.567337989807129e-05, -2.002716064453125e-05, -4.380941390991211e-06, 1.1265277862548828e-05, 2.6911497116088867e-05, 4.2557716369628906e-05, 5.8203935623168945e-05, 7.385015487670898e-05, 8.949637413024902e-05, 0.00010514259338378906, 0.0001207888126373291, 0.00013643503189086914, 0.00015208125114440918, 0.00016772747039794922, 0.00018337368965148926, 0.0001990199089050293, 0.00021466612815856934, 0.00023031234741210938, 0.0002459585666656494, 0.00026160478591918945, 0.0002772510051727295, 0.00029289722442626953, 0.00030854344367980957, 0.0003241896629333496, 0.00033983588218688965, 0.0003554821014404297, 0.0003711283206939697, 0.00038677453994750977, 0.0004024207592010498, 0.00041806697845458984, 0.0004337131977081299, 0.0004493594169616699, 0.00046500563621520996, 0.00048065185546875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 5.0, 3.0, 12.0, 7.0, 14.0, 15.0, 26.0, 27.0, 41.0, 51.0, 68.0, 94.0, 152.0, 250.0, 602.0, 7485.0, 1030871.0, 7442.0, 574.0, 249.0, 148.0, 109.0, 70.0, 61.0, 42.0, 38.0, 21.0, 17.0, 12.0, 7.0, 11.0, 1.0, 5.0, 4.0, 3.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.012115478515625, -0.011690378189086914, -0.011265277862548828, -0.010840177536010742, -0.010415077209472656, -0.00998997688293457, -0.009564876556396484, -0.009139776229858398, -0.008714675903320312, -0.008289575576782227, -0.00786447525024414, -0.007439374923706055, -0.007014274597167969, -0.006589174270629883, -0.006164073944091797, -0.005738973617553711, -0.005313873291015625, -0.004888772964477539, -0.004463672637939453, -0.004038572311401367, -0.0036134719848632812, -0.0031883716583251953, -0.0027632713317871094, -0.0023381710052490234, -0.0019130706787109375, -0.0014879703521728516, -0.0010628700256347656, -0.0006377696990966797, -0.00021266937255859375, 0.0002124309539794922, 0.0006375312805175781, 0.001062631607055664, 0.00148773193359375, 0.001912832260131836, 0.002337932586669922, 0.002763032913208008, 0.0031881332397460938, 0.0036132335662841797, 0.004038333892822266, 0.0044634342193603516, 0.0048885345458984375, 0.0053136348724365234, 0.005738735198974609, 0.006163835525512695, 0.006588935852050781, 0.007014036178588867, 0.007439136505126953, 0.007864236831665039, 0.008289337158203125, 0.008714437484741211, 0.009139537811279297, 0.009564638137817383, 0.009989738464355469, 0.010414838790893555, 0.01083993911743164, 0.011265039443969727, 0.011690139770507812, 0.012115240097045898, 0.012540340423583984, 0.01296544075012207, 0.013390541076660156, 0.013815641403198242, 0.014240741729736328, 0.014665842056274414, 0.0150909423828125]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [8.0, 56.0, 307.0, 451.0, 169.0, 21.0, 5.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014267714868765324, -9.896239498630166e-05, -5.524764128495008e-05, -1.1532887583598495e-05, 3.218186611775309e-05, 7.589661981910467e-05, 0.00011961137352045625, 0.0001633261126698926, 0.00020704088092315942, 0.000250755634624511, 0.0002944704028777778, 0.00033818514202721417, 0.0003818998811766505, 0.00042561464942991734, 0.00046932941768318415, 0.00051304412772879, 0.0005567588959820569, 0.0006004736642353237, 0.0006441883742809296, 0.0006879031425341964, 0.0007316179107874632, 0.00077533267904073, 0.0008190474472939968, 0.0008627621573396027, 0.0009064769255928695, 0.0009501916938461363, 0.0009939064038917422, 0.001037621172145009, 0.0010813359403982759, 0.0011250507086515427, 0.0011687654769048095, 0.0012124802451580763, 0.0012561948969960213, 0.001299909665249288, 0.001343624433502555, 0.0013873392017558217, 0.0014310539700090885, 0.0014747686218470335, 0.0015184833901003003, 0.0015621981583535671, 0.001605912926606834, 0.0016496276948601007, 0.0016933424631133676, 0.0017370572313666344, 0.0017807718832045794, 0.0018244866514578462, 0.001868201419711113, 0.0019119161879643798, 0.0019556309562176466, 0.0019993456080555916, 0.0020430604927241802, 0.002086775144562125, 0.002130490029230714, 0.002174204681068659, 0.0022179195657372475, 0.0022616342175751925, 0.0023053488694131374, 0.0023490635212510824, 0.002392778405919671, 0.002436493057757616, 0.0024802079424262047, 0.0025239225942641497, 0.0025676374789327383, 0.0026113521307706833, 0.002655067015439272]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 5.0, 5.0, 1.0, 8.0, 8.0, 4.0, 11.0, 14.0, 21.0, 18.0, 16.0, 26.0, 30.0, 28.0, 29.0, 35.0, 40.0, 39.0, 37.0, 40.0, 43.0, 33.0, 55.0, 41.0, 44.0, 33.0, 32.0, 29.0, 36.0, 33.0, 24.0, 30.0, 28.0, 20.0, 17.0, 18.0, 11.0, 12.0, 15.0, 8.0, 9.0, 3.0, 1.0, 4.0, 5.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00026494264602661133, -0.0002562534064054489, -0.0002475641667842865, -0.00023887492716312408, -0.00023018568754196167, -0.00022149644792079926, -0.00021280720829963684, -0.00020411796867847443, -0.000195428729057312, -0.0001867394894361496, -0.00017805024981498718, -0.00016936101019382477, -0.00016067177057266235, -0.00015198253095149994, -0.00014329329133033752, -0.0001346040517091751, -0.0001259148120880127, -0.00011722557246685028, -0.00010853633284568787, -9.984709322452545e-05, -9.115785360336304e-05, -8.246861398220062e-05, -7.377937436103821e-05, -6.50901347398758e-05, -5.640089511871338e-05, -4.7711655497550964e-05, -3.902241587638855e-05, -3.0333176255226135e-05, -2.164393663406372e-05, -1.2954697012901306e-05, -4.265457391738892e-06, 4.423782229423523e-06, 1.3113021850585938e-05, 2.1802261471748352e-05, 3.0491501092910767e-05, 3.918074071407318e-05, 4.7869980335235596e-05, 5.655921995639801e-05, 6.524845957756042e-05, 7.393769919872284e-05, 8.262693881988525e-05, 9.131617844104767e-05, 0.00010000541806221008, 0.0001086946576833725, 0.00011738389730453491, 0.00012607313692569733, 0.00013476237654685974, 0.00014345161616802216, 0.00015214085578918457, 0.00016083009541034698, 0.0001695193350315094, 0.00017820857465267181, 0.00018689781427383423, 0.00019558705389499664, 0.00020427629351615906, 0.00021296553313732147, 0.0002216547727584839, 0.0002303440123796463, 0.00023903325200080872, 0.00024772249162197113, 0.00025641173124313354, 0.00026510097086429596, 0.0002737902104854584, 0.0002824794501066208, 0.0002911686897277832]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 8.0, 10.0, 7.0, 7.0, 18.0, 7.0, 21.0, 25.0, 27.0, 38.0, 42.0, 35.0, 52.0, 46.0, 56.0, 51.0, 44.0, 45.0, 47.0, 47.0, 54.0, 42.0, 53.0, 51.0, 26.0, 29.0, 21.0, 19.0, 14.0, 18.0, 14.0, 5.0, 9.0, 6.0, 8.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.52734375, -6.28887939453125, -6.0504150390625, -5.81195068359375, -5.573486328125, -5.33502197265625, -5.0965576171875, -4.85809326171875, -4.61962890625, -4.38116455078125, -4.1427001953125, -3.90423583984375, -3.665771484375, -3.42730712890625, -3.1888427734375, -2.95037841796875, -2.7119140625, -2.47344970703125, -2.2349853515625, -1.99652099609375, -1.758056640625, -1.51959228515625, -1.2811279296875, -1.04266357421875, -0.80419921875, -0.56573486328125, -0.3272705078125, -0.08880615234375, 0.149658203125, 0.38812255859375, 0.6265869140625, 0.86505126953125, 1.103515625, 1.34197998046875, 1.5804443359375, 1.81890869140625, 2.057373046875, 2.29583740234375, 2.5343017578125, 2.77276611328125, 3.01123046875, 3.24969482421875, 3.4881591796875, 3.72662353515625, 3.965087890625, 4.20355224609375, 4.4420166015625, 4.68048095703125, 4.9189453125, 5.15740966796875, 5.3958740234375, 5.63433837890625, 5.872802734375, 6.11126708984375, 6.3497314453125, 6.58819580078125, 6.82666015625, 7.06512451171875, 7.3035888671875, 7.54205322265625, 7.780517578125, 8.01898193359375, 8.2574462890625, 8.49591064453125, 8.734375]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [5.0, 2.0, 1.0, 5.0, 5.0, 15.0, 19.0, 10.0, 22.0, 38.0, 43.0, 60.0, 94.0, 127.0, 178.0, 281.0, 359.0, 532.0, 633.0, 937.0, 1314.0, 1613.0, 2366.0, 3285.0, 4777.0, 7086.0, 11285.0, 20808.0, 45094.0, 118719.0, 379437.0, 277861.0, 88281.0, 35053.0, 17237.0, 9675.0, 6227.0, 4269.0, 2983.0, 2156.0, 1588.0, 1141.0, 817.0, 557.0, 441.0, 298.0, 218.0, 165.0, 120.0, 86.0, 79.0, 46.0, 31.0, 27.0, 20.0, 17.0, 5.0, 11.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0], "bins": [-3.4453125, -3.333648681640625, -3.22198486328125, -3.110321044921875, -2.9986572265625, -2.886993408203125, -2.77532958984375, -2.663665771484375, -2.552001953125, -2.440338134765625, -2.32867431640625, -2.217010498046875, -2.1053466796875, -1.993682861328125, -1.88201904296875, -1.770355224609375, -1.65869140625, -1.547027587890625, -1.43536376953125, -1.323699951171875, -1.2120361328125, -1.100372314453125, -0.98870849609375, -0.877044677734375, -0.765380859375, -0.653717041015625, -0.54205322265625, -0.430389404296875, -0.3187255859375, -0.207061767578125, -0.09539794921875, 0.016265869140625, 0.1279296875, 0.239593505859375, 0.35125732421875, 0.462921142578125, 0.5745849609375, 0.686248779296875, 0.79791259765625, 0.909576416015625, 1.021240234375, 1.132904052734375, 1.24456787109375, 1.356231689453125, 1.4678955078125, 1.579559326171875, 1.69122314453125, 1.802886962890625, 1.91455078125, 2.026214599609375, 2.13787841796875, 2.249542236328125, 2.3612060546875, 2.472869873046875, 2.58453369140625, 2.696197509765625, 2.807861328125, 2.919525146484375, 3.03118896484375, 3.142852783203125, 3.2545166015625, 3.366180419921875, 3.47784423828125, 3.589508056640625, 3.701171875]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 1.0, 4.0, 3.0, 2.0, 4.0, 8.0, 5.0, 12.0, 14.0, 13.0, 27.0, 21.0, 31.0, 31.0, 32.0, 39.0, 50.0, 52.0, 51.0, 88.0, 508.0, 1582.0, 65.0, 46.0, 51.0, 42.0, 53.0, 30.0, 39.0, 34.0, 25.0, 20.0, 16.0, 11.0, 13.0, 10.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.859375, -25.0517578125, -24.244140625, -23.4365234375, -22.62890625, -21.8212890625, -21.013671875, -20.2060546875, -19.3984375, -18.5908203125, -17.783203125, -16.9755859375, -16.16796875, -15.3603515625, -14.552734375, -13.7451171875, -12.9375, -12.1298828125, -11.322265625, -10.5146484375, -9.70703125, -8.8994140625, -8.091796875, -7.2841796875, -6.4765625, -5.6689453125, -4.861328125, -4.0537109375, -3.24609375, -2.4384765625, -1.630859375, -0.8232421875, -0.015625, 0.7919921875, 1.599609375, 2.4072265625, 3.21484375, 4.0224609375, 4.830078125, 5.6376953125, 6.4453125, 7.2529296875, 8.060546875, 8.8681640625, 9.67578125, 10.4833984375, 11.291015625, 12.0986328125, 12.90625, 13.7138671875, 14.521484375, 15.3291015625, 16.13671875, 16.9443359375, 17.751953125, 18.5595703125, 19.3671875, 20.1748046875, 20.982421875, 21.7900390625, 22.59765625, 23.4052734375, 24.212890625, 25.0205078125, 25.828125]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 5.0, 0.0, 4.0, 6.0, 3.0, 8.0, 11.0, 14.0, 17.0, 24.0, 31.0, 30.0, 54.0, 54.0, 75.0, 148.0, 219.0, 340.0, 697.0, 8765.0, 3080274.0, 52244.0, 1423.0, 452.0, 267.0, 140.0, 91.0, 73.0, 54.0, 46.0, 36.0, 25.0, 18.0, 14.0, 11.0, 7.0, 8.0, 3.0, 5.0, 4.0, 5.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-46.28125, -44.8212890625, -43.361328125, -41.9013671875, -40.44140625, -38.9814453125, -37.521484375, -36.0615234375, -34.6015625, -33.1416015625, -31.681640625, -30.2216796875, -28.76171875, -27.3017578125, -25.841796875, -24.3818359375, -22.921875, -21.4619140625, -20.001953125, -18.5419921875, -17.08203125, -15.6220703125, -14.162109375, -12.7021484375, -11.2421875, -9.7822265625, -8.322265625, -6.8623046875, -5.40234375, -3.9423828125, -2.482421875, -1.0224609375, 0.4375, 1.8974609375, 3.357421875, 4.8173828125, 6.27734375, 7.7373046875, 9.197265625, 10.6572265625, 12.1171875, 13.5771484375, 15.037109375, 16.4970703125, 17.95703125, 19.4169921875, 20.876953125, 22.3369140625, 23.796875, 25.2568359375, 26.716796875, 28.1767578125, 29.63671875, 31.0966796875, 32.556640625, 34.0166015625, 35.4765625, 36.9365234375, 38.396484375, 39.8564453125, 41.31640625, 42.7763671875, 44.236328125, 45.6962890625, 47.15625]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 42.0, 273.0, 496.0, 185.0, 15.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-117.33168029785156, -114.99890899658203, -112.66613006591797, -110.33335876464844, -108.00057983398438, -105.66780853271484, -103.33503723144531, -101.00225830078125, -98.66948699951172, -96.33671569824219, -94.00393676757812, -91.6711654663086, -89.33839416503906, -87.005615234375, -84.67284393310547, -82.34007263183594, -80.00729370117188, -77.67452239990234, -75.34174346923828, -73.00897216796875, -70.67619323730469, -68.34342193603516, -66.01065063476562, -63.67787551879883, -61.34510040283203, -59.012325286865234, -56.67955017089844, -54.346778869628906, -52.01400375366211, -49.68122863769531, -47.34845733642578, -45.015682220458984, -42.68291091918945, -40.350135803222656, -38.017364501953125, -35.68458938598633, -33.35181427001953, -31.019039154052734, -28.68626594543457, -26.353492736816406, -24.02071762084961, -21.687942504882812, -19.35516929626465, -17.022396087646484, -14.689620971679688, -12.356846809387207, -10.024072647094727, -7.6912994384765625, -5.358524322509766, -3.025750160217285, -0.6929759979248047, 1.6397981643676758, 3.9725723266601562, 6.305346488952637, 8.638120651245117, 10.970893859863281, 13.303668975830078, 15.636443138122559, 17.96921730041504, 20.301990509033203, 22.634765625, 24.967540740966797, 27.30031394958496, 29.633087158203125, 31.965862274169922]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 7.0, 2.0, 9.0, 8.0, 9.0, 10.0, 8.0, 17.0, 10.0, 18.0, 22.0, 23.0, 19.0, 27.0, 37.0, 33.0, 31.0, 30.0, 35.0, 57.0, 42.0, 42.0, 31.0, 44.0, 48.0, 51.0, 39.0, 34.0, 29.0, 33.0, 44.0, 27.0, 29.0, 12.0, 20.0, 10.0, 10.0, 12.0, 6.0, 5.0, 6.0, 9.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-63.45050048828125, -61.33300018310547, -59.21549987792969, -57.09800338745117, -54.98050308227539, -52.86300277709961, -50.745506286621094, -48.62800598144531, -46.51050567626953, -44.39300537109375, -42.27550506591797, -40.15800857543945, -38.04050827026367, -35.92300796508789, -33.805511474609375, -31.688011169433594, -29.570510864257812, -27.45301055908203, -25.335512161254883, -23.218013763427734, -21.100513458251953, -18.983013153076172, -16.865514755249023, -14.748015403747559, -12.630516052246094, -10.513016700744629, -8.395517349243164, -6.278017997741699, -4.160518646240234, -2.0430192947387695, 0.07448005676269531, 2.19197940826416, 4.309471130371094, 6.426970481872559, 8.544469833374023, 10.661969184875488, 12.779468536376953, 14.896967887878418, 17.014467239379883, 19.13196563720703, 21.249465942382812, 23.366966247558594, 25.484464645385742, 27.60196304321289, 29.719463348388672, 31.836963653564453, 33.95446014404297, 36.07196044921875, 38.18946075439453, 40.30696105957031, 42.424461364746094, 44.54195785522461, 46.65945816040039, 48.77695846557617, 50.89445495605469, 53.01195526123047, 55.12945556640625, 57.24695587158203, 59.36445617675781, 61.48195266723633, 63.59945297241211, 65.71694946289062, 67.8344497680664, 69.95195007324219, 72.06945037841797]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 10.0, 7.0, 9.0, 8.0, 16.0, 15.0, 14.0, 26.0, 31.0, 40.0, 41.0, 42.0, 46.0, 44.0, 66.0, 42.0, 45.0, 50.0, 41.0, 62.0, 41.0, 46.0, 58.0, 33.0, 29.0, 30.0, 25.0, 13.0, 12.0, 22.0, 12.0, 6.0, 7.0, 6.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.7890625, -6.5474853515625, -6.305908203125, -6.0643310546875, -5.82275390625, -5.5811767578125, -5.339599609375, -5.0980224609375, -4.8564453125, -4.6148681640625, -4.373291015625, -4.1317138671875, -3.89013671875, -3.6485595703125, -3.406982421875, -3.1654052734375, -2.923828125, -2.6822509765625, -2.440673828125, -2.1990966796875, -1.95751953125, -1.7159423828125, -1.474365234375, -1.2327880859375, -0.9912109375, -0.7496337890625, -0.508056640625, -0.2664794921875, -0.02490234375, 0.2166748046875, 0.458251953125, 0.6998291015625, 0.94140625, 1.1829833984375, 1.424560546875, 1.6661376953125, 1.90771484375, 2.1492919921875, 2.390869140625, 2.6324462890625, 2.8740234375, 3.1156005859375, 3.357177734375, 3.5987548828125, 3.84033203125, 4.0819091796875, 4.323486328125, 4.5650634765625, 4.806640625, 5.0482177734375, 5.289794921875, 5.5313720703125, 5.77294921875, 6.0145263671875, 6.256103515625, 6.4976806640625, 6.7392578125, 6.9808349609375, 7.222412109375, 7.4639892578125, 7.70556640625, 7.9471435546875, 8.188720703125, 8.4302978515625, 8.671875]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 4.0, 3.0, 11.0, 8.0, 19.0, 14.0, 30.0, 29.0, 51.0, 81.0, 129.0, 185.0, 342.0, 576.0, 1035.0, 2151.0, 4806.0, 11981.0, 31989.0, 107733.0, 384245.0, 1122412.0, 1509309.0, 723955.0, 202568.0, 57248.0, 19183.0, 7439.0, 3255.0, 1480.0, 795.0, 443.0, 256.0, 171.0, 119.0, 76.0, 46.0, 41.0, 23.0, 14.0, 12.0, 6.0, 3.0, 4.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.33203125, -6.10797119140625, -5.8839111328125, -5.65985107421875, -5.435791015625, -5.21173095703125, -4.9876708984375, -4.76361083984375, -4.53955078125, -4.31549072265625, -4.0914306640625, -3.86737060546875, -3.643310546875, -3.41925048828125, -3.1951904296875, -2.97113037109375, -2.7470703125, -2.52301025390625, -2.2989501953125, -2.07489013671875, -1.850830078125, -1.62677001953125, -1.4027099609375, -1.17864990234375, -0.95458984375, -0.73052978515625, -0.5064697265625, -0.28240966796875, -0.058349609375, 0.16571044921875, 0.3897705078125, 0.61383056640625, 0.837890625, 1.06195068359375, 1.2860107421875, 1.51007080078125, 1.734130859375, 1.95819091796875, 2.1822509765625, 2.40631103515625, 2.63037109375, 2.85443115234375, 3.0784912109375, 3.30255126953125, 3.526611328125, 3.75067138671875, 3.9747314453125, 4.19879150390625, 4.4228515625, 4.64691162109375, 4.8709716796875, 5.09503173828125, 5.319091796875, 5.54315185546875, 5.7672119140625, 5.99127197265625, 6.21533203125, 6.43939208984375, 6.6634521484375, 6.88751220703125, 7.111572265625, 7.33563232421875, 7.5596923828125, 7.78375244140625, 8.0078125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 5.0, 3.0, 5.0, 3.0, 7.0, 15.0, 9.0, 15.0, 20.0, 21.0, 40.0, 51.0, 66.0, 107.0, 131.0, 140.0, 197.0, 252.0, 329.0, 354.0, 397.0, 377.0, 333.0, 277.0, 208.0, 160.0, 128.0, 89.0, 83.0, 66.0, 50.0, 39.0, 24.0, 23.0, 13.0, 14.0, 10.0, 2.0, 7.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.015625, -13.5733642578125, -13.131103515625, -12.6888427734375, -12.24658203125, -11.8043212890625, -11.362060546875, -10.9197998046875, -10.4775390625, -10.0352783203125, -9.593017578125, -9.1507568359375, -8.70849609375, -8.2662353515625, -7.823974609375, -7.3817138671875, -6.939453125, -6.4971923828125, -6.054931640625, -5.6126708984375, -5.17041015625, -4.7281494140625, -4.285888671875, -3.8436279296875, -3.4013671875, -2.9591064453125, -2.516845703125, -2.0745849609375, -1.63232421875, -1.1900634765625, -0.747802734375, -0.3055419921875, 0.13671875, 0.5789794921875, 1.021240234375, 1.4635009765625, 1.90576171875, 2.3480224609375, 2.790283203125, 3.2325439453125, 3.6748046875, 4.1170654296875, 4.559326171875, 5.0015869140625, 5.44384765625, 5.8861083984375, 6.328369140625, 6.7706298828125, 7.212890625, 7.6551513671875, 8.097412109375, 8.5396728515625, 8.98193359375, 9.4241943359375, 9.866455078125, 10.3087158203125, 10.7509765625, 11.1932373046875, 11.635498046875, 12.0777587890625, 12.52001953125, 12.9622802734375, 13.404541015625, 13.8468017578125, 14.2890625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 3.0, 7.0, 13.0, 7.0, 14.0, 22.0, 22.0, 38.0, 41.0, 48.0, 75.0, 89.0, 139.0, 198.0, 338.0, 783.0, 7869.0, 3075275.0, 1103431.0, 4267.0, 649.0, 311.0, 163.0, 118.0, 78.0, 68.0, 51.0, 44.0, 26.0, 19.0, 16.0, 11.0, 11.0, 12.0, 6.0, 1.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-61.5625, -59.5048828125, -57.447265625, -55.3896484375, -53.33203125, -51.2744140625, -49.216796875, -47.1591796875, -45.1015625, -43.0439453125, -40.986328125, -38.9287109375, -36.87109375, -34.8134765625, -32.755859375, -30.6982421875, -28.640625, -26.5830078125, -24.525390625, -22.4677734375, -20.41015625, -18.3525390625, -16.294921875, -14.2373046875, -12.1796875, -10.1220703125, -8.064453125, -6.0068359375, -3.94921875, -1.8916015625, 0.166015625, 2.2236328125, 4.28125, 6.3388671875, 8.396484375, 10.4541015625, 12.51171875, 14.5693359375, 16.626953125, 18.6845703125, 20.7421875, 22.7998046875, 24.857421875, 26.9150390625, 28.97265625, 31.0302734375, 33.087890625, 35.1455078125, 37.203125, 39.2607421875, 41.318359375, 43.3759765625, 45.43359375, 47.4912109375, 49.548828125, 51.6064453125, 53.6640625, 55.7216796875, 57.779296875, 59.8369140625, 61.89453125, 63.9521484375, 66.009765625, 68.0673828125, 70.125]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 13.0, 65.0, 249.0, 384.0, 220.0, 65.0, 18.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-221.6351776123047, -215.203369140625, -208.7715606689453, -202.33975219726562, -195.907958984375, -189.4761505126953, -183.04434204101562, -176.61253356933594, -170.18072509765625, -163.74891662597656, -157.31710815429688, -150.88531494140625, -144.45350646972656, -138.02169799804688, -131.5898895263672, -125.1580810546875, -118.72628784179688, -112.29447937011719, -105.86267852783203, -99.43087005615234, -92.99906921386719, -86.5672607421875, -80.13545227050781, -73.70364379882812, -67.27184295654297, -60.84003829956055, -54.408233642578125, -47.97642517089844, -41.544620513916016, -35.112815856933594, -28.681007385253906, -22.249202728271484, -15.817398071289062, -9.385592460632324, -2.953786849975586, 3.4780197143554688, 9.90982437133789, 16.341629028320312, 22.7734375, 29.205242156982422, 35.637046813964844, 42.068851470947266, 48.50065612792969, 54.932464599609375, 61.3642692565918, 67.79607391357422, 74.2278823852539, 80.65968322753906, 87.09149169921875, 93.52330017089844, 99.9551010131836, 106.38690948486328, 112.81871032714844, 119.25051879882812, 125.68232727050781, 132.1141357421875, 138.54592895507812, 144.9777374267578, 151.4095458984375, 157.84133911132812, 164.2731475830078, 170.7049560546875, 177.1367645263672, 183.56857299804688, 190.00038146972656]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 7.0, 7.0, 4.0, 8.0, 11.0, 8.0, 9.0, 14.0, 18.0, 15.0, 24.0, 25.0, 32.0, 33.0, 29.0, 32.0, 33.0, 39.0, 50.0, 34.0, 47.0, 37.0, 51.0, 46.0, 41.0, 41.0, 42.0, 28.0, 25.0, 31.0, 28.0, 27.0, 23.0, 20.0, 18.0, 17.0, 13.0, 12.0, 7.0, 6.0, 3.0, 1.0, 1.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-52.1146240234375, -50.40224075317383, -48.68985366821289, -46.97747039794922, -45.26508712768555, -43.552703857421875, -41.84031677246094, -40.127933502197266, -38.415550231933594, -36.70316696166992, -34.990779876708984, -33.27839660644531, -31.56601333618164, -29.853628158569336, -28.14124298095703, -26.42885971069336, -24.716474533081055, -23.00408935546875, -21.291706085205078, -19.579320907592773, -17.8669376373291, -16.154552459716797, -14.442168235778809, -12.72978401184082, -11.017399787902832, -9.305015563964844, -7.5926313400268555, -5.880246639251709, -4.167862415313721, -2.455477714538574, -0.7430934906005859, 0.9692907333374023, 2.6816749572753906, 4.394059181213379, 6.106443405151367, 7.818828105926514, 9.531211853027344, 11.243597030639648, 12.955981254577637, 14.668365478515625, 16.380748748779297, 18.0931339263916, 19.805517196655273, 21.517902374267578, 23.23028564453125, 24.942670822143555, 26.65505599975586, 28.36743927001953, 30.079824447631836, 31.79220962524414, 33.50459289550781, 35.216976165771484, 36.92936325073242, 38.641746520996094, 40.354129791259766, 42.06651306152344, 43.778900146484375, 45.49128341674805, 47.203670501708984, 48.916053771972656, 50.62843704223633, 52.3408203125, 54.05320739746094, 55.76559066772461, 57.47797393798828]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 9.0, 13.0, 13.0, 12.0, 25.0, 21.0, 37.0, 30.0, 42.0, 45.0, 42.0, 48.0, 45.0, 58.0, 50.0, 57.0, 48.0, 53.0, 57.0, 39.0, 47.0, 30.0, 31.0, 35.0, 21.0, 16.0, 23.0, 14.0, 8.0, 8.0, 3.0, 8.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.11328125, -6.86065673828125, -6.6080322265625, -6.35540771484375, -6.102783203125, -5.85015869140625, -5.5975341796875, -5.34490966796875, -5.09228515625, -4.83966064453125, -4.5870361328125, -4.33441162109375, -4.081787109375, -3.82916259765625, -3.5765380859375, -3.32391357421875, -3.0712890625, -2.81866455078125, -2.5660400390625, -2.31341552734375, -2.060791015625, -1.80816650390625, -1.5555419921875, -1.30291748046875, -1.05029296875, -0.79766845703125, -0.5450439453125, -0.29241943359375, -0.039794921875, 0.21282958984375, 0.4654541015625, 0.71807861328125, 0.970703125, 1.22332763671875, 1.4759521484375, 1.72857666015625, 1.981201171875, 2.23382568359375, 2.4864501953125, 2.73907470703125, 2.99169921875, 3.24432373046875, 3.4969482421875, 3.74957275390625, 4.002197265625, 4.25482177734375, 4.5074462890625, 4.76007080078125, 5.0126953125, 5.26531982421875, 5.5179443359375, 5.77056884765625, 6.023193359375, 6.27581787109375, 6.5284423828125, 6.78106689453125, 7.03369140625, 7.28631591796875, 7.5389404296875, 7.79156494140625, 8.044189453125, 8.29681396484375, 8.5494384765625, 8.80206298828125, 9.0546875]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 6.0, 3.0, 12.0, 16.0, 18.0, 23.0, 30.0, 61.0, 84.0, 137.0, 202.0, 324.0, 551.0, 881.0, 1458.0, 2474.0, 4289.0, 7592.0, 13486.0, 24114.0, 45309.0, 88846.0, 215250.0, 374999.0, 131436.0, 62443.0, 32620.0, 17956.0, 9988.0, 5666.0, 3324.0, 1959.0, 1166.0, 695.0, 400.0, 257.0, 166.0, 91.0, 73.0, 56.0, 28.0, 21.0, 11.0, 13.0, 11.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.662109375, -1.608917236328125, -1.55572509765625, -1.502532958984375, -1.4493408203125, -1.396148681640625, -1.34295654296875, -1.289764404296875, -1.236572265625, -1.183380126953125, -1.13018798828125, -1.076995849609375, -1.0238037109375, -0.970611572265625, -0.91741943359375, -0.864227294921875, -0.81103515625, -0.757843017578125, -0.70465087890625, -0.651458740234375, -0.5982666015625, -0.545074462890625, -0.49188232421875, -0.438690185546875, -0.385498046875, -0.332305908203125, -0.27911376953125, -0.225921630859375, -0.1727294921875, -0.119537353515625, -0.06634521484375, -0.013153076171875, 0.0400390625, 0.093231201171875, 0.14642333984375, 0.199615478515625, 0.2528076171875, 0.305999755859375, 0.35919189453125, 0.412384033203125, 0.465576171875, 0.518768310546875, 0.57196044921875, 0.625152587890625, 0.6783447265625, 0.731536865234375, 0.78472900390625, 0.837921142578125, 0.89111328125, 0.944305419921875, 0.99749755859375, 1.050689697265625, 1.1038818359375, 1.157073974609375, 1.21026611328125, 1.263458251953125, 1.316650390625, 1.369842529296875, 1.42303466796875, 1.476226806640625, 1.5294189453125, 1.582611083984375, 1.63580322265625, 1.688995361328125, 1.7421875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 8.0, 5.0, 3.0, 9.0, 12.0, 14.0, 15.0, 19.0, 18.0, 17.0, 26.0, 20.0, 23.0, 25.0, 47.0, 20.0, 37.0, 39.0, 35.0, 38.0, 30.0, 1067.0, 55.0, 36.0, 26.0, 36.0, 35.0, 36.0, 35.0, 34.0, 30.0, 28.0, 23.0, 21.0, 24.0, 12.0, 20.0, 7.0, 9.0, 4.0, 9.0, 4.0, 5.0, 3.0, 6.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.380859375, -3.258026123046875, -3.13519287109375, -3.012359619140625, -2.8895263671875, -2.766693115234375, -2.64385986328125, -2.521026611328125, -2.398193359375, -2.275360107421875, -2.15252685546875, -2.029693603515625, -1.9068603515625, -1.784027099609375, -1.66119384765625, -1.538360595703125, -1.41552734375, -1.292694091796875, -1.16986083984375, -1.047027587890625, -0.9241943359375, -0.801361083984375, -0.67852783203125, -0.555694580078125, -0.432861328125, -0.310028076171875, -0.18719482421875, -0.064361572265625, 0.0584716796875, 0.181304931640625, 0.30413818359375, 0.426971435546875, 0.5498046875, 0.672637939453125, 0.79547119140625, 0.918304443359375, 1.0411376953125, 1.163970947265625, 1.28680419921875, 1.409637451171875, 1.532470703125, 1.655303955078125, 1.77813720703125, 1.900970458984375, 2.0238037109375, 2.146636962890625, 2.26947021484375, 2.392303466796875, 2.51513671875, 2.637969970703125, 2.76080322265625, 2.883636474609375, 3.0064697265625, 3.129302978515625, 3.25213623046875, 3.374969482421875, 3.497802734375, 3.620635986328125, 3.74346923828125, 3.866302490234375, 3.9891357421875, 4.111968994140625, 4.23480224609375, 4.357635498046875, 4.48046875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 7.0, 8.0, 10.0, 22.0, 27.0, 58.0, 69.0, 98.0, 153.0, 231.0, 353.0, 526.0, 776.0, 1177.0, 1791.0, 2691.0, 4169.0, 6454.0, 10117.0, 16091.0, 25896.0, 43400.0, 73491.0, 133518.0, 1361472.0, 184491.0, 91894.0, 52914.0, 31552.0, 19428.0, 12134.0, 7887.0, 5000.0, 3043.0, 2197.0, 1368.0, 885.0, 555.0, 392.0, 234.0, 179.0, 134.0, 61.0, 51.0, 49.0, 34.0, 15.0, 9.0, 9.0, 9.0, 7.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0], "bins": [-1.2353515625, -1.196380615234375, -1.15740966796875, -1.118438720703125, -1.0794677734375, -1.040496826171875, -1.00152587890625, -0.962554931640625, -0.923583984375, -0.884613037109375, -0.84564208984375, -0.806671142578125, -0.7677001953125, -0.728729248046875, -0.68975830078125, -0.650787353515625, -0.61181640625, -0.572845458984375, -0.53387451171875, -0.494903564453125, -0.4559326171875, -0.416961669921875, -0.37799072265625, -0.339019775390625, -0.300048828125, -0.261077880859375, -0.22210693359375, -0.183135986328125, -0.1441650390625, -0.105194091796875, -0.06622314453125, -0.027252197265625, 0.01171875, 0.050689697265625, 0.08966064453125, 0.128631591796875, 0.1676025390625, 0.206573486328125, 0.24554443359375, 0.284515380859375, 0.323486328125, 0.362457275390625, 0.40142822265625, 0.440399169921875, 0.4793701171875, 0.518341064453125, 0.55731201171875, 0.596282958984375, 0.63525390625, 0.674224853515625, 0.71319580078125, 0.752166748046875, 0.7911376953125, 0.830108642578125, 0.86907958984375, 0.908050537109375, 0.947021484375, 0.985992431640625, 1.02496337890625, 1.063934326171875, 1.1029052734375, 1.141876220703125, 1.18084716796875, 1.219818115234375, 1.2587890625]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 7.0, 8.0, 5.0, 8.0, 15.0, 11.0, 19.0, 27.0, 28.0, 25.0, 45.0, 48.0, 57.0, 61.0, 71.0, 81.0, 69.0, 62.0, 72.0, 45.0, 41.0, 27.0, 30.0, 20.0, 14.0, 24.0, 17.0, 12.0, 10.0, 4.0, 7.0, 3.0, 5.0, 7.0, 5.0, 0.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006532669067382812, -0.0006332471966743469, -0.0006132274866104126, -0.0005932077765464783, -0.0005731880664825439, -0.0005531683564186096, -0.0005331486463546753, -0.000513128936290741, -0.0004931092262268066, -0.0004730895161628723, -0.000453069806098938, -0.00043305009603500366, -0.00041303038597106934, -0.000393010675907135, -0.0003729909658432007, -0.00035297125577926636, -0.00033295154571533203, -0.0003129318356513977, -0.0002929121255874634, -0.00027289241552352905, -0.0002528727054595947, -0.0002328529953956604, -0.00021283328533172607, -0.00019281357526779175, -0.00017279386520385742, -0.0001527741551399231, -0.00013275444507598877, -0.00011273473501205444, -9.271502494812012e-05, -7.269531488418579e-05, -5.2675604820251465e-05, -3.265589475631714e-05, -1.2636184692382812e-05, 7.383525371551514e-06, 2.740323543548584e-05, 4.7422945499420166e-05, 6.744265556335449e-05, 8.746236562728882e-05, 0.00010748207569122314, 0.00012750178575515747, 0.0001475214958190918, 0.00016754120588302612, 0.00018756091594696045, 0.00020758062601089478, 0.0002276003360748291, 0.00024762004613876343, 0.00026763975620269775, 0.0002876594662666321, 0.0003076791763305664, 0.00032769888639450073, 0.00034771859645843506, 0.0003677383065223694, 0.0003877580165863037, 0.00040777772665023804, 0.00042779743671417236, 0.0004478171467781067, 0.000467836856842041, 0.00048785656690597534, 0.0005078762769699097, 0.000527895987033844, 0.0005479156970977783, 0.0005679354071617126, 0.000587955117225647, 0.0006079748272895813, 0.0006279945373535156]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 1.0, 6.0, 4.0, 6.0, 6.0, 14.0, 13.0, 18.0, 20.0, 24.0, 33.0, 32.0, 52.0, 69.0, 97.0, 155.0, 285.0, 616.0, 5084.0, 1022072.0, 18276.0, 725.0, 317.0, 196.0, 119.0, 69.0, 53.0, 40.0, 31.0, 26.0, 21.0, 17.0, 9.0, 10.0, 6.0, 8.0, 4.0, 4.0, 1.0, 6.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01221466064453125, -0.011787652969360352, -0.011360645294189453, -0.010933637619018555, -0.010506629943847656, -0.010079622268676758, -0.00965261459350586, -0.009225606918334961, -0.008798599243164062, -0.008371591567993164, -0.007944583892822266, -0.007517576217651367, -0.007090568542480469, -0.00666356086730957, -0.006236553192138672, -0.0058095455169677734, -0.005382537841796875, -0.0049555301666259766, -0.004528522491455078, -0.00410151481628418, -0.0036745071411132812, -0.003247499465942383, -0.0028204917907714844, -0.002393484115600586, -0.0019664764404296875, -0.001539468765258789, -0.0011124610900878906, -0.0006854534149169922, -0.00025844573974609375, 0.0001685619354248047, 0.0005955696105957031, 0.0010225772857666016, 0.0014495849609375, 0.0018765926361083984, 0.002303600311279297, 0.0027306079864501953, 0.0031576156616210938, 0.003584623336791992, 0.004011631011962891, 0.004438638687133789, 0.0048656463623046875, 0.005292654037475586, 0.005719661712646484, 0.006146669387817383, 0.006573677062988281, 0.00700068473815918, 0.007427692413330078, 0.007854700088500977, 0.008281707763671875, 0.008708715438842773, 0.009135723114013672, 0.00956273078918457, 0.009989738464355469, 0.010416746139526367, 0.010843753814697266, 0.011270761489868164, 0.011697769165039062, 0.012124776840209961, 0.01255178451538086, 0.012978792190551758, 0.013405799865722656, 0.013832807540893555, 0.014259815216064453, 0.014686822891235352, 0.01511383056640625]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 7.0, 19.0, 48.0, 159.0, 280.0, 259.0, 158.0, 60.0, 12.0, 7.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00047273054951801896, -0.00044487009290605783, -0.0004170096362940967, -0.0003891491796821356, -0.00036128872307017446, -0.00033342826645821333, -0.0003055678098462522, -0.0002777073532342911, -0.00024984689662232995, -0.00022198644001036882, -0.0001941259833984077, -0.00016626552678644657, -0.00013840507017448545, -0.00011054461356252432, -8.268415695056319e-05, -5.4823700338602066e-05, -2.696324372664094e-05, 8.972128853201866e-07, 2.8757669497281313e-05, 5.661812610924244e-05, 8.447858272120357e-05, 0.00011233903933316469, 0.00014019949594512582, 0.00016805995255708694, 0.00019592040916904807, 0.0002237808657810092, 0.0002516413223929703, 0.00027950177900493145, 0.0003073622356168926, 0.0003352226922288537, 0.00036308314884081483, 0.00039094360545277596, 0.000418804120272398, 0.0004466645768843591, 0.00047452503349632025, 0.0005023854901082814, 0.0005302459467202425, 0.0005581064033322036, 0.0005859668599441648, 0.0006138273165561259, 0.000641687773168087, 0.0006695482297800481, 0.0006974086863920093, 0.0007252691430039704, 0.0007531295996159315, 0.0007809900562278926, 0.0008088505128398538, 0.0008367109694518149, 0.000864571426063776, 0.0008924318826757371, 0.0009202923392876983, 0.0009481527958996594, 0.0009760132525116205, 0.0010038737673312426, 0.0010317341657355428, 0.001059594564139843, 0.001087455078959465, 0.001115315593779087, 0.0011431759921833873, 0.0011710363905876875, 0.0011988969054073095, 0.0012267574202269316, 0.0012546178186312318, 0.001282478217035532, 0.001310338731855154]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 6.0, 5.0, 4.0, 7.0, 7.0, 8.0, 12.0, 21.0, 16.0, 20.0, 16.0, 26.0, 28.0, 27.0, 30.0, 30.0, 32.0, 29.0, 34.0, 36.0, 35.0, 33.0, 28.0, 33.0, 32.0, 27.0, 42.0, 38.0, 41.0, 39.0, 28.0, 23.0, 32.0, 26.0, 16.0, 20.0, 16.0, 14.0, 10.0, 14.0, 9.0, 9.0, 11.0, 8.0, 3.0, 9.0, 1.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.00026172399520874023, -0.00025298167020082474, -0.00024423934519290924, -0.00023549702018499374, -0.00022675469517707825, -0.00021801237016916275, -0.00020927004516124725, -0.00020052772015333176, -0.00019178539514541626, -0.00018304307013750076, -0.00017430074512958527, -0.00016555842012166977, -0.00015681609511375427, -0.00014807377010583878, -0.00013933144509792328, -0.00013058912009000778, -0.00012184679508209229, -0.00011310447007417679, -0.00010436214506626129, -9.56198200583458e-05, -8.68774950504303e-05, -7.81351700425148e-05, -6.93928450345993e-05, -6.065052002668381e-05, -5.190819501876831e-05, -4.3165870010852814e-05, -3.442354500293732e-05, -2.568121999502182e-05, -1.6938894987106323e-05, -8.196569979190826e-06, 5.457550287246704e-07, 9.288080036640167e-06, 1.8030405044555664e-05, 2.677273005247116e-05, 3.551505506038666e-05, 4.4257380068302155e-05, 5.299970507621765e-05, 6.174203008413315e-05, 7.048435509204865e-05, 7.922668009996414e-05, 8.796900510787964e-05, 9.671133011579514e-05, 0.00010545365512371063, 0.00011419598013162613, 0.00012293830513954163, 0.00013168063014745712, 0.00014042295515537262, 0.00014916528016328812, 0.0001579076051712036, 0.0001666499301791191, 0.0001753922551870346, 0.0001841345801949501, 0.0001928769052028656, 0.0002016192302107811, 0.0002103615552186966, 0.0002191038802266121, 0.0002278462052345276, 0.00023658853024244308, 0.0002453308552503586, 0.0002540731802582741, 0.0002628155052661896, 0.00027155783027410507, 0.00028030015528202057, 0.00028904248028993607, 0.00029778480529785156]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 9.0, 13.0, 13.0, 12.0, 25.0, 21.0, 37.0, 30.0, 42.0, 45.0, 42.0, 48.0, 45.0, 58.0, 50.0, 57.0, 48.0, 53.0, 57.0, 39.0, 47.0, 30.0, 31.0, 35.0, 21.0, 16.0, 23.0, 14.0, 8.0, 8.0, 3.0, 8.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.11328125, -6.86065673828125, -6.6080322265625, -6.35540771484375, -6.102783203125, -5.85015869140625, -5.5975341796875, -5.34490966796875, -5.09228515625, -4.83966064453125, -4.5870361328125, -4.33441162109375, -4.081787109375, -3.82916259765625, -3.5765380859375, -3.32391357421875, -3.0712890625, -2.81866455078125, -2.5660400390625, -2.31341552734375, -2.060791015625, -1.80816650390625, -1.5555419921875, -1.30291748046875, -1.05029296875, -0.79766845703125, -0.5450439453125, -0.29241943359375, -0.039794921875, 0.21282958984375, 0.4654541015625, 0.71807861328125, 0.970703125, 1.22332763671875, 1.4759521484375, 1.72857666015625, 1.981201171875, 2.23382568359375, 2.4864501953125, 2.73907470703125, 2.99169921875, 3.24432373046875, 3.4969482421875, 3.74957275390625, 4.002197265625, 4.25482177734375, 4.5074462890625, 4.76007080078125, 5.0126953125, 5.26531982421875, 5.5179443359375, 5.77056884765625, 6.023193359375, 6.27581787109375, 6.5284423828125, 6.78106689453125, 7.03369140625, 7.28631591796875, 7.5389404296875, 7.79156494140625, 8.044189453125, 8.29681396484375, 8.5494384765625, 8.80206298828125, 9.0546875]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 14.0, 17.0, 17.0, 28.0, 36.0, 79.0, 112.0, 201.0, 358.0, 570.0, 1163.0, 2037.0, 3858.0, 8354.0, 19976.0, 55491.0, 203252.0, 512325.0, 161469.0, 46785.0, 17305.0, 7425.0, 3526.0, 1850.0, 969.0, 543.0, 286.0, 169.0, 128.0, 70.0, 40.0, 23.0, 24.0, 20.0, 9.0, 7.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.69140625, -4.52032470703125, -4.3492431640625, -4.17816162109375, -4.007080078125, -3.83599853515625, -3.6649169921875, -3.49383544921875, -3.32275390625, -3.15167236328125, -2.9805908203125, -2.80950927734375, -2.638427734375, -2.46734619140625, -2.2962646484375, -2.12518310546875, -1.9541015625, -1.78302001953125, -1.6119384765625, -1.44085693359375, -1.269775390625, -1.09869384765625, -0.9276123046875, -0.75653076171875, -0.58544921875, -0.41436767578125, -0.2432861328125, -0.07220458984375, 0.098876953125, 0.26995849609375, 0.4410400390625, 0.61212158203125, 0.783203125, 0.95428466796875, 1.1253662109375, 1.29644775390625, 1.467529296875, 1.63861083984375, 1.8096923828125, 1.98077392578125, 2.15185546875, 2.32293701171875, 2.4940185546875, 2.66510009765625, 2.836181640625, 3.00726318359375, 3.1783447265625, 3.34942626953125, 3.5205078125, 3.69158935546875, 3.8626708984375, 4.03375244140625, 4.204833984375, 4.37591552734375, 4.5469970703125, 4.71807861328125, 4.88916015625, 5.06024169921875, 5.2313232421875, 5.40240478515625, 5.573486328125, 5.74456787109375, 5.9156494140625, 6.08673095703125, 6.2578125]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 4.0, 2.0, 6.0, 6.0, 9.0, 13.0, 12.0, 16.0, 19.0, 19.0, 24.0, 25.0, 42.0, 24.0, 35.0, 49.0, 55.0, 60.0, 50.0, 188.0, 1774.0, 147.0, 67.0, 50.0, 42.0, 34.0, 33.0, 32.0, 29.0, 24.0, 37.0, 26.0, 20.0, 18.0, 17.0, 10.0, 6.0, 5.0, 3.0, 9.0, 5.0, 6.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-23.828125, -23.093505859375, -22.35888671875, -21.624267578125, -20.8896484375, -20.155029296875, -19.42041015625, -18.685791015625, -17.951171875, -17.216552734375, -16.48193359375, -15.747314453125, -15.0126953125, -14.278076171875, -13.54345703125, -12.808837890625, -12.07421875, -11.339599609375, -10.60498046875, -9.870361328125, -9.1357421875, -8.401123046875, -7.66650390625, -6.931884765625, -6.197265625, -5.462646484375, -4.72802734375, -3.993408203125, -3.2587890625, -2.524169921875, -1.78955078125, -1.054931640625, -0.3203125, 0.414306640625, 1.14892578125, 1.883544921875, 2.6181640625, 3.352783203125, 4.08740234375, 4.822021484375, 5.556640625, 6.291259765625, 7.02587890625, 7.760498046875, 8.4951171875, 9.229736328125, 9.96435546875, 10.698974609375, 11.43359375, 12.168212890625, 12.90283203125, 13.637451171875, 14.3720703125, 15.106689453125, 15.84130859375, 16.575927734375, 17.310546875, 18.045166015625, 18.77978515625, 19.514404296875, 20.2490234375, 20.983642578125, 21.71826171875, 22.452880859375, 23.1875]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 6.0, 9.0, 6.0, 11.0, 9.0, 17.0, 25.0, 28.0, 34.0, 58.0, 49.0, 76.0, 118.0, 172.0, 230.0, 420.0, 1426.0, 56676.0, 3079010.0, 5602.0, 715.0, 326.0, 193.0, 140.0, 80.0, 71.0, 54.0, 27.0, 29.0, 24.0, 17.0, 16.0, 10.0, 5.0, 8.0, 3.0, 6.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-55.65625, -53.931640625, -52.20703125, -50.482421875, -48.7578125, -47.033203125, -45.30859375, -43.583984375, -41.859375, -40.134765625, -38.41015625, -36.685546875, -34.9609375, -33.236328125, -31.51171875, -29.787109375, -28.0625, -26.337890625, -24.61328125, -22.888671875, -21.1640625, -19.439453125, -17.71484375, -15.990234375, -14.265625, -12.541015625, -10.81640625, -9.091796875, -7.3671875, -5.642578125, -3.91796875, -2.193359375, -0.46875, 1.255859375, 2.98046875, 4.705078125, 6.4296875, 8.154296875, 9.87890625, 11.603515625, 13.328125, 15.052734375, 16.77734375, 18.501953125, 20.2265625, 21.951171875, 23.67578125, 25.400390625, 27.125, 28.849609375, 30.57421875, 32.298828125, 34.0234375, 35.748046875, 37.47265625, 39.197265625, 40.921875, 42.646484375, 44.37109375, 46.095703125, 47.8203125, 49.544921875, 51.26953125, 52.994140625, 54.71875]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 21.0, 983.0, 17.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.77444076538086, -42.39189910888672, -33.009361267089844, -23.626819610595703, -14.244277954101562, -4.861736297607422, 4.520801544189453, 13.90334701538086, 23.285884857177734, 32.668426513671875, 42.05096435546875, 51.43350601196289, 60.81604766845703, 70.19859313964844, 79.58113098144531, 88.96366882324219, 98.34620666503906, 107.72874450683594, 117.11128997802734, 126.49382781982422, 135.87637329101562, 145.2589111328125, 154.64144897460938, 164.02398681640625, 173.4065399169922, 182.78907775878906, 192.17161560058594, 201.55416870117188, 210.93670654296875, 220.31924438476562, 229.7017822265625, 239.08432006835938, 248.46688842773438, 257.84942626953125, 267.2319641113281, 276.614501953125, 285.9970397949219, 295.37957763671875, 304.76214599609375, 314.1446838378906, 323.5272216796875, 332.9097595214844, 342.29229736328125, 351.6748352050781, 361.057373046875, 370.43994140625, 379.82244873046875, 389.20501708984375, 398.5875244140625, 407.9700622558594, 417.35260009765625, 426.7351379394531, 436.11767578125, 445.500244140625, 454.88275146484375, 464.26531982421875, 473.6478576660156, 483.0303955078125, 492.4129333496094, 501.79547119140625, 511.1780090332031, 520.560546875, 529.943115234375, 539.3256225585938, 548.7081909179688]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 7.0, 4.0, 2.0, 2.0, 6.0, 11.0, 18.0, 12.0, 21.0, 10.0, 27.0, 22.0, 34.0, 30.0, 27.0, 38.0, 29.0, 42.0, 35.0, 34.0, 39.0, 34.0, 37.0, 48.0, 38.0, 35.0, 31.0, 44.0, 33.0, 29.0, 28.0, 27.0, 25.0, 21.0, 21.0, 15.0, 14.0, 19.0, 6.0, 9.0, 8.0, 5.0, 7.0, 4.0, 10.0, 3.0, 1.0, 2.0, 1.0, 3.0], "bins": [-60.87410354614258, -59.21186447143555, -57.54962158203125, -55.88738250732422, -54.22514343261719, -52.56290054321289, -50.90066146850586, -49.23841857910156, -47.57617950439453, -45.9139404296875, -44.2516975402832, -42.58945846557617, -40.927215576171875, -39.264976501464844, -37.60273742675781, -35.94049835205078, -34.278255462646484, -32.61601638793945, -30.953773498535156, -29.291534423828125, -27.62929344177246, -25.967052459716797, -24.304813385009766, -22.6425724029541, -20.980331420898438, -19.318090438842773, -17.65584945678711, -15.993610382080078, -14.331369400024414, -12.66912841796875, -11.006888389587402, -9.344648361206055, -7.682403564453125, -6.020163059234619, -4.357922554016113, -2.6956820487976074, -1.0334415435791016, 0.6287994384765625, 2.29103946685791, 3.953279495239258, 5.615520477294922, 7.277760982513428, 8.940001487731934, 10.602241516113281, 12.264482498168945, 13.92672348022461, 15.588963508605957, 17.251203536987305, 18.91344451904297, 20.575685501098633, 22.237926483154297, 23.900165557861328, 25.562406539916992, 27.224647521972656, 28.886886596679688, 30.54912757873535, 32.211368560791016, 33.87360763549805, 35.535850524902344, 37.198089599609375, 38.860328674316406, 40.5225715637207, 42.184810638427734, 43.84705352783203, 45.50929260253906]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 9.0, 10.0, 9.0, 19.0, 11.0, 17.0, 23.0, 35.0, 43.0, 34.0, 39.0, 40.0, 45.0, 46.0, 59.0, 56.0, 45.0, 57.0, 51.0, 47.0, 40.0, 47.0, 39.0, 25.0, 31.0, 21.0, 24.0, 19.0, 19.0, 11.0, 9.0, 6.0, 5.0, 7.0, 3.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.1484375, -6.8961181640625, -6.643798828125, -6.3914794921875, -6.13916015625, -5.8868408203125, -5.634521484375, -5.3822021484375, -5.1298828125, -4.8775634765625, -4.625244140625, -4.3729248046875, -4.12060546875, -3.8682861328125, -3.615966796875, -3.3636474609375, -3.111328125, -2.8590087890625, -2.606689453125, -2.3543701171875, -2.10205078125, -1.8497314453125, -1.597412109375, -1.3450927734375, -1.0927734375, -0.8404541015625, -0.588134765625, -0.3358154296875, -0.08349609375, 0.1688232421875, 0.421142578125, 0.6734619140625, 0.92578125, 1.1781005859375, 1.430419921875, 1.6827392578125, 1.93505859375, 2.1873779296875, 2.439697265625, 2.6920166015625, 2.9443359375, 3.1966552734375, 3.448974609375, 3.7012939453125, 3.95361328125, 4.2059326171875, 4.458251953125, 4.7105712890625, 4.962890625, 5.2152099609375, 5.467529296875, 5.7198486328125, 5.97216796875, 6.2244873046875, 6.476806640625, 6.7291259765625, 6.9814453125, 7.2337646484375, 7.486083984375, 7.7384033203125, 7.99072265625, 8.2430419921875, 8.495361328125, 8.7476806640625, 9.0]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 10.0, 9.0, 10.0, 14.0, 20.0, 19.0, 34.0, 33.0, 41.0, 42.0, 66.0, 128.0, 199.0, 572.0, 13536.0, 3810545.0, 366263.0, 1955.0, 293.0, 145.0, 92.0, 67.0, 42.0, 24.0, 18.0, 22.0, 21.0, 16.0, 12.0, 10.0, 8.0, 9.0, 4.0, 3.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.625, -40.17724609375, -38.7294921875, -37.28173828125, -35.833984375, -34.38623046875, -32.9384765625, -31.49072265625, -30.04296875, -28.59521484375, -27.1474609375, -25.69970703125, -24.251953125, -22.80419921875, -21.3564453125, -19.90869140625, -18.4609375, -17.01318359375, -15.5654296875, -14.11767578125, -12.669921875, -11.22216796875, -9.7744140625, -8.32666015625, -6.87890625, -5.43115234375, -3.9833984375, -2.53564453125, -1.087890625, 0.35986328125, 1.8076171875, 3.25537109375, 4.703125, 6.15087890625, 7.5986328125, 9.04638671875, 10.494140625, 11.94189453125, 13.3896484375, 14.83740234375, 16.28515625, 17.73291015625, 19.1806640625, 20.62841796875, 22.076171875, 23.52392578125, 24.9716796875, 26.41943359375, 27.8671875, 29.31494140625, 30.7626953125, 32.21044921875, 33.658203125, 35.10595703125, 36.5537109375, 38.00146484375, 39.44921875, 40.89697265625, 42.3447265625, 43.79248046875, 45.240234375, 46.68798828125, 48.1357421875, 49.58349609375, 51.03125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 8.0, 8.0, 15.0, 20.0, 33.0, 58.0, 63.0, 92.0, 131.0, 203.0, 264.0, 434.0, 519.0, 558.0, 484.0, 370.0, 252.0, 169.0, 134.0, 81.0, 62.0, 29.0, 29.0, 20.0, 11.0, 9.0, 5.0, 3.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.75, -16.179931640625, -15.60986328125, -15.039794921875, -14.4697265625, -13.899658203125, -13.32958984375, -12.759521484375, -12.189453125, -11.619384765625, -11.04931640625, -10.479248046875, -9.9091796875, -9.339111328125, -8.76904296875, -8.198974609375, -7.62890625, -7.058837890625, -6.48876953125, -5.918701171875, -5.3486328125, -4.778564453125, -4.20849609375, -3.638427734375, -3.068359375, -2.498291015625, -1.92822265625, -1.358154296875, -0.7880859375, -0.218017578125, 0.35205078125, 0.922119140625, 1.4921875, 2.062255859375, 2.63232421875, 3.202392578125, 3.7724609375, 4.342529296875, 4.91259765625, 5.482666015625, 6.052734375, 6.622802734375, 7.19287109375, 7.762939453125, 8.3330078125, 8.903076171875, 9.47314453125, 10.043212890625, 10.61328125, 11.183349609375, 11.75341796875, 12.323486328125, 12.8935546875, 13.463623046875, 14.03369140625, 14.603759765625, 15.173828125, 15.743896484375, 16.31396484375, 16.884033203125, 17.4541015625, 18.024169921875, 18.59423828125, 19.164306640625, 19.734375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 7.0, 9.0, 4.0, 13.0, 15.0, 29.0, 40.0, 42.0, 54.0, 98.0, 130.0, 161.0, 247.0, 374.0, 807.0, 8220.0, 3782211.0, 397734.0, 2392.0, 597.0, 319.0, 215.0, 150.0, 105.0, 74.0, 56.0, 49.0, 33.0, 27.0, 19.0, 16.0, 15.0, 9.0, 5.0, 3.0, 7.0, 3.0, 1.0, 0.0, 1.0], "bins": [-92.75, -90.4775390625, -88.205078125, -85.9326171875, -83.66015625, -81.3876953125, -79.115234375, -76.8427734375, -74.5703125, -72.2978515625, -70.025390625, -67.7529296875, -65.48046875, -63.2080078125, -60.935546875, -58.6630859375, -56.390625, -54.1181640625, -51.845703125, -49.5732421875, -47.30078125, -45.0283203125, -42.755859375, -40.4833984375, -38.2109375, -35.9384765625, -33.666015625, -31.3935546875, -29.12109375, -26.8486328125, -24.576171875, -22.3037109375, -20.03125, -17.7587890625, -15.486328125, -13.2138671875, -10.94140625, -8.6689453125, -6.396484375, -4.1240234375, -1.8515625, 0.4208984375, 2.693359375, 4.9658203125, 7.23828125, 9.5107421875, 11.783203125, 14.0556640625, 16.328125, 18.6005859375, 20.873046875, 23.1455078125, 25.41796875, 27.6904296875, 29.962890625, 32.2353515625, 34.5078125, 36.7802734375, 39.052734375, 41.3251953125, 43.59765625, 45.8701171875, 48.142578125, 50.4150390625, 52.6875]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 26.0, 139.0, 326.0, 333.0, 153.0, 28.0, 7.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.12227630615234, -93.8685302734375, -87.61477661132812, -81.36102294921875, -75.1072769165039, -68.85353088378906, -62.59977722167969, -56.34602737426758, -50.09227752685547, -43.83852767944336, -37.58477783203125, -31.33102798461914, -25.07727813720703, -18.823528289794922, -12.569778442382812, -6.316028594970703, -0.06227874755859375, 6.191471099853516, 12.445220947265625, 18.698970794677734, 24.952720642089844, 31.206470489501953, 37.46022033691406, 43.71397018432617, 49.96772003173828, 56.22146987915039, 62.4752197265625, 68.72897338867188, 74.98271942138672, 81.23646545410156, 87.49021911621094, 93.74397277832031, 99.99771118164062, 106.25146484375, 112.50521087646484, 118.75895690917969, 125.01271057128906, 131.26646423339844, 137.52020263671875, 143.77395629882812, 150.0277099609375, 156.28146362304688, 162.53521728515625, 168.78895568847656, 175.04270935058594, 181.2964630126953, 187.55020141601562, 193.803955078125, 200.05770874023438, 206.31146240234375, 212.56521606445312, 218.81895446777344, 225.0727081298828, 231.3264617919922, 237.5802001953125, 243.83395385742188, 250.08770751953125, 256.3414611816406, 262.59521484375, 268.8489685058594, 275.10272216796875, 281.3564453125, 287.6101989746094, 293.86395263671875, 300.1177062988281]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 2.0, 9.0, 11.0, 14.0, 13.0, 21.0, 24.0, 20.0, 26.0, 40.0, 31.0, 36.0, 42.0, 57.0, 50.0, 52.0, 54.0, 59.0, 48.0, 59.0, 43.0, 51.0, 32.0, 33.0, 39.0, 28.0, 23.0, 15.0, 11.0, 15.0, 10.0, 12.0, 5.0, 5.0, 4.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-60.510009765625, -58.61606979370117, -56.72212600708008, -54.82818603515625, -52.934242248535156, -51.04030227661133, -49.1463623046875, -47.252418518066406, -45.35847854614258, -43.46453857421875, -41.570594787597656, -39.67665481567383, -37.78271484375, -35.888771057128906, -33.99483108520508, -32.10089111328125, -30.206947326660156, -28.313005447387695, -26.419063568115234, -24.525123596191406, -22.631181716918945, -20.737239837646484, -18.843299865722656, -16.949357986450195, -15.055416107177734, -13.161474227905273, -11.267533302307129, -9.373592376708984, -7.479650497436523, -5.5857086181640625, -3.691767692565918, -1.7978267669677734, 0.0961151123046875, 1.9900565147399902, 3.883997917175293, 5.777939319610596, 7.671880722045898, 9.56582260131836, 11.459763526916504, 13.353704452514648, 15.24764633178711, 17.14158821105957, 19.03553009033203, 20.92947006225586, 22.82341194152832, 24.71735382080078, 26.61129379272461, 28.50523567199707, 30.39917755126953, 32.29311752319336, 34.18706130981445, 36.08100128173828, 37.974945068359375, 39.8688850402832, 41.76282501220703, 43.656768798828125, 45.55070877075195, 47.44464874267578, 49.338592529296875, 51.2325325012207, 53.12647247314453, 55.020416259765625, 56.91435623168945, 58.80829620361328, 60.702239990234375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 3.0, 8.0, 8.0, 9.0, 16.0, 20.0, 22.0, 28.0, 36.0, 34.0, 28.0, 43.0, 54.0, 41.0, 39.0, 55.0, 46.0, 62.0, 42.0, 57.0, 52.0, 42.0, 51.0, 35.0, 26.0, 20.0, 20.0, 26.0, 17.0, 13.0, 10.0, 14.0, 7.0, 5.0, 7.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.15234375, -6.89715576171875, -6.6419677734375, -6.38677978515625, -6.131591796875, -5.87640380859375, -5.6212158203125, -5.36602783203125, -5.11083984375, -4.85565185546875, -4.6004638671875, -4.34527587890625, -4.090087890625, -3.83489990234375, -3.5797119140625, -3.32452392578125, -3.0693359375, -2.81414794921875, -2.5589599609375, -2.30377197265625, -2.048583984375, -1.79339599609375, -1.5382080078125, -1.28302001953125, -1.02783203125, -0.77264404296875, -0.5174560546875, -0.26226806640625, -0.007080078125, 0.24810791015625, 0.5032958984375, 0.75848388671875, 1.013671875, 1.26885986328125, 1.5240478515625, 1.77923583984375, 2.034423828125, 2.28961181640625, 2.5447998046875, 2.79998779296875, 3.05517578125, 3.31036376953125, 3.5655517578125, 3.82073974609375, 4.075927734375, 4.33111572265625, 4.5863037109375, 4.84149169921875, 5.0966796875, 5.35186767578125, 5.6070556640625, 5.86224365234375, 6.117431640625, 6.37261962890625, 6.6278076171875, 6.88299560546875, 7.13818359375, 7.39337158203125, 7.6485595703125, 7.90374755859375, 8.158935546875, 8.41412353515625, 8.6693115234375, 8.92449951171875, 9.1796875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 8.0, 14.0, 15.0, 22.0, 24.0, 49.0, 76.0, 111.0, 175.0, 292.0, 428.0, 741.0, 1292.0, 2074.0, 3557.0, 6000.0, 10460.0, 17992.0, 32450.0, 63812.0, 141146.0, 374865.0, 209202.0, 86460.0, 43164.0, 22765.0, 12973.0, 7475.0, 4363.0, 2578.0, 1581.0, 915.0, 547.0, 335.0, 220.0, 133.0, 81.0, 46.0, 39.0, 23.0, 24.0, 7.0, 7.0, 6.0, 5.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-1.853515625, -1.79852294921875, -1.7435302734375, -1.68853759765625, -1.633544921875, -1.57855224609375, -1.5235595703125, -1.46856689453125, -1.41357421875, -1.35858154296875, -1.3035888671875, -1.24859619140625, -1.193603515625, -1.13861083984375, -1.0836181640625, -1.02862548828125, -0.9736328125, -0.91864013671875, -0.8636474609375, -0.80865478515625, -0.753662109375, -0.69866943359375, -0.6436767578125, -0.58868408203125, -0.53369140625, -0.47869873046875, -0.4237060546875, -0.36871337890625, -0.313720703125, -0.25872802734375, -0.2037353515625, -0.14874267578125, -0.09375, -0.03875732421875, 0.0162353515625, 0.07122802734375, 0.126220703125, 0.18121337890625, 0.2362060546875, 0.29119873046875, 0.34619140625, 0.40118408203125, 0.4561767578125, 0.51116943359375, 0.566162109375, 0.62115478515625, 0.6761474609375, 0.73114013671875, 0.7861328125, 0.84112548828125, 0.8961181640625, 0.95111083984375, 1.006103515625, 1.06109619140625, 1.1160888671875, 1.17108154296875, 1.22607421875, 1.28106689453125, 1.3360595703125, 1.39105224609375, 1.446044921875, 1.50103759765625, 1.5560302734375, 1.61102294921875, 1.666015625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 6.0, 4.0, 8.0, 11.0, 15.0, 11.0, 14.0, 25.0, 22.0, 25.0, 21.0, 29.0, 37.0, 46.0, 39.0, 32.0, 46.0, 28.0, 39.0, 1066.0, 36.0, 41.0, 50.0, 46.0, 42.0, 33.0, 42.0, 32.0, 22.0, 28.0, 20.0, 12.0, 21.0, 17.0, 14.0, 10.0, 9.0, 3.0, 1.0, 2.0, 9.0, 5.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-4.234375, -4.09576416015625, -3.9571533203125, -3.81854248046875, -3.679931640625, -3.54132080078125, -3.4027099609375, -3.26409912109375, -3.12548828125, -2.98687744140625, -2.8482666015625, -2.70965576171875, -2.571044921875, -2.43243408203125, -2.2938232421875, -2.15521240234375, -2.0166015625, -1.87799072265625, -1.7393798828125, -1.60076904296875, -1.462158203125, -1.32354736328125, -1.1849365234375, -1.04632568359375, -0.90771484375, -0.76910400390625, -0.6304931640625, -0.49188232421875, -0.353271484375, -0.21466064453125, -0.0760498046875, 0.06256103515625, 0.201171875, 0.33978271484375, 0.4783935546875, 0.61700439453125, 0.755615234375, 0.89422607421875, 1.0328369140625, 1.17144775390625, 1.31005859375, 1.44866943359375, 1.5872802734375, 1.72589111328125, 1.864501953125, 2.00311279296875, 2.1417236328125, 2.28033447265625, 2.4189453125, 2.55755615234375, 2.6961669921875, 2.83477783203125, 2.973388671875, 3.11199951171875, 3.2506103515625, 3.38922119140625, 3.52783203125, 3.66644287109375, 3.8050537109375, 3.94366455078125, 4.082275390625, 4.22088623046875, 4.3594970703125, 4.49810791015625, 4.63671875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 5.0, 5.0, 5.0, 2.0, 4.0, 20.0, 12.0, 25.0, 35.0, 45.0, 75.0, 97.0, 103.0, 197.0, 266.0, 384.0, 532.0, 725.0, 1042.0, 1558.0, 2266.0, 3346.0, 5033.0, 7647.0, 11696.0, 18431.0, 29725.0, 49535.0, 85784.0, 163310.0, 1353591.0, 152642.0, 81519.0, 47665.0, 28420.0, 17680.0, 11387.0, 7317.0, 4825.0, 3129.0, 2191.0, 1458.0, 981.0, 694.0, 497.0, 359.0, 241.0, 179.0, 103.0, 85.0, 79.0, 70.0, 28.0, 19.0, 27.0, 14.0, 11.0, 5.0, 3.0, 6.0, 5.0, 6.0, 3.0], "bins": [-1.244140625, -1.20458984375, -1.1650390625, -1.12548828125, -1.0859375, -1.04638671875, -1.0068359375, -0.96728515625, -0.927734375, -0.88818359375, -0.8486328125, -0.80908203125, -0.76953125, -0.72998046875, -0.6904296875, -0.65087890625, -0.611328125, -0.57177734375, -0.5322265625, -0.49267578125, -0.453125, -0.41357421875, -0.3740234375, -0.33447265625, -0.294921875, -0.25537109375, -0.2158203125, -0.17626953125, -0.13671875, -0.09716796875, -0.0576171875, -0.01806640625, 0.021484375, 0.06103515625, 0.1005859375, 0.14013671875, 0.1796875, 0.21923828125, 0.2587890625, 0.29833984375, 0.337890625, 0.37744140625, 0.4169921875, 0.45654296875, 0.49609375, 0.53564453125, 0.5751953125, 0.61474609375, 0.654296875, 0.69384765625, 0.7333984375, 0.77294921875, 0.8125, 0.85205078125, 0.8916015625, 0.93115234375, 0.970703125, 1.01025390625, 1.0498046875, 1.08935546875, 1.12890625, 1.16845703125, 1.2080078125, 1.24755859375, 1.287109375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 4.0, 3.0, 2.0, 5.0, 7.0, 4.0, 3.0, 12.0, 8.0, 9.0, 15.0, 22.0, 19.0, 29.0, 36.0, 47.0, 48.0, 67.0, 68.0, 55.0, 72.0, 82.0, 63.0, 54.0, 42.0, 40.0, 38.0, 15.0, 27.0, 11.0, 19.0, 17.0, 9.0, 12.0, 11.0, 3.0, 7.0, 4.0, 5.0, 5.0, 0.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.000690460205078125, -0.0006682649254798889, -0.0006460696458816528, -0.0006238743662834167, -0.0006016790866851807, -0.0005794838070869446, -0.0005572885274887085, -0.0005350932478904724, -0.0005128979682922363, -0.0004907026886940002, -0.00046850740909576416, -0.0004463121294975281, -0.000424116849899292, -0.0004019215703010559, -0.0003797262907028198, -0.00035753101110458374, -0.00033533573150634766, -0.00031314045190811157, -0.0002909451723098755, -0.0002687498927116394, -0.0002465546131134033, -0.00022435933351516724, -0.00020216405391693115, -0.00017996877431869507, -0.00015777349472045898, -0.0001355782151222229, -0.00011338293552398682, -9.118765592575073e-05, -6.899237632751465e-05, -4.6797096729278564e-05, -2.460181713104248e-05, -2.4065375328063965e-06, 1.9788742065429688e-05, 4.198402166366577e-05, 6.417930126190186e-05, 8.637458086013794e-05, 0.00010856986045837402, 0.0001307651400566101, 0.0001529604196548462, 0.00017515569925308228, 0.00019735097885131836, 0.00021954625844955444, 0.00024174153804779053, 0.0002639368176460266, 0.0002861320972442627, 0.0003083273768424988, 0.00033052265644073486, 0.00035271793603897095, 0.00037491321563720703, 0.0003971084952354431, 0.0004193037748336792, 0.0004414990544319153, 0.00046369433403015137, 0.00048588961362838745, 0.0005080848932266235, 0.0005302801728248596, 0.0005524754524230957, 0.0005746707320213318, 0.0005968660116195679, 0.000619061291217804, 0.00064125657081604, 0.0006634518504142761, 0.0006856471300125122, 0.0007078424096107483, 0.0007300376892089844]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 3.0, 3.0, 5.0, 5.0, 4.0, 14.0, 15.0, 13.0, 12.0, 20.0, 16.0, 13.0, 19.0, 35.0, 47.0, 57.0, 126.0, 213.0, 619.0, 10895.0, 1033549.0, 1938.0, 414.0, 180.0, 86.0, 78.0, 42.0, 29.0, 20.0, 16.0, 14.0, 12.0, 2.0, 12.0, 4.0, 1.0, 7.0, 4.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0186309814453125, -0.018054962158203125, -0.01747894287109375, -0.016902923583984375, -0.016326904296875, -0.015750885009765625, -0.01517486572265625, -0.014598846435546875, -0.0140228271484375, -0.013446807861328125, -0.01287078857421875, -0.012294769287109375, -0.01171875, -0.011142730712890625, -0.01056671142578125, -0.009990692138671875, -0.0094146728515625, -0.008838653564453125, -0.00826263427734375, -0.007686614990234375, -0.007110595703125, -0.006534576416015625, -0.00595855712890625, -0.005382537841796875, -0.0048065185546875, -0.004230499267578125, -0.00365447998046875, -0.003078460693359375, -0.00250244140625, -0.001926422119140625, -0.00135040283203125, -0.000774383544921875, -0.0001983642578125, 0.000377655029296875, 0.00095367431640625, 0.001529693603515625, 0.002105712890625, 0.002681732177734375, 0.00325775146484375, 0.003833770751953125, 0.0044097900390625, 0.004985809326171875, 0.00556182861328125, 0.006137847900390625, 0.0067138671875, 0.007289886474609375, 0.00786590576171875, 0.008441925048828125, 0.0090179443359375, 0.009593963623046875, 0.01016998291015625, 0.010746002197265625, 0.011322021484375, 0.011898040771484375, 0.01247406005859375, 0.013050079345703125, 0.0136260986328125, 0.014202117919921875, 0.01477813720703125, 0.015354156494140625, 0.01593017578125, 0.016506195068359375, 0.01708221435546875, 0.017658233642578125, 0.0182342529296875]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 65.0, 223.0, 379.0, 268.0, 61.0, 9.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010800500167533755, -0.0010394385317340493, -0.000998827163130045, -0.0009582156781107187, -0.0009176042512990534, -0.0008769928244873881, -0.0008363813976757228, -0.0007957699708640575, -0.0007551584858447313, -0.000714547059033066, -0.0006739356322214007, -0.0006333241472020745, -0.0005927127203904092, -0.0005521012935787439, -0.0005114898667670786, -0.0004708784108515829, -0.00043026701314374804, -0.00038965558633208275, -0.000349044130416587, -0.0003084327036049217, -0.00026782124768942595, -0.00022720982087776065, -0.00018659839406609535, -0.0001459869381505996, -0.0001053755113389343, -6.476406997535378e-05, -2.4152635887730867e-05, 1.6458798199892044e-05, 5.707023956347257e-05, 9.76816809270531e-05, 0.0001382931077387184, 0.00017890456365421414, 0.00021951599046587944, 0.00026012741727754474, 0.0003007388731930405, 0.0003413503000047058, 0.00038196175592020154, 0.00042257318273186684, 0.00046318460954353213, 0.0005037960363551974, 0.0005444075213745236, 0.0005850189481861889, 0.0006256303749978542, 0.0006662418600171804, 0.0007068532868288457, 0.000747464713640511, 0.0007880761404521763, 0.0008286875672638416, 0.0008692989940755069, 0.0009099104208871722, 0.0009505218476988375, 0.0009911332745105028, 0.001031744759529829, 0.0010723562445491552, 0.0011129676131531596, 0.0011535790981724858, 0.0011941904667764902, 0.0012348019517958164, 0.0012754133203998208, 0.001316024805419147, 0.0013566361740231514, 0.0013972476590424776, 0.0014378591440618038, 0.0014784705126658082, 0.0015190819976851344]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 5.0, 4.0, 2.0, 2.0, 2.0, 6.0, 10.0, 10.0, 7.0, 8.0, 10.0, 9.0, 17.0, 19.0, 23.0, 18.0, 27.0, 30.0, 27.0, 24.0, 42.0, 33.0, 44.0, 36.0, 35.0, 37.0, 36.0, 33.0, 43.0, 56.0, 41.0, 38.0, 39.0, 31.0, 27.0, 25.0, 20.0, 24.0, 21.0, 23.0, 19.0, 6.0, 6.0, 4.0, 8.0, 7.0, 4.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003116130828857422, -0.00030045490711927414, -0.0002892967313528061, -0.00027813855558633804, -0.00026698037981987, -0.00025582220405340195, -0.0002446640282869339, -0.00023350585252046585, -0.0002223476767539978, -0.00021118950098752975, -0.0002000313252210617, -0.00018887314945459366, -0.0001777149736881256, -0.00016655679792165756, -0.00015539862215518951, -0.00014424044638872147, -0.00013308227062225342, -0.00012192409485578537, -0.00011076591908931732, -9.960774332284927e-05, -8.844956755638123e-05, -7.729139178991318e-05, -6.613321602344513e-05, -5.497504025697708e-05, -4.381686449050903e-05, -3.2658688724040985e-05, -2.1500512957572937e-05, -1.0342337191104889e-05, 8.158385753631592e-07, 1.1974014341831207e-05, 2.3132190108299255e-05, 3.4290365874767303e-05, 4.544854164123535e-05, 5.66067174077034e-05, 6.776489317417145e-05, 7.89230689406395e-05, 9.008124470710754e-05, 0.00010123942047357559, 0.00011239759624004364, 0.0001235557720065117, 0.00013471394777297974, 0.00014587212353944778, 0.00015703029930591583, 0.00016818847507238388, 0.00017934665083885193, 0.00019050482660531998, 0.00020166300237178802, 0.00021282117813825607, 0.00022397935390472412, 0.00023513752967119217, 0.0002462957054376602, 0.00025745388120412827, 0.0002686120569705963, 0.00027977023273706436, 0.0002909284085035324, 0.00030208658427000046, 0.0003132447600364685, 0.00032440293580293655, 0.0003355611115694046, 0.00034671928733587265, 0.0003578774631023407, 0.00036903563886880875, 0.0003801938146352768, 0.00039135199040174484, 0.0004025101661682129]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 3.0, 8.0, 8.0, 9.0, 16.0, 20.0, 22.0, 28.0, 36.0, 34.0, 28.0, 43.0, 54.0, 41.0, 39.0, 55.0, 46.0, 62.0, 42.0, 57.0, 52.0, 42.0, 51.0, 35.0, 26.0, 20.0, 20.0, 26.0, 17.0, 13.0, 10.0, 14.0, 7.0, 5.0, 7.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.15234375, -6.89715576171875, -6.6419677734375, -6.38677978515625, -6.131591796875, -5.87640380859375, -5.6212158203125, -5.36602783203125, -5.11083984375, -4.85565185546875, -4.6004638671875, -4.34527587890625, -4.090087890625, -3.83489990234375, -3.5797119140625, -3.32452392578125, -3.0693359375, -2.81414794921875, -2.5589599609375, -2.30377197265625, -2.048583984375, -1.79339599609375, -1.5382080078125, -1.28302001953125, -1.02783203125, -0.77264404296875, -0.5174560546875, -0.26226806640625, -0.007080078125, 0.24810791015625, 0.5032958984375, 0.75848388671875, 1.013671875, 1.26885986328125, 1.5240478515625, 1.77923583984375, 2.034423828125, 2.28961181640625, 2.5447998046875, 2.79998779296875, 3.05517578125, 3.31036376953125, 3.5655517578125, 3.82073974609375, 4.075927734375, 4.33111572265625, 4.5863037109375, 4.84149169921875, 5.0966796875, 5.35186767578125, 5.6070556640625, 5.86224365234375, 6.117431640625, 6.37261962890625, 6.6278076171875, 6.88299560546875, 7.13818359375, 7.39337158203125, 7.6485595703125, 7.90374755859375, 8.158935546875, 8.41412353515625, 8.6693115234375, 8.92449951171875, 9.1796875]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 6.0, 7.0, 24.0, 28.0, 30.0, 56.0, 73.0, 100.0, 118.0, 256.0, 341.0, 558.0, 788.0, 1227.0, 1796.0, 2795.0, 4380.0, 7053.0, 11838.0, 20716.0, 41721.0, 101406.0, 288843.0, 340746.0, 118984.0, 47938.0, 22848.0, 12705.0, 7641.0, 4685.0, 3021.0, 1931.0, 1358.0, 845.0, 585.0, 366.0, 232.0, 166.0, 104.0, 91.0, 44.0, 32.0, 23.0, 21.0, 8.0, 6.0, 6.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.533203125, -3.419525146484375, -3.30584716796875, -3.192169189453125, -3.0784912109375, -2.964813232421875, -2.85113525390625, -2.737457275390625, -2.623779296875, -2.510101318359375, -2.39642333984375, -2.282745361328125, -2.1690673828125, -2.055389404296875, -1.94171142578125, -1.828033447265625, -1.71435546875, -1.600677490234375, -1.48699951171875, -1.373321533203125, -1.2596435546875, -1.145965576171875, -1.03228759765625, -0.918609619140625, -0.804931640625, -0.691253662109375, -0.57757568359375, -0.463897705078125, -0.3502197265625, -0.236541748046875, -0.12286376953125, -0.009185791015625, 0.1044921875, 0.218170166015625, 0.33184814453125, 0.445526123046875, 0.5592041015625, 0.672882080078125, 0.78656005859375, 0.900238037109375, 1.013916015625, 1.127593994140625, 1.24127197265625, 1.354949951171875, 1.4686279296875, 1.582305908203125, 1.69598388671875, 1.809661865234375, 1.92333984375, 2.037017822265625, 2.15069580078125, 2.264373779296875, 2.3780517578125, 2.491729736328125, 2.60540771484375, 2.719085693359375, 2.832763671875, 2.946441650390625, 3.06011962890625, 3.173797607421875, 3.2874755859375, 3.401153564453125, 3.51483154296875, 3.628509521484375, 3.7421875]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 4.0, 12.0, 13.0, 7.0, 14.0, 20.0, 20.0, 28.0, 29.0, 33.0, 27.0, 44.0, 41.0, 46.0, 73.0, 84.0, 162.0, 1705.0, 168.0, 75.0, 67.0, 43.0, 47.0, 34.0, 31.0, 31.0, 27.0, 21.0, 21.0, 27.0, 16.0, 13.0, 7.0, 8.0, 13.0, 6.0, 5.0, 8.0, 3.0, 2.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-26.875, -26.095947265625, -25.31689453125, -24.537841796875, -23.7587890625, -22.979736328125, -22.20068359375, -21.421630859375, -20.642578125, -19.863525390625, -19.08447265625, -18.305419921875, -17.5263671875, -16.747314453125, -15.96826171875, -15.189208984375, -14.41015625, -13.631103515625, -12.85205078125, -12.072998046875, -11.2939453125, -10.514892578125, -9.73583984375, -8.956787109375, -8.177734375, -7.398681640625, -6.61962890625, -5.840576171875, -5.0615234375, -4.282470703125, -3.50341796875, -2.724365234375, -1.9453125, -1.166259765625, -0.38720703125, 0.391845703125, 1.1708984375, 1.949951171875, 2.72900390625, 3.508056640625, 4.287109375, 5.066162109375, 5.84521484375, 6.624267578125, 7.4033203125, 8.182373046875, 8.96142578125, 9.740478515625, 10.51953125, 11.298583984375, 12.07763671875, 12.856689453125, 13.6357421875, 14.414794921875, 15.19384765625, 15.972900390625, 16.751953125, 17.531005859375, 18.31005859375, 19.089111328125, 19.8681640625, 20.647216796875, 21.42626953125, 22.205322265625, 22.984375]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 3.0, 3.0, 11.0, 7.0, 18.0, 16.0, 21.0, 23.0, 40.0, 50.0, 57.0, 97.0, 130.0, 209.0, 301.0, 678.0, 4393.0, 3021965.0, 114654.0, 1772.0, 460.0, 246.0, 166.0, 115.0, 63.0, 65.0, 38.0, 22.0, 31.0, 10.0, 12.0, 9.0, 10.0, 2.0, 5.0, 2.0, 6.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-65.6875, -63.5556640625, -61.423828125, -59.2919921875, -57.16015625, -55.0283203125, -52.896484375, -50.7646484375, -48.6328125, -46.5009765625, -44.369140625, -42.2373046875, -40.10546875, -37.9736328125, -35.841796875, -33.7099609375, -31.578125, -29.4462890625, -27.314453125, -25.1826171875, -23.05078125, -20.9189453125, -18.787109375, -16.6552734375, -14.5234375, -12.3916015625, -10.259765625, -8.1279296875, -5.99609375, -3.8642578125, -1.732421875, 0.3994140625, 2.53125, 4.6630859375, 6.794921875, 8.9267578125, 11.05859375, 13.1904296875, 15.322265625, 17.4541015625, 19.5859375, 21.7177734375, 23.849609375, 25.9814453125, 28.11328125, 30.2451171875, 32.376953125, 34.5087890625, 36.640625, 38.7724609375, 40.904296875, 43.0361328125, 45.16796875, 47.2998046875, 49.431640625, 51.5634765625, 53.6953125, 55.8271484375, 57.958984375, 60.0908203125, 62.22265625, 64.3544921875, 66.486328125, 68.6181640625, 70.75]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 16.0, 84.0, 403.0, 403.0, 95.0, 10.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.12750244140625, -48.66709899902344, -45.206695556640625, -41.74629211425781, -38.285888671875, -34.82548522949219, -31.365083694458008, -27.904680252075195, -24.444276809692383, -20.98387336730957, -17.523469924926758, -14.063067436218262, -10.60266399383545, -7.142261505126953, -3.6818580627441406, -0.22145462036132812, 3.2389488220214844, 6.699352264404297, 10.15975570678711, 13.620158195495605, 17.080562591552734, 20.540964126586914, 24.001367568969727, 27.46177101135254, 30.92217445373535, 34.38257598876953, 37.842979431152344, 41.303382873535156, 44.76378631591797, 48.22418975830078, 51.684593200683594, 55.144996643066406, 58.60540008544922, 62.06580352783203, 65.52620697021484, 68.98661041259766, 72.44701385498047, 75.90741729736328, 79.3678207397461, 82.8282241821289, 86.28862762451172, 89.74903106689453, 93.20943450927734, 96.66983795166016, 100.13024139404297, 103.59064483642578, 107.0510482788086, 110.5114517211914, 113.97184753417969, 117.4322509765625, 120.89265441894531, 124.35305786132812, 127.81346130371094, 131.27386474609375, 134.73426818847656, 138.19467163085938, 141.6550750732422, 145.115478515625, 148.5758819580078, 152.03628540039062, 155.49668884277344, 158.95709228515625, 162.41749572753906, 165.87789916992188, 169.3383026123047]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 6.0, 7.0, 7.0, 6.0, 11.0, 13.0, 12.0, 15.0, 18.0, 18.0, 28.0, 23.0, 23.0, 24.0, 34.0, 36.0, 41.0, 38.0, 29.0, 31.0, 30.0, 39.0, 38.0, 31.0, 33.0, 36.0, 32.0, 43.0, 32.0, 19.0, 24.0, 23.0, 28.0, 16.0, 20.0, 16.0, 16.0, 14.0, 16.0, 9.0, 11.0, 10.0, 9.0, 11.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0], "bins": [-61.33226013183594, -59.449153900146484, -57.5660514831543, -55.682945251464844, -53.799842834472656, -51.9167366027832, -50.03363037109375, -48.15052795410156, -46.26742172241211, -44.384315490722656, -42.50121307373047, -40.618106842041016, -38.73500061035156, -36.851898193359375, -34.96879196166992, -33.08568572998047, -31.20258331298828, -29.31947898864746, -27.43637466430664, -25.553268432617188, -23.670164108276367, -21.787059783935547, -19.903953552246094, -18.020849227905273, -16.137744903564453, -14.254640579223633, -12.371535301208496, -10.48843002319336, -8.605325698852539, -6.722221374511719, -4.839116096496582, -2.9560108184814453, -1.072906494140625, 0.8101983070373535, 2.693303108215332, 4.5764079093933105, 6.459512710571289, 8.34261703491211, 10.225722312927246, 12.108827590942383, 13.991931915283203, 15.875036239624023, 17.758140563964844, 19.641246795654297, 21.524351119995117, 23.407455444335938, 25.29056167602539, 27.17366600036621, 29.05677032470703, 30.93987464904785, 32.82297897338867, 34.706085205078125, 36.58918762207031, 38.472293853759766, 40.35540008544922, 42.238502502441406, 44.12160873413086, 46.00471496582031, 47.8878173828125, 49.77092361450195, 51.654029846191406, 53.537132263183594, 55.42023849487305, 57.3033447265625, 59.18644714355469]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 7.0, 1.0, 2.0, 5.0, 12.0, 10.0, 14.0, 22.0, 18.0, 21.0, 45.0, 30.0, 32.0, 41.0, 40.0, 45.0, 58.0, 49.0, 53.0, 56.0, 57.0, 51.0, 58.0, 45.0, 40.0, 26.0, 30.0, 25.0, 23.0, 20.0, 14.0, 20.0, 13.0, 6.0, 13.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.015625, -7.739501953125, -7.46337890625, -7.187255859375, -6.9111328125, -6.635009765625, -6.35888671875, -6.082763671875, -5.806640625, -5.530517578125, -5.25439453125, -4.978271484375, -4.7021484375, -4.426025390625, -4.14990234375, -3.873779296875, -3.59765625, -3.321533203125, -3.04541015625, -2.769287109375, -2.4931640625, -2.217041015625, -1.94091796875, -1.664794921875, -1.388671875, -1.112548828125, -0.83642578125, -0.560302734375, -0.2841796875, -0.008056640625, 0.26806640625, 0.544189453125, 0.8203125, 1.096435546875, 1.37255859375, 1.648681640625, 1.9248046875, 2.200927734375, 2.47705078125, 2.753173828125, 3.029296875, 3.305419921875, 3.58154296875, 3.857666015625, 4.1337890625, 4.409912109375, 4.68603515625, 4.962158203125, 5.23828125, 5.514404296875, 5.79052734375, 6.066650390625, 6.3427734375, 6.618896484375, 6.89501953125, 7.171142578125, 7.447265625, 7.723388671875, 7.99951171875, 8.275634765625, 8.5517578125, 8.827880859375, 9.10400390625, 9.380126953125, 9.65625]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 0.0, 5.0, 3.0, 11.0, 9.0, 7.0, 19.0, 23.0, 29.0, 51.0, 65.0, 98.0, 118.0, 215.0, 354.0, 680.0, 1444.0, 3485.0, 10964.0, 42324.0, 236767.0, 1110893.0, 1874812.0, 742713.0, 130967.0, 25695.0, 7314.0, 2620.0, 1104.0, 553.0, 313.0, 191.0, 130.0, 97.0, 54.0, 33.0, 40.0, 31.0, 15.0, 7.0, 14.0, 11.0, 8.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.6484375, -10.33837890625, -10.0283203125, -9.71826171875, -9.408203125, -9.09814453125, -8.7880859375, -8.47802734375, -8.16796875, -7.85791015625, -7.5478515625, -7.23779296875, -6.927734375, -6.61767578125, -6.3076171875, -5.99755859375, -5.6875, -5.37744140625, -5.0673828125, -4.75732421875, -4.447265625, -4.13720703125, -3.8271484375, -3.51708984375, -3.20703125, -2.89697265625, -2.5869140625, -2.27685546875, -1.966796875, -1.65673828125, -1.3466796875, -1.03662109375, -0.7265625, -0.41650390625, -0.1064453125, 0.20361328125, 0.513671875, 0.82373046875, 1.1337890625, 1.44384765625, 1.75390625, 2.06396484375, 2.3740234375, 2.68408203125, 2.994140625, 3.30419921875, 3.6142578125, 3.92431640625, 4.234375, 4.54443359375, 4.8544921875, 5.16455078125, 5.474609375, 5.78466796875, 6.0947265625, 6.40478515625, 6.71484375, 7.02490234375, 7.3349609375, 7.64501953125, 7.955078125, 8.26513671875, 8.5751953125, 8.88525390625, 9.1953125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 5.0, 2.0, 5.0, 5.0, 7.0, 5.0, 11.0, 25.0, 13.0, 24.0, 42.0, 35.0, 38.0, 70.0, 82.0, 105.0, 129.0, 180.0, 238.0, 285.0, 324.0, 375.0, 343.0, 337.0, 287.0, 254.0, 172.0, 170.0, 107.0, 83.0, 69.0, 57.0, 30.0, 38.0, 18.0, 25.0, 22.0, 17.0, 15.0, 6.0, 9.0, 6.0, 6.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.109375, -9.7222900390625, -9.335205078125, -8.9481201171875, -8.56103515625, -8.1739501953125, -7.786865234375, -7.3997802734375, -7.0126953125, -6.6256103515625, -6.238525390625, -5.8514404296875, -5.46435546875, -5.0772705078125, -4.690185546875, -4.3031005859375, -3.916015625, -3.5289306640625, -3.141845703125, -2.7547607421875, -2.36767578125, -1.9805908203125, -1.593505859375, -1.2064208984375, -0.8193359375, -0.4322509765625, -0.045166015625, 0.3419189453125, 0.72900390625, 1.1160888671875, 1.503173828125, 1.8902587890625, 2.27734375, 2.6644287109375, 3.051513671875, 3.4385986328125, 3.82568359375, 4.2127685546875, 4.599853515625, 4.9869384765625, 5.3740234375, 5.7611083984375, 6.148193359375, 6.5352783203125, 6.92236328125, 7.3094482421875, 7.696533203125, 8.0836181640625, 8.470703125, 8.8577880859375, 9.244873046875, 9.6319580078125, 10.01904296875, 10.4061279296875, 10.793212890625, 11.1802978515625, 11.5673828125, 11.9544677734375, 12.341552734375, 12.7286376953125, 13.11572265625, 13.5028076171875, 13.889892578125, 14.2769775390625, 14.6640625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 3.0, 3.0, 5.0, 7.0, 11.0, 9.0, 11.0, 17.0, 25.0, 25.0, 32.0, 51.0, 69.0, 83.0, 101.0, 138.0, 217.0, 314.0, 720.0, 4040.0, 1057310.0, 3121501.0, 7568.0, 851.0, 364.0, 197.0, 168.0, 100.0, 71.0, 63.0, 48.0, 32.0, 33.0, 19.0, 15.0, 15.0, 12.0, 4.0, 7.0, 3.0, 2.0, 4.0, 7.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-69.8125, -67.82275390625, -65.8330078125, -63.84326171875, -61.853515625, -59.86376953125, -57.8740234375, -55.88427734375, -53.89453125, -51.90478515625, -49.9150390625, -47.92529296875, -45.935546875, -43.94580078125, -41.9560546875, -39.96630859375, -37.9765625, -35.98681640625, -33.9970703125, -32.00732421875, -30.017578125, -28.02783203125, -26.0380859375, -24.04833984375, -22.05859375, -20.06884765625, -18.0791015625, -16.08935546875, -14.099609375, -12.10986328125, -10.1201171875, -8.13037109375, -6.140625, -4.15087890625, -2.1611328125, -0.17138671875, 1.818359375, 3.80810546875, 5.7978515625, 7.78759765625, 9.77734375, 11.76708984375, 13.7568359375, 15.74658203125, 17.736328125, 19.72607421875, 21.7158203125, 23.70556640625, 25.6953125, 27.68505859375, 29.6748046875, 31.66455078125, 33.654296875, 35.64404296875, 37.6337890625, 39.62353515625, 41.61328125, 43.60302734375, 45.5927734375, 47.58251953125, 49.572265625, 51.56201171875, 53.5517578125, 55.54150390625, 57.53125]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 16.0, 36.0, 90.0, 137.0, 162.0, 211.0, 180.0, 99.0, 46.0, 15.0, 8.0, 5.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.4683837890625, -89.17403411865234, -85.87968444824219, -82.58533477783203, -79.29098510742188, -75.99663543701172, -72.70228576660156, -69.40792846679688, -66.11358642578125, -62.819236755371094, -59.52488708496094, -56.23053741455078, -52.936187744140625, -49.64183807373047, -46.34748458862305, -43.05313491821289, -39.75878143310547, -36.46443176269531, -33.170082092285156, -29.875730514526367, -26.58138084411621, -23.287031173706055, -19.992679595947266, -16.69832992553711, -13.403980255126953, -10.109630584716797, -6.815279960632324, -3.5209293365478516, -0.2265796661376953, 3.067770004272461, 6.36212158203125, 9.656471252441406, 12.950820922851562, 16.24517059326172, 19.539520263671875, 22.833871841430664, 26.12822151184082, 29.422571182250977, 32.716922760009766, 36.01127243041992, 39.30562210083008, 42.599971771240234, 45.89432144165039, 49.18867492675781, 52.48302459716797, 55.777374267578125, 59.07172393798828, 62.36607360839844, 65.6604232788086, 68.95477294921875, 72.2491226196289, 75.54347229003906, 78.83782196044922, 82.13217163085938, 85.42652893066406, 88.72087097167969, 92.01522827148438, 95.30957794189453, 98.60392761230469, 101.89827728271484, 105.192626953125, 108.48697662353516, 111.78132629394531, 115.07568359375, 118.37002563476562]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 4.0, 5.0, 8.0, 8.0, 6.0, 15.0, 14.0, 16.0, 28.0, 28.0, 31.0, 36.0, 43.0, 37.0, 41.0, 57.0, 55.0, 45.0, 40.0, 44.0, 57.0, 54.0, 37.0, 40.0, 54.0, 42.0, 26.0, 23.0, 26.0, 18.0, 14.0, 14.0, 7.0, 14.0, 7.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-67.71780395507812, -65.8613052368164, -64.00480651855469, -62.148311614990234, -60.29181671142578, -58.43531799316406, -56.578819274902344, -54.72232437133789, -52.86582946777344, -51.00933074951172, -49.152835845947266, -47.29633712768555, -45.439842224121094, -43.583343505859375, -41.726844787597656, -39.8703498840332, -38.013851165771484, -36.157352447509766, -34.30085754394531, -32.444358825683594, -30.58786392211914, -28.731365203857422, -26.874868392944336, -25.01837158203125, -23.161874771118164, -21.305377960205078, -19.448881149291992, -17.592384338378906, -15.735886573791504, -13.879389762878418, -12.022891998291016, -10.16639518737793, -8.309898376464844, -6.453401565551758, -4.596904277801514, -2.7404069900512695, -0.8839101791381836, 0.9725866317749023, 2.8290843963623047, 4.685581207275391, 6.542078018188477, 8.398574829101562, 10.255071640014648, 12.11156940460205, 13.968066215515137, 15.824563026428223, 17.681060791015625, 19.53755760192871, 21.394054412841797, 23.250551223754883, 25.10704803466797, 26.963546752929688, 28.82004165649414, 30.67654037475586, 32.53303527832031, 34.38953399658203, 36.24603271484375, 38.10253143310547, 39.95902633666992, 41.81552505493164, 43.672019958496094, 45.52851867675781, 47.38501739501953, 49.241512298583984, 51.09800720214844]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 8.0, 9.0, 18.0, 19.0, 30.0, 18.0, 28.0, 23.0, 27.0, 42.0, 40.0, 54.0, 48.0, 54.0, 40.0, 55.0, 54.0, 55.0, 48.0, 54.0, 38.0, 39.0, 24.0, 29.0, 36.0, 17.0, 23.0, 17.0, 13.0, 10.0, 5.0, 9.0, 9.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2265625, -7.95849609375, -7.6904296875, -7.42236328125, -7.154296875, -6.88623046875, -6.6181640625, -6.35009765625, -6.08203125, -5.81396484375, -5.5458984375, -5.27783203125, -5.009765625, -4.74169921875, -4.4736328125, -4.20556640625, -3.9375, -3.66943359375, -3.4013671875, -3.13330078125, -2.865234375, -2.59716796875, -2.3291015625, -2.06103515625, -1.79296875, -1.52490234375, -1.2568359375, -0.98876953125, -0.720703125, -0.45263671875, -0.1845703125, 0.08349609375, 0.3515625, 0.61962890625, 0.8876953125, 1.15576171875, 1.423828125, 1.69189453125, 1.9599609375, 2.22802734375, 2.49609375, 2.76416015625, 3.0322265625, 3.30029296875, 3.568359375, 3.83642578125, 4.1044921875, 4.37255859375, 4.640625, 4.90869140625, 5.1767578125, 5.44482421875, 5.712890625, 5.98095703125, 6.2490234375, 6.51708984375, 6.78515625, 7.05322265625, 7.3212890625, 7.58935546875, 7.857421875, 8.12548828125, 8.3935546875, 8.66162109375, 8.9296875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 4.0, 1.0, 4.0, 5.0, 10.0, 10.0, 15.0, 24.0, 23.0, 48.0, 69.0, 95.0, 136.0, 226.0, 299.0, 515.0, 745.0, 1171.0, 1834.0, 2852.0, 4398.0, 6998.0, 10899.0, 16785.0, 26249.0, 43241.0, 74792.0, 146494.0, 321706.0, 174045.0, 85781.0, 48240.0, 29127.0, 18463.0, 11886.0, 7610.0, 4908.0, 3191.0, 1995.0, 1299.0, 807.0, 541.0, 333.0, 222.0, 137.0, 103.0, 74.0, 42.0, 32.0, 26.0, 14.0, 13.0, 10.0, 6.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.41015625, -1.36553955078125, -1.3209228515625, -1.27630615234375, -1.231689453125, -1.18707275390625, -1.1424560546875, -1.09783935546875, -1.05322265625, -1.00860595703125, -0.9639892578125, -0.91937255859375, -0.874755859375, -0.83013916015625, -0.7855224609375, -0.74090576171875, -0.6962890625, -0.65167236328125, -0.6070556640625, -0.56243896484375, -0.517822265625, -0.47320556640625, -0.4285888671875, -0.38397216796875, -0.33935546875, -0.29473876953125, -0.2501220703125, -0.20550537109375, -0.160888671875, -0.11627197265625, -0.0716552734375, -0.02703857421875, 0.017578125, 0.06219482421875, 0.1068115234375, 0.15142822265625, 0.196044921875, 0.24066162109375, 0.2852783203125, 0.32989501953125, 0.37451171875, 0.41912841796875, 0.4637451171875, 0.50836181640625, 0.552978515625, 0.59759521484375, 0.6422119140625, 0.68682861328125, 0.7314453125, 0.77606201171875, 0.8206787109375, 0.86529541015625, 0.909912109375, 0.95452880859375, 0.9991455078125, 1.04376220703125, 1.08837890625, 1.13299560546875, 1.1776123046875, 1.22222900390625, 1.266845703125, 1.31146240234375, 1.3560791015625, 1.40069580078125, 1.4453125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 3.0, 5.0, 7.0, 4.0, 7.0, 12.0, 7.0, 16.0, 14.0, 18.0, 22.0, 22.0, 27.0, 30.0, 27.0, 45.0, 33.0, 25.0, 30.0, 55.0, 41.0, 35.0, 1059.0, 40.0, 27.0, 46.0, 33.0, 35.0, 31.0, 23.0, 38.0, 26.0, 28.0, 27.0, 14.0, 22.0, 16.0, 13.0, 11.0, 10.0, 9.0, 5.0, 6.0, 3.0, 5.0, 2.0, 4.0, 2.0, 0.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-4.0234375, -3.895263671875, -3.76708984375, -3.638916015625, -3.5107421875, -3.382568359375, -3.25439453125, -3.126220703125, -2.998046875, -2.869873046875, -2.74169921875, -2.613525390625, -2.4853515625, -2.357177734375, -2.22900390625, -2.100830078125, -1.97265625, -1.844482421875, -1.71630859375, -1.588134765625, -1.4599609375, -1.331787109375, -1.20361328125, -1.075439453125, -0.947265625, -0.819091796875, -0.69091796875, -0.562744140625, -0.4345703125, -0.306396484375, -0.17822265625, -0.050048828125, 0.078125, 0.206298828125, 0.33447265625, 0.462646484375, 0.5908203125, 0.718994140625, 0.84716796875, 0.975341796875, 1.103515625, 1.231689453125, 1.35986328125, 1.488037109375, 1.6162109375, 1.744384765625, 1.87255859375, 2.000732421875, 2.12890625, 2.257080078125, 2.38525390625, 2.513427734375, 2.6416015625, 2.769775390625, 2.89794921875, 3.026123046875, 3.154296875, 3.282470703125, 3.41064453125, 3.538818359375, 3.6669921875, 3.795166015625, 3.92333984375, 4.051513671875, 4.1796875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [6.0, 4.0, 7.0, 6.0, 13.0, 15.0, 26.0, 30.0, 43.0, 56.0, 87.0, 116.0, 149.0, 214.0, 310.0, 413.0, 600.0, 808.0, 1131.0, 1581.0, 2277.0, 3211.0, 4556.0, 6777.0, 10211.0, 14957.0, 22937.0, 35581.0, 56691.0, 93275.0, 183185.0, 1323527.0, 128034.0, 73323.0, 45645.0, 28892.0, 18872.0, 12302.0, 8398.0, 5571.0, 3855.0, 2766.0, 1886.0, 1327.0, 985.0, 697.0, 510.0, 362.0, 243.0, 202.0, 120.0, 98.0, 79.0, 54.0, 35.0, 26.0, 17.0, 17.0, 10.0, 8.0, 6.0, 6.0, 0.0, 6.0], "bins": [-1.1240234375, -1.08807373046875, -1.0521240234375, -1.01617431640625, -0.980224609375, -0.94427490234375, -0.9083251953125, -0.87237548828125, -0.83642578125, -0.80047607421875, -0.7645263671875, -0.72857666015625, -0.692626953125, -0.65667724609375, -0.6207275390625, -0.58477783203125, -0.548828125, -0.51287841796875, -0.4769287109375, -0.44097900390625, -0.405029296875, -0.36907958984375, -0.3331298828125, -0.29718017578125, -0.26123046875, -0.22528076171875, -0.1893310546875, -0.15338134765625, -0.117431640625, -0.08148193359375, -0.0455322265625, -0.00958251953125, 0.0263671875, 0.06231689453125, 0.0982666015625, 0.13421630859375, 0.170166015625, 0.20611572265625, 0.2420654296875, 0.27801513671875, 0.31396484375, 0.34991455078125, 0.3858642578125, 0.42181396484375, 0.457763671875, 0.49371337890625, 0.5296630859375, 0.56561279296875, 0.6015625, 0.63751220703125, 0.6734619140625, 0.70941162109375, 0.745361328125, 0.78131103515625, 0.8172607421875, 0.85321044921875, 0.88916015625, 0.92510986328125, 0.9610595703125, 0.99700927734375, 1.032958984375, 1.06890869140625, 1.1048583984375, 1.14080810546875, 1.1767578125]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 4.0, 0.0, 4.0, 13.0, 5.0, 7.0, 9.0, 19.0, 16.0, 17.0, 35.0, 49.0, 57.0, 73.0, 98.0, 97.0, 80.0, 78.0, 65.0, 59.0, 39.0, 35.0, 21.0, 17.0, 15.0, 13.0, 14.0, 10.0, 5.0, 9.0, 6.0, 5.0, 1.0, 5.0, 6.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0008206367492675781, -0.0007950067520141602, -0.0007693767547607422, -0.0007437467575073242, -0.0007181167602539062, -0.0006924867630004883, -0.0006668567657470703, -0.0006412267684936523, -0.0006155967712402344, -0.0005899667739868164, -0.0005643367767333984, -0.0005387067794799805, -0.0005130767822265625, -0.00048744678497314453, -0.00046181678771972656, -0.0004361867904663086, -0.0004105567932128906, -0.00038492679595947266, -0.0003592967987060547, -0.0003336668014526367, -0.00030803680419921875, -0.0002824068069458008, -0.0002567768096923828, -0.00023114681243896484, -0.00020551681518554688, -0.0001798868179321289, -0.00015425682067871094, -0.00012862682342529297, -0.000102996826171875, -7.736682891845703e-05, -5.173683166503906e-05, -2.6106834411621094e-05, -4.76837158203125e-07, 2.5153160095214844e-05, 5.078315734863281e-05, 7.641315460205078e-05, 0.00010204315185546875, 0.00012767314910888672, 0.0001533031463623047, 0.00017893314361572266, 0.00020456314086914062, 0.0002301931381225586, 0.00025582313537597656, 0.00028145313262939453, 0.0003070831298828125, 0.00033271312713623047, 0.00035834312438964844, 0.0003839731216430664, 0.0004096031188964844, 0.00043523311614990234, 0.0004608631134033203, 0.0004864931106567383, 0.0005121231079101562, 0.0005377531051635742, 0.0005633831024169922, 0.0005890130996704102, 0.0006146430969238281, 0.0006402730941772461, 0.0006659030914306641, 0.000691533088684082, 0.0007171630859375, 0.000742793083190918, 0.0007684230804443359, 0.0007940530776977539, 0.0008196830749511719]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 2.0, 3.0, 6.0, 9.0, 2.0, 9.0, 9.0, 10.0, 18.0, 21.0, 21.0, 27.0, 38.0, 43.0, 66.0, 118.0, 211.0, 451.0, 2256.0, 1003416.0, 40178.0, 862.0, 281.0, 155.0, 116.0, 53.0, 43.0, 31.0, 23.0, 15.0, 14.0, 10.0, 9.0, 5.0, 2.0, 7.0, 4.0, 4.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.018768310546875, -0.018195390701293945, -0.01762247085571289, -0.017049551010131836, -0.01647663116455078, -0.015903711318969727, -0.015330791473388672, -0.014757871627807617, -0.014184951782226562, -0.013612031936645508, -0.013039112091064453, -0.012466192245483398, -0.011893272399902344, -0.011320352554321289, -0.010747432708740234, -0.01017451286315918, -0.009601593017578125, -0.00902867317199707, -0.008455753326416016, -0.007882833480834961, -0.007309913635253906, -0.0067369937896728516, -0.006164073944091797, -0.005591154098510742, -0.0050182342529296875, -0.004445314407348633, -0.003872394561767578, -0.0032994747161865234, -0.0027265548706054688, -0.002153635025024414, -0.0015807151794433594, -0.0010077953338623047, -0.00043487548828125, 0.0001380443572998047, 0.0007109642028808594, 0.001283884048461914, 0.0018568038940429688, 0.0024297237396240234, 0.003002643585205078, 0.003575563430786133, 0.0041484832763671875, 0.004721403121948242, 0.005294322967529297, 0.0058672428131103516, 0.006440162658691406, 0.007013082504272461, 0.007586002349853516, 0.00815892219543457, 0.008731842041015625, 0.00930476188659668, 0.009877681732177734, 0.010450601577758789, 0.011023521423339844, 0.011596441268920898, 0.012169361114501953, 0.012742280960083008, 0.013315200805664062, 0.013888120651245117, 0.014461040496826172, 0.015033960342407227, 0.015606880187988281, 0.016179800033569336, 0.01675271987915039, 0.017325639724731445, 0.0178985595703125]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 7.0, 23.0, 55.0, 110.0, 177.0, 220.0, 203.0, 127.0, 47.0, 26.0, 8.0, 4.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004970945883542299, -0.0004716735566034913, -0.0004462525248527527, -0.0004208315222058445, -0.0003954104904551059, -0.0003699894587043673, -0.0003445684560574591, -0.0003191474243067205, -0.0002937263925559819, -0.00026830536080524325, -0.00024288434360641986, -0.00021746332640759647, -0.00019204229465685785, -0.00016662126290611923, -0.00014120024570729584, -0.00011577922850847244, -9.035819675773382e-05, -6.493717228295282e-05, -3.951614780817181e-05, -1.4095123333390802e-05, 1.1325901141390204e-05, 3.6746932892128825e-05, 6.216795009095222e-05, 8.758896728977561e-05, 0.00011300999904051423, 0.00013843103079125285, 0.00016385204799007624, 0.00018927306518889964, 0.00021469409693963826, 0.00024011512869037688, 0.00026553613133728504, 0.00029095716308802366, 0.0003163781948387623, 0.0003417992265895009, 0.0003672202583402395, 0.0003926412609871477, 0.0004180622927378863, 0.00044348332448862493, 0.0004689043271355331, 0.0004943253588862717, 0.0005197463906370103, 0.000545167422387749, 0.0005705884541384876, 0.0005960094858892262, 0.0006214304594323039, 0.0006468514911830425, 0.0006722725229337811, 0.0006976935546845198, 0.0007231145864352584, 0.000748535618185997, 0.0007739566499367356, 0.0007993776816874743, 0.0008247987134382129, 0.0008502197451889515, 0.0008756407187320292, 0.0009010617504827678, 0.0009264827822335064, 0.0009519038139842451, 0.0009773247875273228, 0.0010027458192780614, 0.0010281668510288, 0.0010535878827795386, 0.0010790089145302773, 0.0011044299462810159, 0.0011298509780317545]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 4.0, 4.0, 2.0, 7.0, 11.0, 12.0, 10.0, 13.0, 16.0, 25.0, 16.0, 37.0, 24.0, 35.0, 30.0, 39.0, 38.0, 38.0, 53.0, 38.0, 51.0, 43.0, 49.0, 47.0, 42.0, 30.0, 31.0, 41.0, 25.0, 29.0, 34.0, 32.0, 28.0, 11.0, 11.0, 11.0, 8.0, 7.0, 7.0, 3.0, 6.0, 3.0, 1.0, 1.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00039893388748168945, -0.000386715866625309, -0.00037449784576892853, -0.00036227982491254807, -0.0003500618040561676, -0.00033784378319978714, -0.0003256257623434067, -0.0003134077414870262, -0.00030118972063064575, -0.0002889716997742653, -0.0002767536789178848, -0.00026453565806150436, -0.0002523176372051239, -0.00024009961634874344, -0.00022788159549236298, -0.0002156635746359825, -0.00020344555377960205, -0.0001912275329232216, -0.00017900951206684113, -0.00016679149121046066, -0.0001545734703540802, -0.00014235544949769974, -0.00013013742864131927, -0.00011791940778493881, -0.00010570138692855835, -9.348336607217789e-05, -8.126534521579742e-05, -6.904732435941696e-05, -5.68293035030365e-05, -4.4611282646656036e-05, -3.2393261790275574e-05, -2.017524093389511e-05, -7.957220077514648e-06, 4.260800778865814e-06, 1.6478821635246277e-05, 2.869684249162674e-05, 4.09148633480072e-05, 5.3132884204387665e-05, 6.535090506076813e-05, 7.756892591714859e-05, 8.978694677352905e-05, 0.00010200496762990952, 0.00011422298848628998, 0.00012644100934267044, 0.0001386590301990509, 0.00015087705105543137, 0.00016309507191181183, 0.0001753130927681923, 0.00018753111362457275, 0.00019974913448095322, 0.00021196715533733368, 0.00022418517619371414, 0.0002364031970500946, 0.00024862121790647507, 0.00026083923876285553, 0.000273057259619236, 0.00028527528047561646, 0.0002974933013319969, 0.0003097113221883774, 0.00032192934304475784, 0.0003341473639011383, 0.00034636538475751877, 0.00035858340561389923, 0.0003708014264702797, 0.00038301944732666016]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 8.0, 9.0, 18.0, 19.0, 30.0, 18.0, 28.0, 23.0, 27.0, 42.0, 40.0, 54.0, 48.0, 54.0, 40.0, 55.0, 54.0, 55.0, 48.0, 54.0, 38.0, 39.0, 24.0, 29.0, 36.0, 17.0, 23.0, 17.0, 13.0, 10.0, 5.0, 9.0, 9.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2265625, -7.95849609375, -7.6904296875, -7.42236328125, -7.154296875, -6.88623046875, -6.6181640625, -6.35009765625, -6.08203125, -5.81396484375, -5.5458984375, -5.27783203125, -5.009765625, -4.74169921875, -4.4736328125, -4.20556640625, -3.9375, -3.66943359375, -3.4013671875, -3.13330078125, -2.865234375, -2.59716796875, -2.3291015625, -2.06103515625, -1.79296875, -1.52490234375, -1.2568359375, -0.98876953125, -0.720703125, -0.45263671875, -0.1845703125, 0.08349609375, 0.3515625, 0.61962890625, 0.8876953125, 1.15576171875, 1.423828125, 1.69189453125, 1.9599609375, 2.22802734375, 2.49609375, 2.76416015625, 3.0322265625, 3.30029296875, 3.568359375, 3.83642578125, 4.1044921875, 4.37255859375, 4.640625, 4.90869140625, 5.1767578125, 5.44482421875, 5.712890625, 5.98095703125, 6.2490234375, 6.51708984375, 6.78515625, 7.05322265625, 7.3212890625, 7.58935546875, 7.857421875, 8.12548828125, 8.3935546875, 8.66162109375, 8.9296875]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 5.0, 9.0, 12.0, 18.0, 27.0, 31.0, 48.0, 82.0, 132.0, 181.0, 258.0, 430.0, 915.0, 1844.0, 4274.0, 10721.0, 29225.0, 87118.0, 278627.0, 416722.0, 143035.0, 46684.0, 16402.0, 6330.0, 2628.0, 1177.0, 637.0, 319.0, 233.0, 142.0, 89.0, 55.0, 48.0, 32.0, 30.0, 7.0, 11.0, 8.0, 5.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.59375, -5.42535400390625, -5.2569580078125, -5.08856201171875, -4.920166015625, -4.75177001953125, -4.5833740234375, -4.41497802734375, -4.24658203125, -4.07818603515625, -3.9097900390625, -3.74139404296875, -3.572998046875, -3.40460205078125, -3.2362060546875, -3.06781005859375, -2.8994140625, -2.73101806640625, -2.5626220703125, -2.39422607421875, -2.225830078125, -2.05743408203125, -1.8890380859375, -1.72064208984375, -1.55224609375, -1.38385009765625, -1.2154541015625, -1.04705810546875, -0.878662109375, -0.71026611328125, -0.5418701171875, -0.37347412109375, -0.205078125, -0.03668212890625, 0.1317138671875, 0.30010986328125, 0.468505859375, 0.63690185546875, 0.8052978515625, 0.97369384765625, 1.14208984375, 1.31048583984375, 1.4788818359375, 1.64727783203125, 1.815673828125, 1.98406982421875, 2.1524658203125, 2.32086181640625, 2.4892578125, 2.65765380859375, 2.8260498046875, 2.99444580078125, 3.162841796875, 3.33123779296875, 3.4996337890625, 3.66802978515625, 3.83642578125, 4.00482177734375, 4.1732177734375, 4.34161376953125, 4.510009765625, 4.67840576171875, 4.8468017578125, 5.01519775390625, 5.18359375]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 3.0, 4.0, 2.0, 1.0, 6.0, 10.0, 10.0, 14.0, 18.0, 18.0, 20.0, 27.0, 24.0, 33.0, 48.0, 45.0, 40.0, 56.0, 80.0, 295.0, 1711.0, 139.0, 66.0, 61.0, 48.0, 43.0, 43.0, 30.0, 30.0, 13.0, 19.0, 25.0, 13.0, 13.0, 10.0, 5.0, 9.0, 3.0, 6.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-29.1875, -28.28369140625, -27.3798828125, -26.47607421875, -25.572265625, -24.66845703125, -23.7646484375, -22.86083984375, -21.95703125, -21.05322265625, -20.1494140625, -19.24560546875, -18.341796875, -17.43798828125, -16.5341796875, -15.63037109375, -14.7265625, -13.82275390625, -12.9189453125, -12.01513671875, -11.111328125, -10.20751953125, -9.3037109375, -8.39990234375, -7.49609375, -6.59228515625, -5.6884765625, -4.78466796875, -3.880859375, -2.97705078125, -2.0732421875, -1.16943359375, -0.265625, 0.63818359375, 1.5419921875, 2.44580078125, 3.349609375, 4.25341796875, 5.1572265625, 6.06103515625, 6.96484375, 7.86865234375, 8.7724609375, 9.67626953125, 10.580078125, 11.48388671875, 12.3876953125, 13.29150390625, 14.1953125, 15.09912109375, 16.0029296875, 16.90673828125, 17.810546875, 18.71435546875, 19.6181640625, 20.52197265625, 21.42578125, 22.32958984375, 23.2333984375, 24.13720703125, 25.041015625, 25.94482421875, 26.8486328125, 27.75244140625, 28.65625]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 6.0, 8.0, 12.0, 10.0, 16.0, 24.0, 25.0, 29.0, 34.0, 50.0, 87.0, 99.0, 162.0, 147.0, 302.0, 529.0, 1817.0, 2004303.0, 1134744.0, 1785.0, 534.0, 265.0, 164.0, 160.0, 90.0, 79.0, 44.0, 38.0, 34.0, 25.0, 22.0, 9.0, 14.0, 16.0, 2.0, 1.0, 6.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-64.5, -62.4833984375, -60.466796875, -58.4501953125, -56.43359375, -54.4169921875, -52.400390625, -50.3837890625, -48.3671875, -46.3505859375, -44.333984375, -42.3173828125, -40.30078125, -38.2841796875, -36.267578125, -34.2509765625, -32.234375, -30.2177734375, -28.201171875, -26.1845703125, -24.16796875, -22.1513671875, -20.134765625, -18.1181640625, -16.1015625, -14.0849609375, -12.068359375, -10.0517578125, -8.03515625, -6.0185546875, -4.001953125, -1.9853515625, 0.03125, 2.0478515625, 4.064453125, 6.0810546875, 8.09765625, 10.1142578125, 12.130859375, 14.1474609375, 16.1640625, 18.1806640625, 20.197265625, 22.2138671875, 24.23046875, 26.2470703125, 28.263671875, 30.2802734375, 32.296875, 34.3134765625, 36.330078125, 38.3466796875, 40.36328125, 42.3798828125, 44.396484375, 46.4130859375, 48.4296875, 50.4462890625, 52.462890625, 54.4794921875, 56.49609375, 58.5126953125, 60.529296875, 62.5458984375, 64.5625]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 75.0, 507.0, 394.0, 37.0], "bins": [-217.60609436035156, -214.08934020996094, -210.57260131835938, -207.05584716796875, -203.5391082763672, -200.02235412597656, -196.505615234375, -192.98886108398438, -189.4721221923828, -185.9553680419922, -182.43862915039062, -178.921875, -175.40513610839844, -171.8883819580078, -168.37164306640625, -164.85488891601562, -161.33815002441406, -157.82139587402344, -154.30465698242188, -150.78790283203125, -147.2711639404297, -143.75440979003906, -140.2376708984375, -136.72091674804688, -133.2041778564453, -129.6874237060547, -126.17068481445312, -122.65393829345703, -119.13719177246094, -115.62044525146484, -112.10369873046875, -108.58695220947266, -105.07019805908203, -101.55345153808594, -98.03670501708984, -94.51995849609375, -91.00321197509766, -87.48646545410156, -83.96971893310547, -80.45297241210938, -76.93622589111328, -73.41947937011719, -69.9027328491211, -66.385986328125, -62.869239807128906, -59.35249328613281, -55.83574676513672, -52.319000244140625, -48.80225372314453, -45.28550720214844, -41.768760681152344, -38.25201416015625, -34.735267639160156, -31.21851921081543, -27.701772689819336, -24.185026168823242, -20.66827964782715, -17.151533126831055, -13.634786605834961, -10.11803913116455, -6.601292610168457, -3.084545135498047, 0.4322013854980469, 3.9489479064941406, 7.465694904327393]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 7.0, 4.0, 14.0, 5.0, 15.0, 7.0, 7.0, 12.0, 15.0, 12.0, 20.0, 25.0, 22.0, 18.0, 32.0, 29.0, 31.0, 36.0, 30.0, 35.0, 42.0, 33.0, 40.0, 40.0, 39.0, 29.0, 31.0, 39.0, 30.0, 32.0, 34.0, 31.0, 24.0, 28.0, 12.0, 15.0, 21.0, 17.0, 14.0, 18.0, 7.0, 5.0, 11.0, 9.0, 6.0, 3.0, 6.0, 6.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-52.272640228271484, -50.53852462768555, -48.804405212402344, -47.070289611816406, -45.33617401123047, -43.60205841064453, -41.86793899536133, -40.13382339477539, -38.39970779418945, -36.665592193603516, -34.93147277832031, -33.197357177734375, -31.463241577148438, -29.729124069213867, -27.995006561279297, -26.26089096069336, -24.52677345275879, -22.79265594482422, -21.05854034423828, -19.32442283630371, -17.590307235717773, -15.856189727783203, -14.12207317352295, -12.387956619262695, -10.653840065002441, -8.919723510742188, -7.185606956481934, -5.4514899253845215, -3.7173733711242676, -1.9832563400268555, -0.24913978576660156, 1.4849767684936523, 3.2190933227539062, 4.95320987701416, 6.687326431274414, 8.421443939208984, 10.155559539794922, 11.889677047729492, 13.623793601989746, 15.35791015625, 17.092025756835938, 18.826143264770508, 20.560258865356445, 22.294376373291016, 24.028491973876953, 25.762609481811523, 27.496726989746094, 29.23084259033203, 30.9649600982666, 32.69907760620117, 34.43319320678711, 36.16730880737305, 37.90142822265625, 39.63554382324219, 41.369659423828125, 43.10377502441406, 44.837894439697266, 46.5720100402832, 48.306129455566406, 50.040245056152344, 51.77436065673828, 53.50847625732422, 55.24259567260742, 56.97671127319336, 58.7108268737793]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 12.0, 11.0, 16.0, 12.0, 31.0, 24.0, 27.0, 19.0, 35.0, 31.0, 50.0, 47.0, 47.0, 50.0, 48.0, 54.0, 54.0, 44.0, 46.0, 47.0, 46.0, 44.0, 23.0, 31.0, 26.0, 26.0, 17.0, 16.0, 17.0, 8.0, 9.0, 11.0, 3.0, 8.0, 8.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5078125, -8.239501953125, -7.97119140625, -7.702880859375, -7.4345703125, -7.166259765625, -6.89794921875, -6.629638671875, -6.361328125, -6.093017578125, -5.82470703125, -5.556396484375, -5.2880859375, -5.019775390625, -4.75146484375, -4.483154296875, -4.21484375, -3.946533203125, -3.67822265625, -3.409912109375, -3.1416015625, -2.873291015625, -2.60498046875, -2.336669921875, -2.068359375, -1.800048828125, -1.53173828125, -1.263427734375, -0.9951171875, -0.726806640625, -0.45849609375, -0.190185546875, 0.078125, 0.346435546875, 0.61474609375, 0.883056640625, 1.1513671875, 1.419677734375, 1.68798828125, 1.956298828125, 2.224609375, 2.492919921875, 2.76123046875, 3.029541015625, 3.2978515625, 3.566162109375, 3.83447265625, 4.102783203125, 4.37109375, 4.639404296875, 4.90771484375, 5.176025390625, 5.4443359375, 5.712646484375, 5.98095703125, 6.249267578125, 6.517578125, 6.785888671875, 7.05419921875, 7.322509765625, 7.5908203125, 7.859130859375, 8.12744140625, 8.395751953125, 8.6640625]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 7.0, 6.0, 10.0, 9.0, 13.0, 21.0, 28.0, 26.0, 30.0, 33.0, 45.0, 69.0, 104.0, 155.0, 412.0, 1636.0, 29517.0, 2878963.0, 1270562.0, 10841.0, 978.0, 288.0, 158.0, 99.0, 61.0, 47.0, 29.0, 29.0, 17.0, 16.0, 18.0, 10.0, 16.0, 9.0, 4.0, 9.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.984375, -30.980712890625, -29.97705078125, -28.973388671875, -27.9697265625, -26.966064453125, -25.96240234375, -24.958740234375, -23.955078125, -22.951416015625, -21.94775390625, -20.944091796875, -19.9404296875, -18.936767578125, -17.93310546875, -16.929443359375, -15.92578125, -14.922119140625, -13.91845703125, -12.914794921875, -11.9111328125, -10.907470703125, -9.90380859375, -8.900146484375, -7.896484375, -6.892822265625, -5.88916015625, -4.885498046875, -3.8818359375, -2.878173828125, -1.87451171875, -0.870849609375, 0.1328125, 1.136474609375, 2.14013671875, 3.143798828125, 4.1474609375, 5.151123046875, 6.15478515625, 7.158447265625, 8.162109375, 9.165771484375, 10.16943359375, 11.173095703125, 12.1767578125, 13.180419921875, 14.18408203125, 15.187744140625, 16.19140625, 17.195068359375, 18.19873046875, 19.202392578125, 20.2060546875, 21.209716796875, 22.21337890625, 23.217041015625, 24.220703125, 25.224365234375, 26.22802734375, 27.231689453125, 28.2353515625, 29.239013671875, 30.24267578125, 31.246337890625, 32.25]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 3.0, 5.0, 5.0, 6.0, 13.0, 17.0, 33.0, 28.0, 56.0, 72.0, 81.0, 108.0, 197.0, 260.0, 337.0, 458.0, 526.0, 473.0, 381.0, 307.0, 193.0, 160.0, 105.0, 74.0, 52.0, 51.0, 29.0, 16.0, 16.0, 9.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.859375, -17.343994140625, -16.82861328125, -16.313232421875, -15.7978515625, -15.282470703125, -14.76708984375, -14.251708984375, -13.736328125, -13.220947265625, -12.70556640625, -12.190185546875, -11.6748046875, -11.159423828125, -10.64404296875, -10.128662109375, -9.61328125, -9.097900390625, -8.58251953125, -8.067138671875, -7.5517578125, -7.036376953125, -6.52099609375, -6.005615234375, -5.490234375, -4.974853515625, -4.45947265625, -3.944091796875, -3.4287109375, -2.913330078125, -2.39794921875, -1.882568359375, -1.3671875, -0.851806640625, -0.33642578125, 0.178955078125, 0.6943359375, 1.209716796875, 1.72509765625, 2.240478515625, 2.755859375, 3.271240234375, 3.78662109375, 4.302001953125, 4.8173828125, 5.332763671875, 5.84814453125, 6.363525390625, 6.87890625, 7.394287109375, 7.90966796875, 8.425048828125, 8.9404296875, 9.455810546875, 9.97119140625, 10.486572265625, 11.001953125, 11.517333984375, 12.03271484375, 12.548095703125, 13.0634765625, 13.578857421875, 14.09423828125, 14.609619140625, 15.125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 5.0, 3.0, 4.0, 2.0, 4.0, 8.0, 6.0, 14.0, 13.0, 17.0, 18.0, 14.0, 28.0, 33.0, 34.0, 56.0, 59.0, 91.0, 127.0, 151.0, 252.0, 431.0, 853.0, 6725.0, 2987351.0, 1191815.0, 4139.0, 771.0, 366.0, 230.0, 165.0, 105.0, 80.0, 64.0, 51.0, 43.0, 34.0, 26.0, 17.0, 16.0, 9.0, 8.0, 9.0, 9.0, 10.0, 6.0, 4.0, 5.0, 2.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-55.46875, -53.55126953125, -51.6337890625, -49.71630859375, -47.798828125, -45.88134765625, -43.9638671875, -42.04638671875, -40.12890625, -38.21142578125, -36.2939453125, -34.37646484375, -32.458984375, -30.54150390625, -28.6240234375, -26.70654296875, -24.7890625, -22.87158203125, -20.9541015625, -19.03662109375, -17.119140625, -15.20166015625, -13.2841796875, -11.36669921875, -9.44921875, -7.53173828125, -5.6142578125, -3.69677734375, -1.779296875, 0.13818359375, 2.0556640625, 3.97314453125, 5.890625, 7.80810546875, 9.7255859375, 11.64306640625, 13.560546875, 15.47802734375, 17.3955078125, 19.31298828125, 21.23046875, 23.14794921875, 25.0654296875, 26.98291015625, 28.900390625, 30.81787109375, 32.7353515625, 34.65283203125, 36.5703125, 38.48779296875, 40.4052734375, 42.32275390625, 44.240234375, 46.15771484375, 48.0751953125, 49.99267578125, 51.91015625, 53.82763671875, 55.7451171875, 57.66259765625, 59.580078125, 61.49755859375, 63.4150390625, 65.33251953125, 67.25]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 37.0, 373.0, 529.0, 72.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.61149597167969, -91.5614013671875, -81.51130676269531, -71.46121978759766, -61.41112518310547, -51.36103057861328, -41.31093978881836, -31.260848999023438, -21.21075439453125, -11.160661697387695, -1.1105690002441406, 8.939523696899414, 18.98961639404297, 29.039710998535156, 39.08980178833008, 49.139892578125, 59.18998718261719, 69.24008178710938, 79.29017639160156, 89.34026336669922, 99.3903579711914, 109.4404525756836, 119.49053955078125, 129.54063415527344, 139.59072875976562, 149.6408233642578, 159.69091796875, 169.7410125732422, 179.79110717773438, 189.8411865234375, 199.8912811279297, 209.94137573242188, 219.991455078125, 230.0415496826172, 240.09164428710938, 250.14173889160156, 260.19183349609375, 270.2419128417969, 280.2920227050781, 290.34210205078125, 300.3922119140625, 310.4422912597656, 320.4924011230469, 330.54248046875, 340.59259033203125, 350.6426696777344, 360.6927795410156, 370.74285888671875, 380.7929382324219, 390.843017578125, 400.89312744140625, 410.9432067871094, 420.9933166503906, 431.04339599609375, 441.093505859375, 451.1435852050781, 461.19366455078125, 471.2437438964844, 481.2938537597656, 491.34393310546875, 501.39404296875, 511.4441223144531, 521.4942016601562, 531.5443115234375, 541.5944213867188]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 3.0, 5.0, 4.0, 8.0, 12.0, 5.0, 16.0, 16.0, 15.0, 15.0, 10.0, 29.0, 25.0, 34.0, 27.0, 34.0, 35.0, 32.0, 34.0, 40.0, 32.0, 35.0, 30.0, 49.0, 31.0, 37.0, 30.0, 28.0, 34.0, 35.0, 24.0, 29.0, 32.0, 15.0, 31.0, 19.0, 19.0, 16.0, 13.0, 10.0, 5.0, 14.0, 6.0, 8.0, 5.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-42.279083251953125, -41.03327560424805, -39.78746795654297, -38.54166030883789, -37.29585266113281, -36.050048828125, -34.80424118041992, -33.558433532714844, -32.312625885009766, -31.066818237304688, -29.82101058959961, -28.575204849243164, -27.329397201538086, -26.083589553833008, -24.837783813476562, -23.591976165771484, -22.346168518066406, -21.100360870361328, -19.85455322265625, -18.608747482299805, -17.362939834594727, -16.11713218688965, -14.871325492858887, -13.625518798828125, -12.379711151123047, -11.133903503417969, -9.888096809387207, -8.642290115356445, -7.396482467651367, -6.150675296783447, -4.904868125915527, -3.6590614318847656, -2.4132537841796875, -1.1674466133117676, 0.07836055755615234, 1.3241677284240723, 2.569974899291992, 3.815782070159912, 5.061589241027832, 6.307395935058594, 7.553203582763672, 8.79901123046875, 10.044817924499512, 11.290624618530273, 12.536432266235352, 13.78223991394043, 15.028046607971191, 16.273853302001953, 17.51966094970703, 18.76546859741211, 20.011276245117188, 21.257081985473633, 22.50288963317871, 23.74869728088379, 24.994503021240234, 26.240310668945312, 27.48611831665039, 28.73192596435547, 29.977733612060547, 31.223539352416992, 32.46934509277344, 33.715152740478516, 34.960960388183594, 36.20676803588867, 37.45257568359375]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 5.0, 12.0, 8.0, 9.0, 8.0, 13.0, 20.0, 21.0, 27.0, 28.0, 19.0, 35.0, 41.0, 44.0, 43.0, 58.0, 51.0, 50.0, 49.0, 42.0, 40.0, 52.0, 41.0, 44.0, 39.0, 36.0, 32.0, 30.0, 20.0, 16.0, 11.0, 12.0, 7.0, 11.0, 8.0, 12.0, 3.0, 5.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6015625, -8.34332275390625, -8.0850830078125, -7.82684326171875, -7.568603515625, -7.31036376953125, -7.0521240234375, -6.79388427734375, -6.53564453125, -6.27740478515625, -6.0191650390625, -5.76092529296875, -5.502685546875, -5.24444580078125, -4.9862060546875, -4.72796630859375, -4.4697265625, -4.21148681640625, -3.9532470703125, -3.69500732421875, -3.436767578125, -3.17852783203125, -2.9202880859375, -2.66204833984375, -2.40380859375, -2.14556884765625, -1.8873291015625, -1.62908935546875, -1.370849609375, -1.11260986328125, -0.8543701171875, -0.59613037109375, -0.337890625, -0.07965087890625, 0.1785888671875, 0.43682861328125, 0.695068359375, 0.95330810546875, 1.2115478515625, 1.46978759765625, 1.72802734375, 1.98626708984375, 2.2445068359375, 2.50274658203125, 2.760986328125, 3.01922607421875, 3.2774658203125, 3.53570556640625, 3.7939453125, 4.05218505859375, 4.3104248046875, 4.56866455078125, 4.826904296875, 5.08514404296875, 5.3433837890625, 5.60162353515625, 5.85986328125, 6.11810302734375, 6.3763427734375, 6.63458251953125, 6.892822265625, 7.15106201171875, 7.4093017578125, 7.66754150390625, 7.92578125]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 6.0, 8.0, 8.0, 13.0, 24.0, 24.0, 30.0, 53.0, 87.0, 129.0, 207.0, 339.0, 517.0, 783.0, 1182.0, 1663.0, 2588.0, 3897.0, 6149.0, 9605.0, 15062.0, 24938.0, 42291.0, 75877.0, 153661.0, 338913.0, 172243.0, 81864.0, 44966.0, 26442.0, 16172.0, 10276.0, 6531.0, 4033.0, 2678.0, 1705.0, 1216.0, 814.0, 580.0, 345.0, 238.0, 130.0, 96.0, 59.0, 34.0, 26.0, 14.0, 17.0, 9.0, 9.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.5458984375, -1.496917724609375, -1.44793701171875, -1.398956298828125, -1.3499755859375, -1.300994873046875, -1.25201416015625, -1.203033447265625, -1.154052734375, -1.105072021484375, -1.05609130859375, -1.007110595703125, -0.9581298828125, -0.909149169921875, -0.86016845703125, -0.811187744140625, -0.76220703125, -0.713226318359375, -0.66424560546875, -0.615264892578125, -0.5662841796875, -0.517303466796875, -0.46832275390625, -0.419342041015625, -0.370361328125, -0.321380615234375, -0.27239990234375, -0.223419189453125, -0.1744384765625, -0.125457763671875, -0.07647705078125, -0.027496337890625, 0.021484375, 0.070465087890625, 0.11944580078125, 0.168426513671875, 0.2174072265625, 0.266387939453125, 0.31536865234375, 0.364349365234375, 0.413330078125, 0.462310791015625, 0.51129150390625, 0.560272216796875, 0.6092529296875, 0.658233642578125, 0.70721435546875, 0.756195068359375, 0.80517578125, 0.854156494140625, 0.90313720703125, 0.952117919921875, 1.0010986328125, 1.050079345703125, 1.09906005859375, 1.148040771484375, 1.197021484375, 1.246002197265625, 1.29498291015625, 1.343963623046875, 1.3929443359375, 1.441925048828125, 1.49090576171875, 1.539886474609375, 1.5888671875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 8.0, 7.0, 4.0, 5.0, 15.0, 10.0, 18.0, 20.0, 23.0, 18.0, 21.0, 41.0, 40.0, 27.0, 35.0, 34.0, 42.0, 55.0, 57.0, 32.0, 1068.0, 46.0, 41.0, 41.0, 40.0, 29.0, 34.0, 29.0, 35.0, 20.0, 24.0, 14.0, 16.0, 21.0, 17.0, 11.0, 12.0, 5.0, 6.0, 3.0, 1.0, 7.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.58984375, -4.44342041015625, -4.2969970703125, -4.15057373046875, -4.004150390625, -3.85772705078125, -3.7113037109375, -3.56488037109375, -3.41845703125, -3.27203369140625, -3.1256103515625, -2.97918701171875, -2.832763671875, -2.68634033203125, -2.5399169921875, -2.39349365234375, -2.2470703125, -2.10064697265625, -1.9542236328125, -1.80780029296875, -1.661376953125, -1.51495361328125, -1.3685302734375, -1.22210693359375, -1.07568359375, -0.92926025390625, -0.7828369140625, -0.63641357421875, -0.489990234375, -0.34356689453125, -0.1971435546875, -0.05072021484375, 0.095703125, 0.24212646484375, 0.3885498046875, 0.53497314453125, 0.681396484375, 0.82781982421875, 0.9742431640625, 1.12066650390625, 1.26708984375, 1.41351318359375, 1.5599365234375, 1.70635986328125, 1.852783203125, 1.99920654296875, 2.1456298828125, 2.29205322265625, 2.4384765625, 2.58489990234375, 2.7313232421875, 2.87774658203125, 3.024169921875, 3.17059326171875, 3.3170166015625, 3.46343994140625, 3.60986328125, 3.75628662109375, 3.9027099609375, 4.04913330078125, 4.195556640625, 4.34197998046875, 4.4884033203125, 4.63482666015625, 4.78125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 0.0, 7.0, 6.0, 5.0, 11.0, 14.0, 27.0, 30.0, 49.0, 69.0, 103.0, 152.0, 246.0, 325.0, 515.0, 786.0, 1130.0, 1814.0, 2714.0, 4259.0, 6520.0, 10142.0, 15909.0, 25840.0, 42189.0, 72408.0, 136394.0, 1361848.0, 187980.0, 89507.0, 51874.0, 31287.0, 18986.0, 12101.0, 7593.0, 5001.0, 3114.0, 2112.0, 1371.0, 883.0, 605.0, 399.0, 257.0, 191.0, 113.0, 78.0, 52.0, 39.0, 31.0, 16.0, 17.0, 8.0, 6.0, 2.0, 4.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-1.328125, -1.2862091064453125, -1.244293212890625, -1.2023773193359375, -1.16046142578125, -1.1185455322265625, -1.076629638671875, -1.0347137451171875, -0.9927978515625, -0.9508819580078125, -0.908966064453125, -0.8670501708984375, -0.82513427734375, -0.7832183837890625, -0.741302490234375, -0.6993865966796875, -0.657470703125, -0.6155548095703125, -0.573638916015625, -0.5317230224609375, -0.48980712890625, -0.4478912353515625, -0.405975341796875, -0.3640594482421875, -0.3221435546875, -0.2802276611328125, -0.238311767578125, -0.1963958740234375, -0.15447998046875, -0.1125640869140625, -0.070648193359375, -0.0287322998046875, 0.01318359375, 0.0550994873046875, 0.097015380859375, 0.1389312744140625, 0.18084716796875, 0.2227630615234375, 0.264678955078125, 0.3065948486328125, 0.3485107421875, 0.3904266357421875, 0.432342529296875, 0.4742584228515625, 0.51617431640625, 0.5580902099609375, 0.600006103515625, 0.6419219970703125, 0.683837890625, 0.7257537841796875, 0.767669677734375, 0.8095855712890625, 0.85150146484375, 0.8934173583984375, 0.935333251953125, 0.9772491455078125, 1.0191650390625, 1.0610809326171875, 1.102996826171875, 1.1449127197265625, 1.18682861328125, 1.2287445068359375, 1.270660400390625, 1.3125762939453125, 1.3544921875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 5.0, 6.0, 17.0, 10.0, 19.0, 14.0, 25.0, 24.0, 30.0, 21.0, 22.0, 30.0, 43.0, 44.0, 46.0, 38.0, 68.0, 55.0, 49.0, 58.0, 50.0, 45.0, 41.0, 33.0, 27.0, 33.0, 23.0, 21.0, 14.0, 15.0, 10.0, 12.0, 9.0, 6.0, 6.0, 3.0, 5.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0004620552062988281, -0.00044658035039901733, -0.00043110549449920654, -0.00041563063859939575, -0.00040015578269958496, -0.00038468092679977417, -0.0003692060708999634, -0.0003537312150001526, -0.0003382563591003418, -0.000322781503200531, -0.0003073066473007202, -0.0002918317914009094, -0.00027635693550109863, -0.00026088207960128784, -0.00024540722370147705, -0.00022993236780166626, -0.00021445751190185547, -0.00019898265600204468, -0.0001835078001022339, -0.0001680329442024231, -0.0001525580883026123, -0.00013708323240280151, -0.00012160837650299072, -0.00010613352060317993, -9.065866470336914e-05, -7.518380880355835e-05, -5.970895290374756e-05, -4.423409700393677e-05, -2.8759241104125977e-05, -1.3284385204315186e-05, 2.1904706954956055e-06, 1.7665326595306396e-05, 3.314018249511719e-05, 4.861503839492798e-05, 6.408989429473877e-05, 7.956475019454956e-05, 9.503960609436035e-05, 0.00011051446199417114, 0.00012598931789398193, 0.00014146417379379272, 0.00015693902969360352, 0.0001724138855934143, 0.0001878887414932251, 0.0002033635973930359, 0.00021883845329284668, 0.00023431330919265747, 0.00024978816509246826, 0.00026526302099227905, 0.00028073787689208984, 0.00029621273279190063, 0.0003116875886917114, 0.0003271624445915222, 0.000342637300491333, 0.0003581121563911438, 0.0003735870122909546, 0.0003890618681907654, 0.00040453672409057617, 0.00042001157999038696, 0.00043548643589019775, 0.00045096129179000854, 0.00046643614768981934, 0.0004819110035896301, 0.0004973858594894409, 0.0005128607153892517, 0.0005283355712890625]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 3.0, 1.0, 11.0, 8.0, 6.0, 14.0, 18.0, 9.0, 20.0, 26.0, 46.0, 34.0, 58.0, 91.0, 155.0, 361.0, 871.0, 28048.0, 1013067.0, 4288.0, 657.0, 256.0, 123.0, 77.0, 59.0, 31.0, 54.0, 29.0, 31.0, 20.0, 10.0, 14.0, 13.0, 11.0, 8.0, 8.0, 4.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.0156097412109375, -0.015180230140686035, -0.01475071907043457, -0.014321208000183105, -0.01389169692993164, -0.013462185859680176, -0.013032674789428711, -0.012603163719177246, -0.012173652648925781, -0.011744141578674316, -0.011314630508422852, -0.010885119438171387, -0.010455608367919922, -0.010026097297668457, -0.009596586227416992, -0.009167075157165527, -0.008737564086914062, -0.008308053016662598, -0.007878541946411133, -0.007449030876159668, -0.007019519805908203, -0.006590008735656738, -0.0061604976654052734, -0.005730986595153809, -0.005301475524902344, -0.004871964454650879, -0.004442453384399414, -0.004012942314147949, -0.0035834312438964844, -0.0031539201736450195, -0.0027244091033935547, -0.00229489803314209, -0.001865386962890625, -0.0014358758926391602, -0.0010063648223876953, -0.0005768537521362305, -0.00014734268188476562, 0.0002821683883666992, 0.0007116794586181641, 0.001141190528869629, 0.0015707015991210938, 0.0020002126693725586, 0.0024297237396240234, 0.0028592348098754883, 0.003288745880126953, 0.003718256950378418, 0.004147768020629883, 0.004577279090881348, 0.0050067901611328125, 0.005436301231384277, 0.005865812301635742, 0.006295323371887207, 0.006724834442138672, 0.007154345512390137, 0.0075838565826416016, 0.008013367652893066, 0.008442878723144531, 0.008872389793395996, 0.009301900863647461, 0.009731411933898926, 0.01016092300415039, 0.010590434074401855, 0.01101994514465332, 0.011449456214904785, 0.01187896728515625]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 9.0, 8.0, 25.0, 51.0, 124.0, 173.0, 224.0, 158.0, 122.0, 69.0, 28.0, 11.0, 9.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0006575408042408526, -0.0006366601446643472, -0.0006157794850878417, -0.0005948988255113363, -0.0005740182241424918, -0.0005531375645659864, -0.000532256904989481, -0.0005113762454129755, -0.0004904955858364701, -0.0004696149262599647, -0.0004487342666834593, -0.0004278536362107843, -0.0004069729766342789, -0.00038609231705777347, -0.0003652116865850985, -0.0003443310270085931, -0.00032345036743208766, -0.00030256970785558224, -0.0002816890482790768, -0.00026080841780640185, -0.00023992775822989643, -0.000219047098653391, -0.0001981664536288008, -0.00017728580860421062, -0.0001564051490277052, -0.00013552448945119977, -0.00011464384442660958, -9.376319212606177e-05, -7.288253982551396e-05, -5.200188752496615e-05, -3.112123522441834e-05, -1.0240590199828148e-05, 1.0640011169016361e-05, 3.152066346956417e-05, 5.240131577011198e-05, 7.328196807065979e-05, 9.41626203712076e-05, 0.0001150432726717554, 0.0001359239249723032, 0.0001568045699968934, 0.00017768522957339883, 0.00019856588914990425, 0.00021944653417449445, 0.00024032717919908464, 0.00026120783877559006, 0.0002820884983520955, 0.00030296912882477045, 0.0003238497884012759, 0.0003447304479777813, 0.0003656111075542867, 0.00038649176713079214, 0.0004073723976034671, 0.00042825305717997253, 0.00044913371675647795, 0.0004700143472291529, 0.0004908950068056583, 0.0005117756663821638, 0.0005326563259586692, 0.0005535369855351746, 0.00057441764511168, 0.0005952982464805245, 0.00061617890605703, 0.0006370595656335354, 0.0006579402252100408, 0.0006788208847865462]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 10.0, 12.0, 9.0, 14.0, 13.0, 24.0, 21.0, 24.0, 31.0, 24.0, 31.0, 37.0, 31.0, 44.0, 35.0, 38.0, 47.0, 45.0, 43.0, 36.0, 49.0, 48.0, 43.0, 25.0, 41.0, 39.0, 15.0, 18.0, 22.0, 22.0, 19.0, 15.0, 18.0, 11.0, 8.0, 6.0, 5.0, 4.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.000274658203125, -0.0002651410177350044, -0.00025562383234500885, -0.0002461066469550133, -0.0002365894615650177, -0.00022707227617502213, -0.00021755509078502655, -0.00020803790539503098, -0.0001985207200050354, -0.00018900353461503983, -0.00017948634922504425, -0.00016996916383504868, -0.0001604519784450531, -0.00015093479305505753, -0.00014141760766506195, -0.00013190042227506638, -0.0001223832368850708, -0.00011286605149507523, -0.00010334886610507965, -9.383168071508408e-05, -8.43144953250885e-05, -7.479730993509293e-05, -6.528012454509735e-05, -5.5762939155101776e-05, -4.62457537651062e-05, -3.6728568375110626e-05, -2.721138298511505e-05, -1.7694197595119476e-05, -8.177012205123901e-06, 1.3401731848716736e-06, 1.0857358574867249e-05, 2.0374543964862823e-05, 2.98917293548584e-05, 3.9408914744853973e-05, 4.892610013484955e-05, 5.844328552484512e-05, 6.79604709148407e-05, 7.747765630483627e-05, 8.699484169483185e-05, 9.651202708482742e-05, 0.000106029212474823, 0.00011554639786481857, 0.00012506358325481415, 0.00013458076864480972, 0.0001440979540348053, 0.00015361513942480087, 0.00016313232481479645, 0.00017264951020479202, 0.0001821666955947876, 0.00019168388098478317, 0.00020120106637477875, 0.00021071825176477432, 0.0002202354371547699, 0.00022975262254476547, 0.00023926980793476105, 0.0002487869933247566, 0.0002583041787147522, 0.00026782136410474777, 0.00027733854949474335, 0.0002868557348847389, 0.0002963729202747345, 0.00030589010566473007, 0.00031540729105472565, 0.0003249244764447212, 0.0003344416618347168]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 5.0, 12.0, 8.0, 9.0, 8.0, 13.0, 20.0, 21.0, 27.0, 28.0, 19.0, 35.0, 41.0, 44.0, 43.0, 58.0, 51.0, 50.0, 49.0, 42.0, 40.0, 52.0, 41.0, 44.0, 39.0, 36.0, 32.0, 30.0, 20.0, 16.0, 11.0, 12.0, 7.0, 11.0, 8.0, 12.0, 3.0, 5.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6015625, -8.34332275390625, -8.0850830078125, -7.82684326171875, -7.568603515625, -7.31036376953125, -7.0521240234375, -6.79388427734375, -6.53564453125, -6.27740478515625, -6.0191650390625, -5.76092529296875, -5.502685546875, -5.24444580078125, -4.9862060546875, -4.72796630859375, -4.4697265625, -4.21148681640625, -3.9532470703125, -3.69500732421875, -3.436767578125, -3.17852783203125, -2.9202880859375, -2.66204833984375, -2.40380859375, -2.14556884765625, -1.8873291015625, -1.62908935546875, -1.370849609375, -1.11260986328125, -0.8543701171875, -0.59613037109375, -0.337890625, -0.07965087890625, 0.1785888671875, 0.43682861328125, 0.695068359375, 0.95330810546875, 1.2115478515625, 1.46978759765625, 1.72802734375, 1.98626708984375, 2.2445068359375, 2.50274658203125, 2.760986328125, 3.01922607421875, 3.2774658203125, 3.53570556640625, 3.7939453125, 4.05218505859375, 4.3104248046875, 4.56866455078125, 4.826904296875, 5.08514404296875, 5.3433837890625, 5.60162353515625, 5.85986328125, 6.11810302734375, 6.3763427734375, 6.63458251953125, 6.892822265625, 7.15106201171875, 7.4093017578125, 7.66754150390625, 7.92578125]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 5.0, 3.0, 4.0, 5.0, 9.0, 6.0, 13.0, 14.0, 15.0, 26.0, 21.0, 40.0, 39.0, 71.0, 78.0, 113.0, 156.0, 220.0, 280.0, 447.0, 749.0, 1272.0, 2421.0, 5259.0, 13534.0, 38446.0, 125392.0, 505877.0, 248060.0, 67299.0, 22402.0, 8181.0, 3519.0, 1768.0, 925.0, 594.0, 356.0, 258.0, 185.0, 116.0, 88.0, 67.0, 57.0, 40.0, 35.0, 23.0, 22.0, 11.0, 8.0, 13.0, 8.0, 7.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.6640625, -7.43695068359375, -7.2098388671875, -6.98272705078125, -6.755615234375, -6.52850341796875, -6.3013916015625, -6.07427978515625, -5.84716796875, -5.62005615234375, -5.3929443359375, -5.16583251953125, -4.938720703125, -4.71160888671875, -4.4844970703125, -4.25738525390625, -4.0302734375, -3.80316162109375, -3.5760498046875, -3.34893798828125, -3.121826171875, -2.89471435546875, -2.6676025390625, -2.44049072265625, -2.21337890625, -1.98626708984375, -1.7591552734375, -1.53204345703125, -1.304931640625, -1.07781982421875, -0.8507080078125, -0.62359619140625, -0.396484375, -0.16937255859375, 0.0577392578125, 0.28485107421875, 0.511962890625, 0.73907470703125, 0.9661865234375, 1.19329833984375, 1.42041015625, 1.64752197265625, 1.8746337890625, 2.10174560546875, 2.328857421875, 2.55596923828125, 2.7830810546875, 3.01019287109375, 3.2373046875, 3.46441650390625, 3.6915283203125, 3.91864013671875, 4.145751953125, 4.37286376953125, 4.5999755859375, 4.82708740234375, 5.05419921875, 5.28131103515625, 5.5084228515625, 5.73553466796875, 5.962646484375, 6.18975830078125, 6.4168701171875, 6.64398193359375, 6.87109375]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 3.0, 6.0, 2.0, 9.0, 6.0, 10.0, 5.0, 19.0, 11.0, 16.0, 18.0, 21.0, 30.0, 31.0, 42.0, 41.0, 51.0, 50.0, 68.0, 96.0, 212.0, 1669.0, 175.0, 77.0, 65.0, 48.0, 48.0, 46.0, 25.0, 15.0, 22.0, 20.0, 28.0, 15.0, 14.0, 10.0, 8.0, 8.0, 2.0, 5.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.390625, -18.595703125, -17.80078125, -17.005859375, -16.2109375, -15.416015625, -14.62109375, -13.826171875, -13.03125, -12.236328125, -11.44140625, -10.646484375, -9.8515625, -9.056640625, -8.26171875, -7.466796875, -6.671875, -5.876953125, -5.08203125, -4.287109375, -3.4921875, -2.697265625, -1.90234375, -1.107421875, -0.3125, 0.482421875, 1.27734375, 2.072265625, 2.8671875, 3.662109375, 4.45703125, 5.251953125, 6.046875, 6.841796875, 7.63671875, 8.431640625, 9.2265625, 10.021484375, 10.81640625, 11.611328125, 12.40625, 13.201171875, 13.99609375, 14.791015625, 15.5859375, 16.380859375, 17.17578125, 17.970703125, 18.765625, 19.560546875, 20.35546875, 21.150390625, 21.9453125, 22.740234375, 23.53515625, 24.330078125, 25.125, 25.919921875, 26.71484375, 27.509765625, 28.3046875, 29.099609375, 29.89453125, 30.689453125, 31.484375]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 6.0, 5.0, 7.0, 18.0, 15.0, 25.0, 39.0, 54.0, 54.0, 85.0, 134.0, 268.0, 417.0, 1256.0, 187773.0, 2952015.0, 2170.0, 513.0, 285.0, 171.0, 122.0, 84.0, 54.0, 41.0, 30.0, 24.0, 15.0, 8.0, 9.0, 8.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.625, -68.984375, -66.34375, -63.703125, -61.0625, -58.421875, -55.78125, -53.140625, -50.5, -47.859375, -45.21875, -42.578125, -39.9375, -37.296875, -34.65625, -32.015625, -29.375, -26.734375, -24.09375, -21.453125, -18.8125, -16.171875, -13.53125, -10.890625, -8.25, -5.609375, -2.96875, -0.328125, 2.3125, 4.953125, 7.59375, 10.234375, 12.875, 15.515625, 18.15625, 20.796875, 23.4375, 26.078125, 28.71875, 31.359375, 34.0, 36.640625, 39.28125, 41.921875, 44.5625, 47.203125, 49.84375, 52.484375, 55.125, 57.765625, 60.40625, 63.046875, 65.6875, 68.328125, 70.96875, 73.609375, 76.25, 78.890625, 81.53125, 84.171875, 86.8125, 89.453125, 92.09375, 94.734375, 97.375]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 79.0, 459.0, 415.0, 53.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.370668411254883, -22.769210815429688, -18.16775131225586, -13.566293716430664, -8.964836120605469, -4.363378524780273, 0.2380809783935547, 4.839536666870117, 9.440996170043945, 14.04245376586914, 18.64391326904297, 23.245370864868164, 27.84682846069336, 32.44828796386719, 37.04974365234375, 41.65119934082031, 46.252662658691406, 50.854122161865234, 55.4555778503418, 60.057037353515625, 64.65849304199219, 69.25994873046875, 73.86141204833984, 78.4628677368164, 83.06432342529297, 87.66577911376953, 92.26724243164062, 96.86869812011719, 101.47015380859375, 106.07160949707031, 110.6730728149414, 115.27452850341797, 119.87599182128906, 124.47744750976562, 129.0789031982422, 133.68035888671875, 138.28182983398438, 142.88328552246094, 147.4847412109375, 152.08619689941406, 156.68765258789062, 161.2891082763672, 165.89056396484375, 170.49203491210938, 175.09349060058594, 179.6949462890625, 184.29640197753906, 188.89785766601562, 193.49932861328125, 198.1007843017578, 202.70223999023438, 207.3037109375, 211.90516662597656, 216.50662231445312, 221.1080780029297, 225.70953369140625, 230.3109893798828, 234.91244506835938, 239.51390075683594, 244.1153564453125, 248.71682739257812, 253.3182830810547, 257.91973876953125, 262.52117919921875, 267.1226501464844]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 9.0, 9.0, 11.0, 8.0, 11.0, 15.0, 14.0, 19.0, 13.0, 18.0, 19.0, 23.0, 22.0, 36.0, 30.0, 30.0, 36.0, 32.0, 35.0, 28.0, 43.0, 33.0, 38.0, 38.0, 29.0, 45.0, 35.0, 33.0, 28.0, 25.0, 29.0, 29.0, 25.0, 14.0, 26.0, 19.0, 14.0, 13.0, 7.0, 7.0, 8.0, 12.0, 7.0, 5.0, 6.0, 6.0, 2.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.5810546875, -56.7160758972168, -54.851097106933594, -52.986114501953125, -51.12113571166992, -49.25615692138672, -47.391178131103516, -45.52619934082031, -43.661216735839844, -41.79623794555664, -39.93125915527344, -38.06627655029297, -36.201297760009766, -34.33631896972656, -32.47134017944336, -30.606361389160156, -28.741382598876953, -26.87640380859375, -25.011423110961914, -23.14644432067871, -21.281463623046875, -19.416484832763672, -17.55150604248047, -15.68652629852295, -13.82154655456543, -11.95656681060791, -10.09158706665039, -8.226608276367188, -6.361628532409668, -4.496648788452148, -2.6316699981689453, -0.7666902542114258, 1.0982856750488281, 2.9632651805877686, 4.828244686126709, 6.69322395324707, 8.55820369720459, 10.42318344116211, 12.288162231445312, 14.153141975402832, 16.01812171936035, 17.883100509643555, 19.74808120727539, 21.613059997558594, 23.478038787841797, 25.343019485473633, 27.207998275756836, 29.072978973388672, 30.937957763671875, 32.80293655395508, 34.66791534423828, 36.53289794921875, 38.39787673950195, 40.262855529785156, 42.12783432006836, 43.99281311035156, 45.85779571533203, 47.722774505615234, 49.58775329589844, 51.452735900878906, 53.31771469116211, 55.18269348144531, 57.047672271728516, 58.91265106201172, 60.77762985229492]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 7.0, 1.0, 1.0, 11.0, 8.0, 9.0, 7.0, 18.0, 13.0, 21.0, 21.0, 27.0, 25.0, 45.0, 41.0, 34.0, 36.0, 48.0, 50.0, 52.0, 45.0, 37.0, 38.0, 45.0, 34.0, 40.0, 55.0, 23.0, 50.0, 26.0, 32.0, 16.0, 20.0, 11.0, 10.0, 7.0, 13.0, 10.0, 10.0, 3.0, 2.0, 2.0, 0.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.15625, -8.89300537109375, -8.6297607421875, -8.36651611328125, -8.103271484375, -7.84002685546875, -7.5767822265625, -7.31353759765625, -7.05029296875, -6.78704833984375, -6.5238037109375, -6.26055908203125, -5.997314453125, -5.73406982421875, -5.4708251953125, -5.20758056640625, -4.9443359375, -4.68109130859375, -4.4178466796875, -4.15460205078125, -3.891357421875, -3.62811279296875, -3.3648681640625, -3.10162353515625, -2.83837890625, -2.57513427734375, -2.3118896484375, -2.04864501953125, -1.785400390625, -1.52215576171875, -1.2589111328125, -0.99566650390625, -0.732421875, -0.46917724609375, -0.2059326171875, 0.05731201171875, 0.320556640625, 0.58380126953125, 0.8470458984375, 1.11029052734375, 1.37353515625, 1.63677978515625, 1.9000244140625, 2.16326904296875, 2.426513671875, 2.68975830078125, 2.9530029296875, 3.21624755859375, 3.4794921875, 3.74273681640625, 4.0059814453125, 4.26922607421875, 4.532470703125, 4.79571533203125, 5.0589599609375, 5.32220458984375, 5.58544921875, 5.84869384765625, 6.1119384765625, 6.37518310546875, 6.638427734375, 6.90167236328125, 7.1649169921875, 7.42816162109375, 7.69140625]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 6.0, 7.0, 6.0, 5.0, 11.0, 16.0, 18.0, 17.0, 17.0, 19.0, 27.0, 30.0, 37.0, 42.0, 90.0, 196.0, 577.0, 3472.0, 93790.0, 3535685.0, 550862.0, 7752.0, 980.0, 240.0, 80.0, 40.0, 36.0, 51.0, 29.0, 30.0, 24.0, 12.0, 18.0, 15.0, 13.0, 7.0, 6.0, 5.0, 6.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-33.0625, -32.10888671875, -31.1552734375, -30.20166015625, -29.248046875, -28.29443359375, -27.3408203125, -26.38720703125, -25.43359375, -24.47998046875, -23.5263671875, -22.57275390625, -21.619140625, -20.66552734375, -19.7119140625, -18.75830078125, -17.8046875, -16.85107421875, -15.8974609375, -14.94384765625, -13.990234375, -13.03662109375, -12.0830078125, -11.12939453125, -10.17578125, -9.22216796875, -8.2685546875, -7.31494140625, -6.361328125, -5.40771484375, -4.4541015625, -3.50048828125, -2.546875, -1.59326171875, -0.6396484375, 0.31396484375, 1.267578125, 2.22119140625, 3.1748046875, 4.12841796875, 5.08203125, 6.03564453125, 6.9892578125, 7.94287109375, 8.896484375, 9.85009765625, 10.8037109375, 11.75732421875, 12.7109375, 13.66455078125, 14.6181640625, 15.57177734375, 16.525390625, 17.47900390625, 18.4326171875, 19.38623046875, 20.33984375, 21.29345703125, 22.2470703125, 23.20068359375, 24.154296875, 25.10791015625, 26.0615234375, 27.01513671875, 27.96875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 6.0, 8.0, 12.0, 14.0, 12.0, 13.0, 30.0, 44.0, 61.0, 55.0, 114.0, 137.0, 244.0, 308.0, 407.0, 472.0, 538.0, 410.0, 354.0, 231.0, 163.0, 125.0, 83.0, 66.0, 43.0, 29.0, 27.0, 22.0, 9.0, 11.0, 7.0, 6.0, 4.0, 3.0, 2.0, 0.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.9921875, -15.4796142578125, -14.967041015625, -14.4544677734375, -13.94189453125, -13.4293212890625, -12.916748046875, -12.4041748046875, -11.8916015625, -11.3790283203125, -10.866455078125, -10.3538818359375, -9.84130859375, -9.3287353515625, -8.816162109375, -8.3035888671875, -7.791015625, -7.2784423828125, -6.765869140625, -6.2532958984375, -5.74072265625, -5.2281494140625, -4.715576171875, -4.2030029296875, -3.6904296875, -3.1778564453125, -2.665283203125, -2.1527099609375, -1.64013671875, -1.1275634765625, -0.614990234375, -0.1024169921875, 0.41015625, 0.9227294921875, 1.435302734375, 1.9478759765625, 2.46044921875, 2.9730224609375, 3.485595703125, 3.9981689453125, 4.5107421875, 5.0233154296875, 5.535888671875, 6.0484619140625, 6.56103515625, 7.0736083984375, 7.586181640625, 8.0987548828125, 8.611328125, 9.1239013671875, 9.636474609375, 10.1490478515625, 10.66162109375, 11.1741943359375, 11.686767578125, 12.1993408203125, 12.7119140625, 13.2244873046875, 13.737060546875, 14.2496337890625, 14.76220703125, 15.2747802734375, 15.787353515625, 16.2999267578125, 16.8125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 9.0, 5.0, 6.0, 14.0, 16.0, 25.0, 25.0, 33.0, 42.0, 52.0, 58.0, 74.0, 84.0, 112.0, 171.0, 199.0, 285.0, 516.0, 1312.0, 63621.0, 4099725.0, 25217.0, 1046.0, 485.0, 295.0, 194.0, 145.0, 109.0, 79.0, 67.0, 49.0, 48.0, 23.0, 33.0, 19.0, 26.0, 11.0, 15.0, 13.0, 6.0, 3.0, 3.0, 5.0, 1.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-69.125, -66.9931640625, -64.861328125, -62.7294921875, -60.59765625, -58.4658203125, -56.333984375, -54.2021484375, -52.0703125, -49.9384765625, -47.806640625, -45.6748046875, -43.54296875, -41.4111328125, -39.279296875, -37.1474609375, -35.015625, -32.8837890625, -30.751953125, -28.6201171875, -26.48828125, -24.3564453125, -22.224609375, -20.0927734375, -17.9609375, -15.8291015625, -13.697265625, -11.5654296875, -9.43359375, -7.3017578125, -5.169921875, -3.0380859375, -0.90625, 1.2255859375, 3.357421875, 5.4892578125, 7.62109375, 9.7529296875, 11.884765625, 14.0166015625, 16.1484375, 18.2802734375, 20.412109375, 22.5439453125, 24.67578125, 26.8076171875, 28.939453125, 31.0712890625, 33.203125, 35.3349609375, 37.466796875, 39.5986328125, 41.73046875, 43.8623046875, 45.994140625, 48.1259765625, 50.2578125, 52.3896484375, 54.521484375, 56.6533203125, 58.78515625, 60.9169921875, 63.048828125, 65.1806640625, 67.3125]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 383.0, 612.0, 17.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-428.6784973144531, -413.42657470703125, -398.1746520996094, -382.9227294921875, -367.67083740234375, -352.4189147949219, -337.1669921875, -321.9150695800781, -306.66314697265625, -291.4112243652344, -276.1593017578125, -260.90740966796875, -245.65548706054688, -230.403564453125, -215.15164184570312, -199.89971923828125, -184.6478271484375, -169.39590454101562, -154.1439971923828, -138.89207458496094, -123.6401596069336, -108.38824462890625, -93.13632202148438, -77.88440704345703, -62.63249206542969, -47.380577087402344, -32.128658294677734, -16.876739501953125, -1.6248245239257812, 13.627090454101562, 28.879013061523438, 44.13092803955078, 59.3828125, 74.63472747802734, 89.88664245605469, 105.13856506347656, 120.3904800415039, 135.64239501953125, 150.89431762695312, 166.146240234375, 181.3981475830078, 196.6500701904297, 211.9019775390625, 227.15390014648438, 242.40582275390625, 257.65771484375, 272.90966796875, 288.16156005859375, 303.4134826660156, 318.6654052734375, 333.9173278808594, 349.16925048828125, 364.421142578125, 379.6730651855469, 394.92498779296875, 410.1769104003906, 425.4288330078125, 440.6807556152344, 455.93267822265625, 471.1845703125, 486.4364929199219, 501.68841552734375, 516.9403076171875, 532.1922607421875, 547.4441528320312]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 2.0, 7.0, 4.0, 9.0, 6.0, 8.0, 12.0, 16.0, 14.0, 20.0, 25.0, 23.0, 30.0, 30.0, 36.0, 31.0, 39.0, 28.0, 32.0, 24.0, 42.0, 30.0, 37.0, 46.0, 41.0, 42.0, 35.0, 29.0, 40.0, 34.0, 31.0, 27.0, 22.0, 21.0, 23.0, 21.0, 18.0, 9.0, 5.0, 12.0, 5.0, 7.0, 11.0, 10.0, 1.0, 0.0, 5.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-44.29730224609375, -42.754615783691406, -41.21193313598633, -39.669246673583984, -38.126564025878906, -36.58387756347656, -35.04119110107422, -33.49850845336914, -31.95582389831543, -30.41313934326172, -28.870454788208008, -27.327770233154297, -25.785083770751953, -24.242401123046875, -22.69971466064453, -21.15703010559082, -19.61434555053711, -18.0716609954834, -16.528976440429688, -14.98629093170166, -13.44360637664795, -11.900921821594238, -10.358236312866211, -8.8155517578125, -7.272867202758789, -5.730182647705078, -4.187497615814209, -2.64481258392334, -1.102128028869629, 0.44055652618408203, 1.9832420349121094, 3.5259265899658203, 5.068611145019531, 6.611295700073242, 8.153980255126953, 9.69666576385498, 11.239350318908691, 12.782034873962402, 14.32472038269043, 15.86740493774414, 17.41008949279785, 18.952774047851562, 20.495458602905273, 22.038143157958984, 23.580829620361328, 25.123512268066406, 26.66619873046875, 28.20888328552246, 29.751567840576172, 31.294252395629883, 32.836936950683594, 34.37962341308594, 35.922306060791016, 37.46499252319336, 39.00767517089844, 40.55036163330078, 42.093048095703125, 43.63573455810547, 45.17841720581055, 46.72110366821289, 48.26378631591797, 49.80647277832031, 51.349159240722656, 52.891841888427734, 54.43452453613281]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 11.0, 6.0, 9.0, 10.0, 16.0, 10.0, 13.0, 25.0, 18.0, 28.0, 35.0, 41.0, 43.0, 35.0, 42.0, 43.0, 44.0, 45.0, 53.0, 46.0, 48.0, 36.0, 45.0, 49.0, 41.0, 29.0, 24.0, 23.0, 25.0, 17.0, 22.0, 16.0, 10.0, 12.0, 12.0, 7.0, 5.0, 8.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.125, -7.8662109375, -7.607421875, -7.3486328125, -7.08984375, -6.8310546875, -6.572265625, -6.3134765625, -6.0546875, -5.7958984375, -5.537109375, -5.2783203125, -5.01953125, -4.7607421875, -4.501953125, -4.2431640625, -3.984375, -3.7255859375, -3.466796875, -3.2080078125, -2.94921875, -2.6904296875, -2.431640625, -2.1728515625, -1.9140625, -1.6552734375, -1.396484375, -1.1376953125, -0.87890625, -0.6201171875, -0.361328125, -0.1025390625, 0.15625, 0.4150390625, 0.673828125, 0.9326171875, 1.19140625, 1.4501953125, 1.708984375, 1.9677734375, 2.2265625, 2.4853515625, 2.744140625, 3.0029296875, 3.26171875, 3.5205078125, 3.779296875, 4.0380859375, 4.296875, 4.5556640625, 4.814453125, 5.0732421875, 5.33203125, 5.5908203125, 5.849609375, 6.1083984375, 6.3671875, 6.6259765625, 6.884765625, 7.1435546875, 7.40234375, 7.6611328125, 7.919921875, 8.1787109375, 8.4375]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 3.0, 6.0, 17.0, 22.0, 33.0, 36.0, 75.0, 86.0, 129.0, 191.0, 285.0, 558.0, 832.0, 1393.0, 2167.0, 3352.0, 5353.0, 8789.0, 14530.0, 23863.0, 39721.0, 71390.0, 142594.0, 338333.0, 187175.0, 87555.0, 47849.0, 28047.0, 16803.0, 10399.0, 6307.0, 3956.0, 2506.0, 1568.0, 940.0, 635.0, 357.0, 233.0, 146.0, 115.0, 72.0, 44.0, 32.0, 22.0, 15.0, 8.0, 8.0, 3.0, 1.0, 6.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.712890625, -1.6604461669921875, -1.608001708984375, -1.5555572509765625, -1.50311279296875, -1.4506683349609375, -1.398223876953125, -1.3457794189453125, -1.2933349609375, -1.2408905029296875, -1.188446044921875, -1.1360015869140625, -1.08355712890625, -1.0311126708984375, -0.978668212890625, -0.9262237548828125, -0.873779296875, -0.8213348388671875, -0.768890380859375, -0.7164459228515625, -0.66400146484375, -0.6115570068359375, -0.559112548828125, -0.5066680908203125, -0.4542236328125, -0.4017791748046875, -0.349334716796875, -0.2968902587890625, -0.24444580078125, -0.1920013427734375, -0.139556884765625, -0.0871124267578125, -0.03466796875, 0.0177764892578125, 0.070220947265625, 0.1226654052734375, 0.17510986328125, 0.2275543212890625, 0.279998779296875, 0.3324432373046875, 0.3848876953125, 0.4373321533203125, 0.489776611328125, 0.5422210693359375, 0.59466552734375, 0.6471099853515625, 0.699554443359375, 0.7519989013671875, 0.804443359375, 0.8568878173828125, 0.909332275390625, 0.9617767333984375, 1.01422119140625, 1.0666656494140625, 1.119110107421875, 1.1715545654296875, 1.2239990234375, 1.2764434814453125, 1.328887939453125, 1.3813323974609375, 1.43377685546875, 1.4862213134765625, 1.538665771484375, 1.5911102294921875, 1.6435546875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 4.0, 10.0, 9.0, 8.0, 6.0, 6.0, 7.0, 12.0, 16.0, 20.0, 26.0, 21.0, 34.0, 36.0, 30.0, 43.0, 37.0, 48.0, 33.0, 32.0, 35.0, 50.0, 1058.0, 37.0, 48.0, 37.0, 26.0, 29.0, 32.0, 28.0, 31.0, 22.0, 30.0, 22.0, 14.0, 18.0, 17.0, 12.0, 11.0, 6.0, 4.0, 7.0, 7.0, 4.0, 4.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.4375, -4.295166015625, -4.15283203125, -4.010498046875, -3.8681640625, -3.725830078125, -3.58349609375, -3.441162109375, -3.298828125, -3.156494140625, -3.01416015625, -2.871826171875, -2.7294921875, -2.587158203125, -2.44482421875, -2.302490234375, -2.16015625, -2.017822265625, -1.87548828125, -1.733154296875, -1.5908203125, -1.448486328125, -1.30615234375, -1.163818359375, -1.021484375, -0.879150390625, -0.73681640625, -0.594482421875, -0.4521484375, -0.309814453125, -0.16748046875, -0.025146484375, 0.1171875, 0.259521484375, 0.40185546875, 0.544189453125, 0.6865234375, 0.828857421875, 0.97119140625, 1.113525390625, 1.255859375, 1.398193359375, 1.54052734375, 1.682861328125, 1.8251953125, 1.967529296875, 2.10986328125, 2.252197265625, 2.39453125, 2.536865234375, 2.67919921875, 2.821533203125, 2.9638671875, 3.106201171875, 3.24853515625, 3.390869140625, 3.533203125, 3.675537109375, 3.81787109375, 3.960205078125, 4.1025390625, 4.244873046875, 4.38720703125, 4.529541015625, 4.671875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 3.0, 4.0, 1.0, 6.0, 11.0, 10.0, 18.0, 25.0, 26.0, 58.0, 86.0, 115.0, 155.0, 213.0, 299.0, 416.0, 597.0, 880.0, 1261.0, 1818.0, 2744.0, 3820.0, 5753.0, 8471.0, 13077.0, 20064.0, 31085.0, 50284.0, 82303.0, 150297.0, 1344806.0, 150722.0, 84216.0, 51203.0, 32020.0, 20093.0, 13104.0, 8702.0, 5733.0, 3869.0, 2735.0, 1786.0, 1258.0, 930.0, 645.0, 401.0, 323.0, 203.0, 124.0, 102.0, 93.0, 57.0, 35.0, 26.0, 16.0, 17.0, 11.0, 4.0, 3.0, 4.0, 3.0, 1.0, 3.0], "bins": [-1.25390625, -1.214111328125, -1.17431640625, -1.134521484375, -1.0947265625, -1.054931640625, -1.01513671875, -0.975341796875, -0.935546875, -0.895751953125, -0.85595703125, -0.816162109375, -0.7763671875, -0.736572265625, -0.69677734375, -0.656982421875, -0.6171875, -0.577392578125, -0.53759765625, -0.497802734375, -0.4580078125, -0.418212890625, -0.37841796875, -0.338623046875, -0.298828125, -0.259033203125, -0.21923828125, -0.179443359375, -0.1396484375, -0.099853515625, -0.06005859375, -0.020263671875, 0.01953125, 0.059326171875, 0.09912109375, 0.138916015625, 0.1787109375, 0.218505859375, 0.25830078125, 0.298095703125, 0.337890625, 0.377685546875, 0.41748046875, 0.457275390625, 0.4970703125, 0.536865234375, 0.57666015625, 0.616455078125, 0.65625, 0.696044921875, 0.73583984375, 0.775634765625, 0.8154296875, 0.855224609375, 0.89501953125, 0.934814453125, 0.974609375, 1.014404296875, 1.05419921875, 1.093994140625, 1.1337890625, 1.173583984375, 1.21337890625, 1.253173828125, 1.29296875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 8.0, 4.0, 1.0, 7.0, 4.0, 9.0, 6.0, 10.0, 14.0, 13.0, 14.0, 16.0, 21.0, 20.0, 31.0, 37.0, 40.0, 49.0, 52.0, 67.0, 52.0, 61.0, 69.0, 52.0, 48.0, 48.0, 50.0, 30.0, 25.0, 27.0, 25.0, 19.0, 17.0, 6.0, 12.0, 10.0, 6.0, 7.0, 2.0, 4.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0006628036499023438, -0.0006432607769966125, -0.0006237179040908813, -0.0006041750311851501, -0.0005846321582794189, -0.0005650892853736877, -0.0005455464124679565, -0.0005260035395622253, -0.0005064606666564941, -0.00048691779375076294, -0.00046737492084503174, -0.00044783204793930054, -0.00042828917503356934, -0.00040874630212783813, -0.00038920342922210693, -0.00036966055631637573, -0.00035011768341064453, -0.00033057481050491333, -0.00031103193759918213, -0.00029148906469345093, -0.0002719461917877197, -0.0002524033188819885, -0.00023286044597625732, -0.00021331757307052612, -0.00019377470016479492, -0.00017423182725906372, -0.00015468895435333252, -0.00013514608144760132, -0.00011560320854187012, -9.606033563613892e-05, -7.651746273040771e-05, -5.6974589824676514e-05, -3.743171691894531e-05, -1.788884401321411e-05, 1.6540288925170898e-06, 2.119690179824829e-05, 4.073977470397949e-05, 6.028264760971069e-05, 7.98255205154419e-05, 9.93683934211731e-05, 0.0001189112663269043, 0.0001384541392326355, 0.0001579970121383667, 0.0001775398850440979, 0.0001970827579498291, 0.0002166256308555603, 0.0002361685037612915, 0.0002557113766670227, 0.0002752542495727539, 0.0002947971224784851, 0.0003143399953842163, 0.0003338828682899475, 0.0003534257411956787, 0.0003729686141014099, 0.0003925114870071411, 0.0004120543599128723, 0.0004315972328186035, 0.0004511401057243347, 0.0004706829786300659, 0.0004902258515357971, 0.0005097687244415283, 0.0005293115973472595, 0.0005488544702529907, 0.0005683973431587219, 0.0005879402160644531]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 6.0, 0.0, 4.0, 5.0, 5.0, 3.0, 3.0, 9.0, 13.0, 13.0, 20.0, 16.0, 27.0, 23.0, 29.0, 28.0, 44.0, 58.0, 109.0, 141.0, 270.0, 651.0, 12571.0, 1027545.0, 5747.0, 518.0, 221.0, 127.0, 77.0, 50.0, 37.0, 37.0, 22.0, 19.0, 17.0, 16.0, 11.0, 15.0, 10.0, 11.0, 4.0, 9.0, 4.0, 2.0, 2.0, 6.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0122833251953125, -0.011818647384643555, -0.01135396957397461, -0.010889291763305664, -0.010424613952636719, -0.009959936141967773, -0.009495258331298828, -0.009030580520629883, -0.008565902709960938, -0.008101224899291992, -0.007636547088623047, -0.0071718692779541016, -0.006707191467285156, -0.006242513656616211, -0.005777835845947266, -0.00531315803527832, -0.004848480224609375, -0.00438380241394043, -0.003919124603271484, -0.003454446792602539, -0.0029897689819335938, -0.0025250911712646484, -0.002060413360595703, -0.0015957355499267578, -0.0011310577392578125, -0.0006663799285888672, -0.00020170211791992188, 0.00026297569274902344, 0.0007276535034179688, 0.001192331314086914, 0.0016570091247558594, 0.0021216869354248047, 0.00258636474609375, 0.0030510425567626953, 0.0035157203674316406, 0.003980398178100586, 0.004445075988769531, 0.0049097537994384766, 0.005374431610107422, 0.005839109420776367, 0.0063037872314453125, 0.006768465042114258, 0.007233142852783203, 0.0076978206634521484, 0.008162498474121094, 0.008627176284790039, 0.009091854095458984, 0.00955653190612793, 0.010021209716796875, 0.01048588752746582, 0.010950565338134766, 0.011415243148803711, 0.011879920959472656, 0.012344598770141602, 0.012809276580810547, 0.013273954391479492, 0.013738632202148438, 0.014203310012817383, 0.014667987823486328, 0.015132665634155273, 0.015597343444824219, 0.016062021255493164, 0.01652669906616211, 0.016991376876831055, 0.0174560546875]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 10.0, 14.0, 41.0, 108.0, 180.0, 226.0, 185.0, 123.0, 76.0, 33.0, 12.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0011067636078223586, -0.001084487303160131, -0.0010622108820825815, -0.0010399345774203539, -0.0010176581563428044, -0.0009953818516805768, -0.0009731054306030273, -0.0009508291259407997, -0.0009285527630709112, -0.0009062764002010226, -0.0008840000373311341, -0.0008617236744612455, -0.000839447311591357, -0.0008171709487214684, -0.0007948946440592408, -0.0007726182811893523, -0.0007503419183194637, -0.0007280655554495752, -0.0007057891925796866, -0.0006835128297097981, -0.0006612364668399096, -0.0006389601621776819, -0.0006166837411001325, -0.0005944074364379048, -0.0005721310153603554, -0.0005498546524904668, -0.0005275782896205783, -0.0005053019267506897, -0.00048302559298463166, -0.0004607492301147431, -0.00043847286724485457, -0.0004161965334787965, -0.0003939201415050775, -0.00037164377863518894, -0.0003493674157653004, -0.0003270910819992423, -0.00030481471912935376, -0.0002825383562594652, -0.0002602619933895767, -0.00023798564507160336, -0.00021570928220171481, -0.00019343291933182627, -0.00017115657101385295, -0.0001488802081439644, -0.00012660384527407587, -0.00010432749695610255, -8.2051134086214e-05, -5.977478576824069e-05, -3.7498422898352146e-05, -1.5222065485431813e-05, 7.054291927488521e-06, 2.9330651159398258e-05, 5.160700675332919e-05, 7.388336234726012e-05, 9.615972521714866e-05, 0.00011843607353512198, 0.00014071243640501052, 0.00016298879927489907, 0.00018526514759287238, 0.00020754151046276093, 0.00022981787333264947, 0.000252094236202538, 0.00027437059907242656, 0.00029664693283848464, 0.0003189232957083732]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 7.0, 4.0, 13.0, 11.0, 16.0, 19.0, 11.0, 21.0, 20.0, 22.0, 17.0, 30.0, 32.0, 33.0, 20.0, 31.0, 28.0, 34.0, 40.0, 39.0, 37.0, 44.0, 38.0, 29.0, 33.0, 40.0, 39.0, 38.0, 33.0, 26.0, 26.0, 26.0, 18.0, 7.0, 15.0, 15.0, 17.0, 19.0, 11.0, 9.0, 13.0, 4.0, 2.0, 1.0, 3.0, 1.0, 6.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.00033724308013916016, -0.000327439047396183, -0.00031763501465320587, -0.00030783098191022873, -0.0002980269491672516, -0.00028822291642427444, -0.0002784188836812973, -0.00026861485093832016, -0.000258810818195343, -0.0002490067854523659, -0.00023920275270938873, -0.0002293987199664116, -0.00021959468722343445, -0.0002097906544804573, -0.00019998662173748016, -0.00019018258899450302, -0.00018037855625152588, -0.00017057452350854874, -0.0001607704907655716, -0.00015096645802259445, -0.0001411624252796173, -0.00013135839253664017, -0.00012155435979366302, -0.00011175032705068588, -0.00010194629430770874, -9.21422615647316e-05, -8.233822882175446e-05, -7.253419607877731e-05, -6.273016333580017e-05, -5.292613059282303e-05, -4.3122097849845886e-05, -3.3318065106868744e-05, -2.35140323638916e-05, -1.370999962091446e-05, -3.905966877937317e-06, 5.8980658650398254e-06, 1.5702098608016968e-05, 2.550613135099411e-05, 3.531016409397125e-05, 4.5114196836948395e-05, 5.491822957992554e-05, 6.472226232290268e-05, 7.452629506587982e-05, 8.433032780885696e-05, 9.41343605518341e-05, 0.00010393839329481125, 0.00011374242603778839, 0.00012354645878076553, 0.00013335049152374268, 0.00014315452426671982, 0.00015295855700969696, 0.0001627625897526741, 0.00017256662249565125, 0.0001823706552386284, 0.00019217468798160553, 0.00020197872072458267, 0.00021178275346755981, 0.00022158678621053696, 0.0002313908189535141, 0.00024119485169649124, 0.0002509988844394684, 0.0002608029171824455, 0.00027060694992542267, 0.0002804109826683998, 0.00029021501541137695]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 11.0, 6.0, 9.0, 10.0, 16.0, 10.0, 13.0, 25.0, 18.0, 28.0, 35.0, 41.0, 43.0, 35.0, 42.0, 43.0, 44.0, 45.0, 53.0, 46.0, 48.0, 36.0, 45.0, 49.0, 41.0, 29.0, 24.0, 23.0, 25.0, 17.0, 22.0, 16.0, 10.0, 12.0, 12.0, 7.0, 5.0, 8.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.125, -7.8662109375, -7.607421875, -7.3486328125, -7.08984375, -6.8310546875, -6.572265625, -6.3134765625, -6.0546875, -5.7958984375, -5.537109375, -5.2783203125, -5.01953125, -4.7607421875, -4.501953125, -4.2431640625, -3.984375, -3.7255859375, -3.466796875, -3.2080078125, -2.94921875, -2.6904296875, -2.431640625, -2.1728515625, -1.9140625, -1.6552734375, -1.396484375, -1.1376953125, -0.87890625, -0.6201171875, -0.361328125, -0.1025390625, 0.15625, 0.4150390625, 0.673828125, 0.9326171875, 1.19140625, 1.4501953125, 1.708984375, 1.9677734375, 2.2265625, 2.4853515625, 2.744140625, 3.0029296875, 3.26171875, 3.5205078125, 3.779296875, 4.0380859375, 4.296875, 4.5556640625, 4.814453125, 5.0732421875, 5.33203125, 5.5908203125, 5.849609375, 6.1083984375, 6.3671875, 6.6259765625, 6.884765625, 7.1435546875, 7.40234375, 7.6611328125, 7.919921875, 8.1787109375, 8.4375]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [5.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 6.0, 9.0, 11.0, 16.0, 14.0, 28.0, 27.0, 46.0, 63.0, 90.0, 126.0, 186.0, 240.0, 319.0, 532.0, 795.0, 1264.0, 2093.0, 3477.0, 5952.0, 10712.0, 20426.0, 44918.0, 116237.0, 331556.0, 312191.0, 109228.0, 43014.0, 19919.0, 10323.0, 5649.0, 3364.0, 2018.0, 1249.0, 779.0, 539.0, 324.0, 215.0, 167.0, 111.0, 81.0, 52.0, 50.0, 34.0, 32.0, 20.0, 16.0, 16.0, 5.0, 8.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-4.7734375, -4.628662109375, -4.48388671875, -4.339111328125, -4.1943359375, -4.049560546875, -3.90478515625, -3.760009765625, -3.615234375, -3.470458984375, -3.32568359375, -3.180908203125, -3.0361328125, -2.891357421875, -2.74658203125, -2.601806640625, -2.45703125, -2.312255859375, -2.16748046875, -2.022705078125, -1.8779296875, -1.733154296875, -1.58837890625, -1.443603515625, -1.298828125, -1.154052734375, -1.00927734375, -0.864501953125, -0.7197265625, -0.574951171875, -0.43017578125, -0.285400390625, -0.140625, 0.004150390625, 0.14892578125, 0.293701171875, 0.4384765625, 0.583251953125, 0.72802734375, 0.872802734375, 1.017578125, 1.162353515625, 1.30712890625, 1.451904296875, 1.5966796875, 1.741455078125, 1.88623046875, 2.031005859375, 2.17578125, 2.320556640625, 2.46533203125, 2.610107421875, 2.7548828125, 2.899658203125, 3.04443359375, 3.189208984375, 3.333984375, 3.478759765625, 3.62353515625, 3.768310546875, 3.9130859375, 4.057861328125, 4.20263671875, 4.347412109375, 4.4921875]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 10.0, 12.0, 13.0, 3.0, 8.0, 20.0, 22.0, 20.0, 26.0, 29.0, 38.0, 34.0, 54.0, 57.0, 48.0, 84.0, 189.0, 1730.0, 166.0, 57.0, 57.0, 54.0, 32.0, 41.0, 34.0, 31.0, 28.0, 24.0, 19.0, 13.0, 19.0, 16.0, 13.0, 11.0, 5.0, 6.0, 6.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0], "bins": [-27.4375, -26.66259765625, -25.8876953125, -25.11279296875, -24.337890625, -23.56298828125, -22.7880859375, -22.01318359375, -21.23828125, -20.46337890625, -19.6884765625, -18.91357421875, -18.138671875, -17.36376953125, -16.5888671875, -15.81396484375, -15.0390625, -14.26416015625, -13.4892578125, -12.71435546875, -11.939453125, -11.16455078125, -10.3896484375, -9.61474609375, -8.83984375, -8.06494140625, -7.2900390625, -6.51513671875, -5.740234375, -4.96533203125, -4.1904296875, -3.41552734375, -2.640625, -1.86572265625, -1.0908203125, -0.31591796875, 0.458984375, 1.23388671875, 2.0087890625, 2.78369140625, 3.55859375, 4.33349609375, 5.1083984375, 5.88330078125, 6.658203125, 7.43310546875, 8.2080078125, 8.98291015625, 9.7578125, 10.53271484375, 11.3076171875, 12.08251953125, 12.857421875, 13.63232421875, 14.4072265625, 15.18212890625, 15.95703125, 16.73193359375, 17.5068359375, 18.28173828125, 19.056640625, 19.83154296875, 20.6064453125, 21.38134765625, 22.15625]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 3.0, 5.0, 5.0, 13.0, 16.0, 16.0, 29.0, 39.0, 48.0, 83.0, 111.0, 147.0, 244.0, 302.0, 615.0, 4987.0, 3123248.0, 14006.0, 710.0, 368.0, 229.0, 153.0, 95.0, 57.0, 57.0, 28.0, 28.0, 17.0, 12.0, 6.0, 7.0, 6.0, 7.0, 2.0, 1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-68.125, -65.5634765625, -63.001953125, -60.4404296875, -57.87890625, -55.3173828125, -52.755859375, -50.1943359375, -47.6328125, -45.0712890625, -42.509765625, -39.9482421875, -37.38671875, -34.8251953125, -32.263671875, -29.7021484375, -27.140625, -24.5791015625, -22.017578125, -19.4560546875, -16.89453125, -14.3330078125, -11.771484375, -9.2099609375, -6.6484375, -4.0869140625, -1.525390625, 1.0361328125, 3.59765625, 6.1591796875, 8.720703125, 11.2822265625, 13.84375, 16.4052734375, 18.966796875, 21.5283203125, 24.08984375, 26.6513671875, 29.212890625, 31.7744140625, 34.3359375, 36.8974609375, 39.458984375, 42.0205078125, 44.58203125, 47.1435546875, 49.705078125, 52.2666015625, 54.828125, 57.3896484375, 59.951171875, 62.5126953125, 65.07421875, 67.6357421875, 70.197265625, 72.7587890625, 75.3203125, 77.8818359375, 80.443359375, 83.0048828125, 85.56640625, 88.1279296875, 90.689453125, 93.2509765625, 95.8125]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 79.0, 785.0, 147.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.65671920776367, -46.27248764038086, -40.88825607299805, -35.504024505615234, -30.119792938232422, -24.73556137084961, -19.351329803466797, -13.967098236083984, -8.582866668701172, -3.1986351013183594, 2.185596466064453, 7.569828033447266, 12.954059600830078, 18.33829116821289, 23.722522735595703, 29.106754302978516, 34.49098587036133, 39.87521743774414, 45.25944900512695, 50.643680572509766, 56.02791213989258, 61.41214370727539, 66.79637145996094, 72.18060302734375, 77.56483459472656, 82.94906616210938, 88.33329772949219, 93.717529296875, 99.10176086425781, 104.48599243164062, 109.87022399902344, 115.25445556640625, 120.63870239257812, 126.02293395996094, 131.40716552734375, 136.79139709472656, 142.17562866210938, 147.5598602294922, 152.944091796875, 158.3283233642578, 163.71255493164062, 169.09678649902344, 174.48101806640625, 179.86524963378906, 185.24948120117188, 190.6337127685547, 196.0179443359375, 201.4021759033203, 206.78640747070312, 212.17063903808594, 217.55487060546875, 222.93910217285156, 228.32333374023438, 233.7075653076172, 239.091796875, 244.4760284423828, 249.86026000976562, 255.24449157714844, 260.62872314453125, 266.012939453125, 271.3971862792969, 276.78143310546875, 282.1656494140625, 287.54986572265625, 292.9341125488281]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 6.0, 7.0, 10.0, 11.0, 9.0, 14.0, 19.0, 14.0, 30.0, 23.0, 19.0, 26.0, 33.0, 44.0, 36.0, 48.0, 47.0, 42.0, 39.0, 43.0, 39.0, 37.0, 43.0, 42.0, 40.0, 33.0, 35.0, 34.0, 18.0, 18.0, 25.0, 25.0, 15.0, 11.0, 9.0, 7.0, 10.0, 10.0, 5.0, 7.0, 4.0, 2.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-64.66000366210938, -62.72977828979492, -60.799556732177734, -58.86933135986328, -56.939109802246094, -55.00888442993164, -53.07866287231445, -51.1484375, -49.21821594238281, -47.28799057006836, -45.35776901245117, -43.42754364013672, -41.49732208251953, -39.56709671020508, -37.63687515258789, -35.70664978027344, -33.77642822265625, -31.84620475769043, -29.91598129272461, -27.98575782775879, -26.05553436279297, -24.125308990478516, -22.195087432861328, -20.264862060546875, -18.334636688232422, -16.4044132232666, -14.474189758300781, -12.543966293334961, -10.61374282836914, -8.683518409729004, -6.753294944763184, -4.823071479797363, -2.8928489685058594, -0.9626253843307495, 0.9675981998443604, 2.8978219032287598, 4.82804536819458, 6.758269309997559, 8.688492774963379, 10.6187162399292, 12.54893970489502, 14.47916316986084, 16.409387588500977, 18.339611053466797, 20.269834518432617, 22.200057983398438, 24.130281448364258, 26.060504913330078, 27.9907283782959, 29.92095184326172, 31.85117530822754, 33.78139877319336, 35.71162414550781, 37.641845703125, 39.57207107543945, 41.50229263305664, 43.432518005371094, 45.36274337768555, 47.292964935302734, 49.22319030761719, 51.153411865234375, 53.08363723754883, 55.013858795166016, 56.94408416748047, 58.874305725097656]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 9.0, 2.0, 6.0, 11.0, 9.0, 12.0, 8.0, 19.0, 21.0, 23.0, 21.0, 44.0, 32.0, 35.0, 35.0, 42.0, 45.0, 35.0, 52.0, 36.0, 48.0, 49.0, 49.0, 51.0, 40.0, 36.0, 40.0, 23.0, 14.0, 29.0, 23.0, 23.0, 18.0, 9.0, 17.0, 11.0, 5.0, 7.0, 8.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.6875, -8.422119140625, -8.15673828125, -7.891357421875, -7.6259765625, -7.360595703125, -7.09521484375, -6.829833984375, -6.564453125, -6.299072265625, -6.03369140625, -5.768310546875, -5.5029296875, -5.237548828125, -4.97216796875, -4.706787109375, -4.44140625, -4.176025390625, -3.91064453125, -3.645263671875, -3.3798828125, -3.114501953125, -2.84912109375, -2.583740234375, -2.318359375, -2.052978515625, -1.78759765625, -1.522216796875, -1.2568359375, -0.991455078125, -0.72607421875, -0.460693359375, -0.1953125, 0.070068359375, 0.33544921875, 0.600830078125, 0.8662109375, 1.131591796875, 1.39697265625, 1.662353515625, 1.927734375, 2.193115234375, 2.45849609375, 2.723876953125, 2.9892578125, 3.254638671875, 3.52001953125, 3.785400390625, 4.05078125, 4.316162109375, 4.58154296875, 4.846923828125, 5.1123046875, 5.377685546875, 5.64306640625, 5.908447265625, 6.173828125, 6.439208984375, 6.70458984375, 6.969970703125, 7.2353515625, 7.500732421875, 7.76611328125, 8.031494140625, 8.296875]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 7.0, 7.0, 6.0, 6.0, 16.0, 12.0, 11.0, 17.0, 27.0, 29.0, 38.0, 56.0, 65.0, 116.0, 237.0, 447.0, 1384.0, 7661.0, 154630.0, 2725110.0, 1258279.0, 41145.0, 3354.0, 787.0, 345.0, 134.0, 74.0, 70.0, 42.0, 29.0, 27.0, 26.0, 19.0, 8.0, 10.0, 17.0, 11.0, 7.0, 3.0, 3.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-23.09375, -22.43017578125, -21.7666015625, -21.10302734375, -20.439453125, -19.77587890625, -19.1123046875, -18.44873046875, -17.78515625, -17.12158203125, -16.4580078125, -15.79443359375, -15.130859375, -14.46728515625, -13.8037109375, -13.14013671875, -12.4765625, -11.81298828125, -11.1494140625, -10.48583984375, -9.822265625, -9.15869140625, -8.4951171875, -7.83154296875, -7.16796875, -6.50439453125, -5.8408203125, -5.17724609375, -4.513671875, -3.85009765625, -3.1865234375, -2.52294921875, -1.859375, -1.19580078125, -0.5322265625, 0.13134765625, 0.794921875, 1.45849609375, 2.1220703125, 2.78564453125, 3.44921875, 4.11279296875, 4.7763671875, 5.43994140625, 6.103515625, 6.76708984375, 7.4306640625, 8.09423828125, 8.7578125, 9.42138671875, 10.0849609375, 10.74853515625, 11.412109375, 12.07568359375, 12.7392578125, 13.40283203125, 14.06640625, 14.72998046875, 15.3935546875, 16.05712890625, 16.720703125, 17.38427734375, 18.0478515625, 18.71142578125, 19.375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 2.0, 3.0, 9.0, 8.0, 11.0, 18.0, 43.0, 46.0, 58.0, 73.0, 101.0, 152.0, 199.0, 274.0, 392.0, 472.0, 515.0, 439.0, 353.0, 233.0, 178.0, 123.0, 103.0, 69.0, 52.0, 41.0, 20.0, 22.0, 22.0, 19.0, 4.0, 5.0, 8.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.703125, -17.2291259765625, -16.755126953125, -16.2811279296875, -15.80712890625, -15.3331298828125, -14.859130859375, -14.3851318359375, -13.9111328125, -13.4371337890625, -12.963134765625, -12.4891357421875, -12.01513671875, -11.5411376953125, -11.067138671875, -10.5931396484375, -10.119140625, -9.6451416015625, -9.171142578125, -8.6971435546875, -8.22314453125, -7.7491455078125, -7.275146484375, -6.8011474609375, -6.3271484375, -5.8531494140625, -5.379150390625, -4.9051513671875, -4.43115234375, -3.9571533203125, -3.483154296875, -3.0091552734375, -2.53515625, -2.0611572265625, -1.587158203125, -1.1131591796875, -0.63916015625, -0.1651611328125, 0.308837890625, 0.7828369140625, 1.2568359375, 1.7308349609375, 2.204833984375, 2.6788330078125, 3.15283203125, 3.6268310546875, 4.100830078125, 4.5748291015625, 5.048828125, 5.5228271484375, 5.996826171875, 6.4708251953125, 6.94482421875, 7.4188232421875, 7.892822265625, 8.3668212890625, 8.8408203125, 9.3148193359375, 9.788818359375, 10.2628173828125, 10.73681640625, 11.2108154296875, 11.684814453125, 12.1588134765625, 12.6328125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 7.0, 5.0, 6.0, 12.0, 6.0, 13.0, 16.0, 23.0, 42.0, 38.0, 46.0, 52.0, 82.0, 104.0, 131.0, 129.0, 225.0, 339.0, 672.0, 2800.0, 2144754.0, 2040166.0, 2633.0, 674.0, 385.0, 223.0, 145.0, 136.0, 96.0, 69.0, 60.0, 48.0, 25.0, 23.0, 24.0, 11.0, 15.0, 17.0, 6.0, 10.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-64.875, -62.6376953125, -60.400390625, -58.1630859375, -55.92578125, -53.6884765625, -51.451171875, -49.2138671875, -46.9765625, -44.7392578125, -42.501953125, -40.2646484375, -38.02734375, -35.7900390625, -33.552734375, -31.3154296875, -29.078125, -26.8408203125, -24.603515625, -22.3662109375, -20.12890625, -17.8916015625, -15.654296875, -13.4169921875, -11.1796875, -8.9423828125, -6.705078125, -4.4677734375, -2.23046875, 0.0068359375, 2.244140625, 4.4814453125, 6.71875, 8.9560546875, 11.193359375, 13.4306640625, 15.66796875, 17.9052734375, 20.142578125, 22.3798828125, 24.6171875, 26.8544921875, 29.091796875, 31.3291015625, 33.56640625, 35.8037109375, 38.041015625, 40.2783203125, 42.515625, 44.7529296875, 46.990234375, 49.2275390625, 51.46484375, 53.7021484375, 55.939453125, 58.1767578125, 60.4140625, 62.6513671875, 64.888671875, 67.1259765625, 69.36328125, 71.6005859375, 73.837890625, 76.0751953125, 78.3125]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 6.0, 9.0, 11.0, 33.0, 38.0, 50.0, 81.0, 106.0, 106.0, 119.0, 125.0, 95.0, 72.0, 54.0, 45.0, 26.0, 13.0, 8.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-57.238162994384766, -55.61727523803711, -53.99638748168945, -52.3754997253418, -50.75461196899414, -49.133724212646484, -47.512840270996094, -45.89195251464844, -44.27106475830078, -42.650177001953125, -41.02928924560547, -39.40840148925781, -37.787513732910156, -36.1666259765625, -34.545738220214844, -32.92485046386719, -31.30396270751953, -29.683074951171875, -28.06218719482422, -26.441299438476562, -24.820411682128906, -23.19952392578125, -21.578638076782227, -19.95775032043457, -18.336862564086914, -16.715974807739258, -15.095087051391602, -13.474200248718262, -11.853312492370605, -10.23242473602295, -8.61153793334961, -6.990650177001953, -5.369758605957031, -3.748871088027954, -2.127983570098877, -0.5070962905883789, 1.1137914657592773, 2.7346792221069336, 4.355566024780273, 5.97645378112793, 7.597341537475586, 9.218229293823242, 10.839117050170898, 12.460003852844238, 14.080891609191895, 15.70177936553955, 17.32266616821289, 18.943553924560547, 20.564441680908203, 22.18532943725586, 23.806217193603516, 25.427104949951172, 27.047992706298828, 28.668880462646484, 30.289766311645508, 31.910654067993164, 33.53153991699219, 35.152427673339844, 36.7733154296875, 38.394203186035156, 40.01509094238281, 41.63597869873047, 43.256866455078125, 44.87775421142578, 46.49864196777344]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 3.0, 4.0, 3.0, 3.0, 3.0, 6.0, 8.0, 5.0, 6.0, 13.0, 9.0, 18.0, 14.0, 22.0, 30.0, 27.0, 22.0, 35.0, 38.0, 39.0, 31.0, 44.0, 40.0, 39.0, 37.0, 46.0, 41.0, 27.0, 39.0, 34.0, 40.0, 41.0, 30.0, 21.0, 21.0, 22.0, 19.0, 19.0, 11.0, 17.0, 8.0, 14.0, 13.0, 12.0, 12.0, 7.0, 6.0, 3.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-43.578758239746094, -42.21896743774414, -40.85917663574219, -39.4993896484375, -38.13959884643555, -36.779808044433594, -35.42001724243164, -34.06022644042969, -32.700435638427734, -31.34064483642578, -29.98085594177246, -28.621065139770508, -27.261274337768555, -25.901485443115234, -24.54169464111328, -23.181903839111328, -21.822114944458008, -20.462324142456055, -19.102535247802734, -17.74274444580078, -16.382953643798828, -15.023163795471191, -13.663373947143555, -12.303583145141602, -10.943793296813965, -9.584003448486328, -8.224212646484375, -6.864422798156738, -5.504632472991943, -4.144842147827148, -2.7850522994995117, -1.4252614974975586, -0.06547164916992188, 1.2943185567855835, 2.654108762741089, 4.013898849487305, 5.3736891746521, 6.7334794998168945, 8.093269348144531, 9.453060150146484, 10.812849998474121, 12.172639846801758, 13.532430648803711, 14.892220497131348, 16.252010345458984, 17.611801147460938, 18.97159194946289, 20.331382751464844, 21.691171646118164, 23.050962448120117, 24.410751342773438, 25.77054214477539, 27.130332946777344, 28.490123748779297, 29.849912643432617, 31.20970344543457, 32.56949234008789, 33.929283142089844, 35.2890739440918, 36.64886474609375, 38.00865173339844, 39.36844253540039, 40.728233337402344, 42.0880241394043, 43.44781494140625]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 5.0, 10.0, 15.0, 11.0, 8.0, 18.0, 27.0, 18.0, 24.0, 30.0, 38.0, 45.0, 40.0, 37.0, 40.0, 51.0, 44.0, 35.0, 58.0, 57.0, 52.0, 42.0, 44.0, 42.0, 31.0, 28.0, 16.0, 29.0, 19.0, 19.0, 16.0, 9.0, 9.0, 11.0, 7.0, 9.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.8359375, -8.5650634765625, -8.294189453125, -8.0233154296875, -7.75244140625, -7.4815673828125, -7.210693359375, -6.9398193359375, -6.6689453125, -6.3980712890625, -6.127197265625, -5.8563232421875, -5.58544921875, -5.3145751953125, -5.043701171875, -4.7728271484375, -4.501953125, -4.2310791015625, -3.960205078125, -3.6893310546875, -3.41845703125, -3.1475830078125, -2.876708984375, -2.6058349609375, -2.3349609375, -2.0640869140625, -1.793212890625, -1.5223388671875, -1.25146484375, -0.9805908203125, -0.709716796875, -0.4388427734375, -0.16796875, 0.1029052734375, 0.373779296875, 0.6446533203125, 0.91552734375, 1.1864013671875, 1.457275390625, 1.7281494140625, 1.9990234375, 2.2698974609375, 2.540771484375, 2.8116455078125, 3.08251953125, 3.3533935546875, 3.624267578125, 3.8951416015625, 4.166015625, 4.4368896484375, 4.707763671875, 4.9786376953125, 5.24951171875, 5.5203857421875, 5.791259765625, 6.0621337890625, 6.3330078125, 6.6038818359375, 6.874755859375, 7.1456298828125, 7.41650390625, 7.6873779296875, 7.958251953125, 8.2291259765625, 8.5]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 6.0, 8.0, 20.0, 17.0, 26.0, 49.0, 65.0, 107.0, 160.0, 245.0, 361.0, 621.0, 958.0, 1620.0, 2662.0, 4400.0, 7172.0, 12232.0, 20080.0, 35162.0, 64232.0, 135829.0, 383794.0, 193779.0, 81091.0, 42782.0, 24342.0, 14679.0, 8730.0, 5179.0, 3091.0, 1929.0, 1151.0, 704.0, 445.0, 296.0, 159.0, 130.0, 77.0, 46.0, 40.0, 34.0, 15.0, 11.0, 6.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.916015625, -1.8573760986328125, -1.798736572265625, -1.7400970458984375, -1.68145751953125, -1.6228179931640625, -1.564178466796875, -1.5055389404296875, -1.4468994140625, -1.3882598876953125, -1.329620361328125, -1.2709808349609375, -1.21234130859375, -1.1537017822265625, -1.095062255859375, -1.0364227294921875, -0.977783203125, -0.9191436767578125, -0.860504150390625, -0.8018646240234375, -0.74322509765625, -0.6845855712890625, -0.625946044921875, -0.5673065185546875, -0.5086669921875, -0.4500274658203125, -0.391387939453125, -0.3327484130859375, -0.27410888671875, -0.2154693603515625, -0.156829833984375, -0.0981903076171875, -0.03955078125, 0.0190887451171875, 0.077728271484375, 0.1363677978515625, 0.19500732421875, 0.2536468505859375, 0.312286376953125, 0.3709259033203125, 0.4295654296875, 0.4882049560546875, 0.546844482421875, 0.6054840087890625, 0.66412353515625, 0.7227630615234375, 0.781402587890625, 0.8400421142578125, 0.898681640625, 0.9573211669921875, 1.015960693359375, 1.0746002197265625, 1.13323974609375, 1.1918792724609375, 1.250518798828125, 1.3091583251953125, 1.3677978515625, 1.4264373779296875, 1.485076904296875, 1.5437164306640625, 1.60235595703125, 1.6609954833984375, 1.719635009765625, 1.7782745361328125, 1.8369140625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 9.0, 10.0, 7.0, 5.0, 10.0, 8.0, 18.0, 16.0, 18.0, 15.0, 22.0, 23.0, 24.0, 41.0, 29.0, 31.0, 37.0, 44.0, 27.0, 41.0, 38.0, 1074.0, 35.0, 44.0, 37.0, 26.0, 23.0, 43.0, 23.0, 29.0, 32.0, 23.0, 26.0, 24.0, 14.0, 17.0, 18.0, 9.0, 14.0, 6.0, 7.0, 9.0, 3.0, 5.0, 2.0, 2.0, 3.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.66796875, -4.52154541015625, -4.3751220703125, -4.22869873046875, -4.082275390625, -3.93585205078125, -3.7894287109375, -3.64300537109375, -3.49658203125, -3.35015869140625, -3.2037353515625, -3.05731201171875, -2.910888671875, -2.76446533203125, -2.6180419921875, -2.47161865234375, -2.3251953125, -2.17877197265625, -2.0323486328125, -1.88592529296875, -1.739501953125, -1.59307861328125, -1.4466552734375, -1.30023193359375, -1.15380859375, -1.00738525390625, -0.8609619140625, -0.71453857421875, -0.568115234375, -0.42169189453125, -0.2752685546875, -0.12884521484375, 0.017578125, 0.16400146484375, 0.3104248046875, 0.45684814453125, 0.603271484375, 0.74969482421875, 0.8961181640625, 1.04254150390625, 1.18896484375, 1.33538818359375, 1.4818115234375, 1.62823486328125, 1.774658203125, 1.92108154296875, 2.0675048828125, 2.21392822265625, 2.3603515625, 2.50677490234375, 2.6531982421875, 2.79962158203125, 2.946044921875, 3.09246826171875, 3.2388916015625, 3.38531494140625, 3.53173828125, 3.67816162109375, 3.8245849609375, 3.97100830078125, 4.117431640625, 4.26385498046875, 4.4102783203125, 4.55670166015625, 4.703125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 1.0, 5.0, 3.0, 6.0, 7.0, 15.0, 24.0, 31.0, 29.0, 58.0, 100.0, 123.0, 154.0, 244.0, 321.0, 439.0, 618.0, 893.0, 1284.0, 1794.0, 2583.0, 3627.0, 5188.0, 7752.0, 11107.0, 16912.0, 25542.0, 39388.0, 61909.0, 101858.0, 224092.0, 1294679.0, 108215.0, 64989.0, 41074.0, 26782.0, 17389.0, 11700.0, 7903.0, 5570.0, 3720.0, 2732.0, 1799.0, 1345.0, 920.0, 648.0, 444.0, 360.0, 205.0, 143.0, 127.0, 86.0, 67.0, 32.0, 27.0, 26.0, 26.0, 10.0, 6.0, 6.0, 3.0, 1.0, 7.0], "bins": [-1.3125, -1.27154541015625, -1.2305908203125, -1.18963623046875, -1.148681640625, -1.10772705078125, -1.0667724609375, -1.02581787109375, -0.98486328125, -0.94390869140625, -0.9029541015625, -0.86199951171875, -0.821044921875, -0.78009033203125, -0.7391357421875, -0.69818115234375, -0.6572265625, -0.61627197265625, -0.5753173828125, -0.53436279296875, -0.493408203125, -0.45245361328125, -0.4114990234375, -0.37054443359375, -0.32958984375, -0.28863525390625, -0.2476806640625, -0.20672607421875, -0.165771484375, -0.12481689453125, -0.0838623046875, -0.04290771484375, -0.001953125, 0.03900146484375, 0.0799560546875, 0.12091064453125, 0.161865234375, 0.20281982421875, 0.2437744140625, 0.28472900390625, 0.32568359375, 0.36663818359375, 0.4075927734375, 0.44854736328125, 0.489501953125, 0.53045654296875, 0.5714111328125, 0.61236572265625, 0.6533203125, 0.69427490234375, 0.7352294921875, 0.77618408203125, 0.817138671875, 0.85809326171875, 0.8990478515625, 0.94000244140625, 0.98095703125, 1.02191162109375, 1.0628662109375, 1.10382080078125, 1.144775390625, 1.18572998046875, 1.2266845703125, 1.26763916015625, 1.30859375]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 5.0, 10.0, 9.0, 5.0, 11.0, 18.0, 13.0, 13.0, 19.0, 28.0, 27.0, 37.0, 49.0, 72.0, 68.0, 66.0, 85.0, 77.0, 69.0, 69.0, 45.0, 39.0, 39.0, 18.0, 24.0, 20.0, 13.0, 6.0, 11.0, 11.0, 3.0, 8.0, 5.0, 5.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007829666137695312, -0.0007588788866996765, -0.0007347911596298218, -0.000710703432559967, -0.0006866157054901123, -0.0006625279784202576, -0.0006384402513504028, -0.0006143525242805481, -0.0005902647972106934, -0.0005661770701408386, -0.0005420893430709839, -0.0005180016160011292, -0.0004939138889312744, -0.0004698261618614197, -0.00044573843479156494, -0.0004216507077217102, -0.00039756298065185547, -0.00037347525358200073, -0.000349387526512146, -0.00032529979944229126, -0.0003012120723724365, -0.0002771243453025818, -0.00025303661823272705, -0.00022894889116287231, -0.00020486116409301758, -0.00018077343702316284, -0.0001566857099533081, -0.00013259798288345337, -0.00010851025581359863, -8.44225287437439e-05, -6.033480167388916e-05, -3.6247074604034424e-05, -1.2159347534179688e-05, 1.1928379535675049e-05, 3.6016106605529785e-05, 6.010383367538452e-05, 8.419156074523926e-05, 0.000108279287815094, 0.00013236701488494873, 0.00015645474195480347, 0.0001805424690246582, 0.00020463019609451294, 0.00022871792316436768, 0.0002528056502342224, 0.00027689337730407715, 0.0003009811043739319, 0.0003250688314437866, 0.00034915655851364136, 0.0003732442855834961, 0.00039733201265335083, 0.00042141973972320557, 0.0004455074667930603, 0.00046959519386291504, 0.0004936829209327698, 0.0005177706480026245, 0.0005418583750724792, 0.000565946102142334, 0.0005900338292121887, 0.0006141215562820435, 0.0006382092833518982, 0.0006622970104217529, 0.0006863847374916077, 0.0007104724645614624, 0.0007345601916313171, 0.0007586479187011719]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 2.0, 2.0, 3.0, 3.0, 7.0, 6.0, 8.0, 14.0, 10.0, 14.0, 22.0, 29.0, 34.0, 37.0, 68.0, 108.0, 206.0, 410.0, 2206.0, 1003373.0, 40537.0, 742.0, 260.0, 122.0, 88.0, 50.0, 42.0, 37.0, 14.0, 21.0, 15.0, 14.0, 12.0, 7.0, 6.0, 1.0, 4.0, 4.0, 7.0, 1.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.0197296142578125, -0.019177675247192383, -0.018625736236572266, -0.01807379722595215, -0.01752185821533203, -0.016969919204711914, -0.016417980194091797, -0.01586604118347168, -0.015314102172851562, -0.014762163162231445, -0.014210224151611328, -0.013658285140991211, -0.013106346130371094, -0.012554407119750977, -0.01200246810913086, -0.011450529098510742, -0.010898590087890625, -0.010346651077270508, -0.00979471206665039, -0.009242773056030273, -0.008690834045410156, -0.008138895034790039, -0.007586956024169922, -0.007035017013549805, -0.0064830780029296875, -0.00593113899230957, -0.005379199981689453, -0.004827260971069336, -0.004275321960449219, -0.0037233829498291016, -0.0031714439392089844, -0.002619504928588867, -0.00206756591796875, -0.0015156269073486328, -0.0009636878967285156, -0.00041174888610839844, 0.00014019012451171875, 0.0006921291351318359, 0.0012440681457519531, 0.0017960071563720703, 0.0023479461669921875, 0.0028998851776123047, 0.003451824188232422, 0.004003763198852539, 0.004555702209472656, 0.0051076412200927734, 0.005659580230712891, 0.006211519241333008, 0.006763458251953125, 0.007315397262573242, 0.00786733627319336, 0.008419275283813477, 0.008971214294433594, 0.009523153305053711, 0.010075092315673828, 0.010627031326293945, 0.011178970336914062, 0.01173090934753418, 0.012282848358154297, 0.012834787368774414, 0.013386726379394531, 0.013938665390014648, 0.014490604400634766, 0.015042543411254883, 0.015594482421875]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 31.0, 260.0, 529.0, 178.0, 13.0, 4.0, 1.0, 1.0], "bins": [-0.003917249385267496, -0.003850169014185667, -0.0037830884102731943, -0.0037160080391913652, -0.003648927668109536, -0.0035818470641970634, -0.0035147666931152344, -0.0034476863220334053, -0.0033806059509515762, -0.003313525579869747, -0.0032464449759572744, -0.0031793646048754454, -0.0031122842337936163, -0.0030452036298811436, -0.0029781232587993145, -0.0029110428877174854, -0.0028439622838050127, -0.0027768819127231836, -0.002709801308810711, -0.002642720937728882, -0.0025756405666470528, -0.0025085601955652237, -0.002441479591652751, -0.002374399220570922, -0.002307318616658449, -0.00224023824557662, -0.0021731576416641474, -0.0021060772705823183, -0.0020389968995004892, -0.0019719162955880165, -0.0019048359245061874, -0.0018377555534243584, -0.0017706752987578511, -0.0017035948112607002, -0.0016365144401788712, -0.0015694339526817203, -0.0015023534651845694, -0.0014352730941027403, -0.0013681926066055894, -0.0013011121191084385, -0.0012340317480266094, -0.0011669512605294585, -0.0010998708894476295, -0.0010327904019504786, -0.0009657099726609886, -0.0008986295433714986, -0.0008315490558743477, -0.0007644686265848577, -0.0006973881972953677, -0.0006303077680058777, -0.0005632273387163877, -0.0004961468512192369, -0.00042906642192974687, -0.0003619859926402569, -0.00029490553424693644, -0.000227825075853616, -0.00016074461746029556, -9.366417361889035e-05, -2.6583729777485132e-05, 4.049671406392008e-05, 0.0001075771579053253, 0.00017465758719481528, 0.00024173804558813572, 0.00030881850398145616, 0.00037589893327094615]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 2.0, 6.0, 5.0, 8.0, 12.0, 12.0, 17.0, 14.0, 15.0, 23.0, 19.0, 20.0, 27.0, 27.0, 24.0, 32.0, 44.0, 42.0, 43.0, 45.0, 42.0, 37.0, 47.0, 43.0, 37.0, 53.0, 34.0, 35.0, 30.0, 39.0, 25.0, 35.0, 17.0, 15.0, 12.0, 18.0, 15.0, 5.0, 8.0, 7.0, 4.0, 1.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00041115283966064453, -0.0003994312137365341, -0.0003877095878124237, -0.0003759879618883133, -0.0003642663359642029, -0.00035254471004009247, -0.00034082308411598206, -0.00032910145819187164, -0.00031737983226776123, -0.0003056582063436508, -0.0002939365804195404, -0.00028221495449543, -0.0002704933285713196, -0.00025877170264720917, -0.00024705007672309875, -0.00023532845079898834, -0.00022360682487487793, -0.00021188519895076752, -0.0002001635730266571, -0.0001884419471025467, -0.00017672032117843628, -0.00016499869525432587, -0.00015327706933021545, -0.00014155544340610504, -0.00012983381748199463, -0.00011811219155788422, -0.0001063905656337738, -9.466893970966339e-05, -8.294731378555298e-05, -7.122568786144257e-05, -5.950406193733215e-05, -4.778243601322174e-05, -3.606081008911133e-05, -2.4339184165000916e-05, -1.2617558240890503e-05, -8.959323167800903e-07, 1.0825693607330322e-05, 2.2547319531440735e-05, 3.426894545555115e-05, 4.599057137966156e-05, 5.771219730377197e-05, 6.943382322788239e-05, 8.11554491519928e-05, 9.287707507610321e-05, 0.00010459870100021362, 0.00011632032692432404, 0.00012804195284843445, 0.00013976357877254486, 0.00015148520469665527, 0.00016320683062076569, 0.0001749284565448761, 0.0001866500824689865, 0.00019837170839309692, 0.00021009333431720734, 0.00022181496024131775, 0.00023353658616542816, 0.0002452582120895386, 0.000256979838013649, 0.0002687014639377594, 0.0002804230898618698, 0.0002921447157859802, 0.00030386634171009064, 0.00031558796763420105, 0.00032730959355831146, 0.0003390312194824219]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 5.0, 10.0, 15.0, 11.0, 8.0, 18.0, 27.0, 18.0, 24.0, 30.0, 38.0, 45.0, 40.0, 37.0, 40.0, 51.0, 44.0, 35.0, 58.0, 57.0, 52.0, 42.0, 44.0, 42.0, 31.0, 28.0, 16.0, 29.0, 19.0, 19.0, 16.0, 9.0, 9.0, 11.0, 7.0, 9.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.8359375, -8.5650634765625, -8.294189453125, -8.0233154296875, -7.75244140625, -7.4815673828125, -7.210693359375, -6.9398193359375, -6.6689453125, -6.3980712890625, -6.127197265625, -5.8563232421875, -5.58544921875, -5.3145751953125, -5.043701171875, -4.7728271484375, -4.501953125, -4.2310791015625, -3.960205078125, -3.6893310546875, -3.41845703125, -3.1475830078125, -2.876708984375, -2.6058349609375, -2.3349609375, -2.0640869140625, -1.793212890625, -1.5223388671875, -1.25146484375, -0.9805908203125, -0.709716796875, -0.4388427734375, -0.16796875, 0.1029052734375, 0.373779296875, 0.6446533203125, 0.91552734375, 1.1864013671875, 1.457275390625, 1.7281494140625, 1.9990234375, 2.2698974609375, 2.540771484375, 2.8116455078125, 3.08251953125, 3.3533935546875, 3.624267578125, 3.8951416015625, 4.166015625, 4.4368896484375, 4.707763671875, 4.9786376953125, 5.24951171875, 5.5203857421875, 5.791259765625, 6.0621337890625, 6.3330078125, 6.6038818359375, 6.874755859375, 7.1456298828125, 7.41650390625, 7.6873779296875, 7.958251953125, 8.2291259765625, 8.5]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 6.0, 6.0, 12.0, 18.0, 17.0, 18.0, 24.0, 50.0, 48.0, 81.0, 167.0, 273.0, 502.0, 1041.0, 2496.0, 6607.0, 23129.0, 123822.0, 655515.0, 188576.0, 32002.0, 8484.0, 2992.0, 1280.0, 590.0, 323.0, 157.0, 82.0, 65.0, 44.0, 36.0, 26.0, 18.0, 11.0, 14.0, 6.0, 10.0, 8.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.5703125, -8.3074951171875, -8.044677734375, -7.7818603515625, -7.51904296875, -7.2562255859375, -6.993408203125, -6.7305908203125, -6.4677734375, -6.2049560546875, -5.942138671875, -5.6793212890625, -5.41650390625, -5.1536865234375, -4.890869140625, -4.6280517578125, -4.365234375, -4.1024169921875, -3.839599609375, -3.5767822265625, -3.31396484375, -3.0511474609375, -2.788330078125, -2.5255126953125, -2.2626953125, -1.9998779296875, -1.737060546875, -1.4742431640625, -1.21142578125, -0.9486083984375, -0.685791015625, -0.4229736328125, -0.16015625, 0.1026611328125, 0.365478515625, 0.6282958984375, 0.89111328125, 1.1539306640625, 1.416748046875, 1.6795654296875, 1.9423828125, 2.2052001953125, 2.468017578125, 2.7308349609375, 2.99365234375, 3.2564697265625, 3.519287109375, 3.7821044921875, 4.044921875, 4.3077392578125, 4.570556640625, 4.8333740234375, 5.09619140625, 5.3590087890625, 5.621826171875, 5.8846435546875, 6.1474609375, 6.4102783203125, 6.673095703125, 6.9359130859375, 7.19873046875, 7.4615478515625, 7.724365234375, 7.9871826171875, 8.25]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 4.0, 5.0, 3.0, 7.0, 12.0, 11.0, 15.0, 18.0, 23.0, 21.0, 27.0, 32.0, 40.0, 32.0, 48.0, 55.0, 58.0, 66.0, 328.0, 1689.0, 118.0, 59.0, 37.0, 49.0, 47.0, 40.0, 32.0, 33.0, 27.0, 26.0, 15.0, 12.0, 11.0, 11.0, 12.0, 9.0, 6.0, 4.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-28.984375, -28.13525390625, -27.2861328125, -26.43701171875, -25.587890625, -24.73876953125, -23.8896484375, -23.04052734375, -22.19140625, -21.34228515625, -20.4931640625, -19.64404296875, -18.794921875, -17.94580078125, -17.0966796875, -16.24755859375, -15.3984375, -14.54931640625, -13.7001953125, -12.85107421875, -12.001953125, -11.15283203125, -10.3037109375, -9.45458984375, -8.60546875, -7.75634765625, -6.9072265625, -6.05810546875, -5.208984375, -4.35986328125, -3.5107421875, -2.66162109375, -1.8125, -0.96337890625, -0.1142578125, 0.73486328125, 1.583984375, 2.43310546875, 3.2822265625, 4.13134765625, 4.98046875, 5.82958984375, 6.6787109375, 7.52783203125, 8.376953125, 9.22607421875, 10.0751953125, 10.92431640625, 11.7734375, 12.62255859375, 13.4716796875, 14.32080078125, 15.169921875, 16.01904296875, 16.8681640625, 17.71728515625, 18.56640625, 19.41552734375, 20.2646484375, 21.11376953125, 21.962890625, 22.81201171875, 23.6611328125, 24.51025390625, 25.359375]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 6.0, 6.0, 9.0, 16.0, 17.0, 25.0, 17.0, 32.0, 43.0, 55.0, 81.0, 112.0, 165.0, 234.0, 337.0, 765.0, 7925.0, 3124151.0, 9719.0, 849.0, 369.0, 232.0, 149.0, 109.0, 69.0, 39.0, 53.0, 26.0, 21.0, 20.0, 15.0, 7.0, 7.0, 8.0, 8.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-73.75, -71.61376953125, -69.4775390625, -67.34130859375, -65.205078125, -63.06884765625, -60.9326171875, -58.79638671875, -56.66015625, -54.52392578125, -52.3876953125, -50.25146484375, -48.115234375, -45.97900390625, -43.8427734375, -41.70654296875, -39.5703125, -37.43408203125, -35.2978515625, -33.16162109375, -31.025390625, -28.88916015625, -26.7529296875, -24.61669921875, -22.48046875, -20.34423828125, -18.2080078125, -16.07177734375, -13.935546875, -11.79931640625, -9.6630859375, -7.52685546875, -5.390625, -3.25439453125, -1.1181640625, 1.01806640625, 3.154296875, 5.29052734375, 7.4267578125, 9.56298828125, 11.69921875, 13.83544921875, 15.9716796875, 18.10791015625, 20.244140625, 22.38037109375, 24.5166015625, 26.65283203125, 28.7890625, 30.92529296875, 33.0615234375, 35.19775390625, 37.333984375, 39.47021484375, 41.6064453125, 43.74267578125, 45.87890625, 48.01513671875, 50.1513671875, 52.28759765625, 54.423828125, 56.56005859375, 58.6962890625, 60.83251953125, 62.96875]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 52.0, 363.0, 462.0, 123.0, 12.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.515823364257812, -23.231674194335938, -20.947525024414062, -18.663373947143555, -16.37922477722168, -14.095075607299805, -11.810925483703613, -9.526775360107422, -7.242626190185547, -4.958476543426514, -2.6743268966674805, -0.39017724990844727, 1.893972396850586, 4.178121566772461, 6.462271690368652, 8.746421813964844, 11.030570983886719, 13.314720153808594, 15.598870277404785, 17.883020401000977, 20.16716957092285, 22.451318740844727, 24.735469818115234, 27.01961898803711, 29.303768157958984, 31.58791732788086, 33.872066497802734, 36.15621566772461, 38.44036865234375, 40.724517822265625, 43.0086669921875, 45.292816162109375, 47.57695770263672, 49.861106872558594, 52.14525604248047, 54.429405212402344, 56.71355438232422, 58.997703552246094, 61.281856536865234, 63.56600570678711, 65.85015869140625, 68.13430786132812, 70.41845703125, 72.70260620117188, 74.98675537109375, 77.27090454101562, 79.5550537109375, 81.83920288085938, 84.12335205078125, 86.40750122070312, 88.691650390625, 90.97579956054688, 93.25994873046875, 95.54409790039062, 97.8282470703125, 100.11239624023438, 102.39654541015625, 104.68069458007812, 106.96484375, 109.24899291992188, 111.53314208984375, 113.81729125976562, 116.1014404296875, 118.38558959960938, 120.66974639892578]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 6.0, 5.0, 7.0, 9.0, 6.0, 6.0, 9.0, 10.0, 16.0, 20.0, 17.0, 21.0, 23.0, 22.0, 32.0, 12.0, 37.0, 45.0, 32.0, 38.0, 46.0, 49.0, 51.0, 37.0, 52.0, 35.0, 33.0, 32.0, 45.0, 34.0, 22.0, 30.0, 23.0, 19.0, 21.0, 10.0, 15.0, 11.0, 14.0, 12.0, 5.0, 12.0, 5.0, 7.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-65.52726745605469, -63.564144134521484, -61.60102081298828, -59.637901306152344, -57.67477798461914, -55.71165466308594, -53.74853515625, -51.7854118347168, -49.822288513183594, -47.85916519165039, -45.89604187011719, -43.93292236328125, -41.96979904174805, -40.006675720214844, -38.043556213378906, -36.0804328918457, -34.1173095703125, -32.1541862487793, -30.191064834594727, -28.227943420410156, -26.264820098876953, -24.30169677734375, -22.33857536315918, -20.37545394897461, -18.412330627441406, -16.449207305908203, -14.486085891723633, -12.522963523864746, -10.55984115600586, -8.596718788146973, -6.633596420288086, -4.670474052429199, -2.707355499267578, -0.7442331314086914, 1.2188892364501953, 3.182011604309082, 5.145133972167969, 7.1082563400268555, 9.071378707885742, 11.034501075744629, 12.997623443603516, 14.960745811462402, 16.92386817932129, 18.88698959350586, 20.850112915039062, 22.813236236572266, 24.776357650756836, 26.739479064941406, 28.70260238647461, 30.665725708007812, 32.62884521484375, 34.59196853637695, 36.555091857910156, 38.51821517944336, 40.48133850097656, 42.4444580078125, 44.4075813293457, 46.370704650878906, 48.333824157714844, 50.29694747924805, 52.26007080078125, 54.22319412231445, 56.186317443847656, 58.149436950683594, 60.1125602722168]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 5.0, 9.0, 14.0, 11.0, 10.0, 17.0, 22.0, 27.0, 29.0, 32.0, 38.0, 31.0, 44.0, 42.0, 53.0, 41.0, 54.0, 46.0, 54.0, 54.0, 46.0, 46.0, 48.0, 45.0, 30.0, 21.0, 24.0, 21.0, 24.0, 16.0, 11.0, 7.0, 12.0, 8.0, 4.0, 6.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.703125, -9.4124755859375, -9.121826171875, -8.8311767578125, -8.54052734375, -8.2498779296875, -7.959228515625, -7.6685791015625, -7.3779296875, -7.0872802734375, -6.796630859375, -6.5059814453125, -6.21533203125, -5.9246826171875, -5.634033203125, -5.3433837890625, -5.052734375, -4.7620849609375, -4.471435546875, -4.1807861328125, -3.89013671875, -3.5994873046875, -3.308837890625, -3.0181884765625, -2.7275390625, -2.4368896484375, -2.146240234375, -1.8555908203125, -1.56494140625, -1.2742919921875, -0.983642578125, -0.6929931640625, -0.40234375, -0.1116943359375, 0.178955078125, 0.4696044921875, 0.76025390625, 1.0509033203125, 1.341552734375, 1.6322021484375, 1.9228515625, 2.2135009765625, 2.504150390625, 2.7947998046875, 3.08544921875, 3.3760986328125, 3.666748046875, 3.9573974609375, 4.248046875, 4.5386962890625, 4.829345703125, 5.1199951171875, 5.41064453125, 5.7012939453125, 5.991943359375, 6.2825927734375, 6.5732421875, 6.8638916015625, 7.154541015625, 7.4451904296875, 7.73583984375, 8.0264892578125, 8.317138671875, 8.6077880859375, 8.8984375]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 3.0, 7.0, 11.0, 21.0, 20.0, 27.0, 29.0, 49.0, 43.0, 53.0, 81.0, 109.0, 139.0, 229.0, 395.0, 925.0, 3828.0, 44571.0, 1562329.0, 2472203.0, 101073.0, 5618.0, 1173.0, 460.0, 244.0, 161.0, 112.0, 86.0, 54.0, 55.0, 34.0, 34.0, 25.0, 20.0, 13.0, 11.0, 11.0, 9.0, 5.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-22.296875, -21.6025390625, -20.908203125, -20.2138671875, -19.51953125, -18.8251953125, -18.130859375, -17.4365234375, -16.7421875, -16.0478515625, -15.353515625, -14.6591796875, -13.96484375, -13.2705078125, -12.576171875, -11.8818359375, -11.1875, -10.4931640625, -9.798828125, -9.1044921875, -8.41015625, -7.7158203125, -7.021484375, -6.3271484375, -5.6328125, -4.9384765625, -4.244140625, -3.5498046875, -2.85546875, -2.1611328125, -1.466796875, -0.7724609375, -0.078125, 0.6162109375, 1.310546875, 2.0048828125, 2.69921875, 3.3935546875, 4.087890625, 4.7822265625, 5.4765625, 6.1708984375, 6.865234375, 7.5595703125, 8.25390625, 8.9482421875, 9.642578125, 10.3369140625, 11.03125, 11.7255859375, 12.419921875, 13.1142578125, 13.80859375, 14.5029296875, 15.197265625, 15.8916015625, 16.5859375, 17.2802734375, 17.974609375, 18.6689453125, 19.36328125, 20.0576171875, 20.751953125, 21.4462890625, 22.140625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 2.0, 9.0, 16.0, 12.0, 25.0, 17.0, 32.0, 37.0, 44.0, 71.0, 90.0, 111.0, 146.0, 208.0, 289.0, 395.0, 487.0, 443.0, 394.0, 340.0, 232.0, 180.0, 135.0, 83.0, 53.0, 58.0, 46.0, 36.0, 24.0, 16.0, 18.0, 9.0, 3.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.21875, -15.781494140625, -15.34423828125, -14.906982421875, -14.4697265625, -14.032470703125, -13.59521484375, -13.157958984375, -12.720703125, -12.283447265625, -11.84619140625, -11.408935546875, -10.9716796875, -10.534423828125, -10.09716796875, -9.659912109375, -9.22265625, -8.785400390625, -8.34814453125, -7.910888671875, -7.4736328125, -7.036376953125, -6.59912109375, -6.161865234375, -5.724609375, -5.287353515625, -4.85009765625, -4.412841796875, -3.9755859375, -3.538330078125, -3.10107421875, -2.663818359375, -2.2265625, -1.789306640625, -1.35205078125, -0.914794921875, -0.4775390625, -0.040283203125, 0.39697265625, 0.834228515625, 1.271484375, 1.708740234375, 2.14599609375, 2.583251953125, 3.0205078125, 3.457763671875, 3.89501953125, 4.332275390625, 4.76953125, 5.206787109375, 5.64404296875, 6.081298828125, 6.5185546875, 6.955810546875, 7.39306640625, 7.830322265625, 8.267578125, 8.704833984375, 9.14208984375, 9.579345703125, 10.0166015625, 10.453857421875, 10.89111328125, 11.328369140625, 11.765625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 4.0, 8.0, 12.0, 13.0, 21.0, 20.0, 47.0, 41.0, 49.0, 70.0, 93.0, 103.0, 135.0, 180.0, 245.0, 348.0, 611.0, 1920.0, 801507.0, 3383480.0, 3254.0, 668.0, 365.0, 253.0, 186.0, 129.0, 120.0, 80.0, 73.0, 50.0, 34.0, 38.0, 26.0, 21.0, 26.0, 16.0, 6.0, 7.0, 8.0, 4.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-83.8125, -81.490234375, -79.16796875, -76.845703125, -74.5234375, -72.201171875, -69.87890625, -67.556640625, -65.234375, -62.912109375, -60.58984375, -58.267578125, -55.9453125, -53.623046875, -51.30078125, -48.978515625, -46.65625, -44.333984375, -42.01171875, -39.689453125, -37.3671875, -35.044921875, -32.72265625, -30.400390625, -28.078125, -25.755859375, -23.43359375, -21.111328125, -18.7890625, -16.466796875, -14.14453125, -11.822265625, -9.5, -7.177734375, -4.85546875, -2.533203125, -0.2109375, 2.111328125, 4.43359375, 6.755859375, 9.078125, 11.400390625, 13.72265625, 16.044921875, 18.3671875, 20.689453125, 23.01171875, 25.333984375, 27.65625, 29.978515625, 32.30078125, 34.623046875, 36.9453125, 39.267578125, 41.58984375, 43.912109375, 46.234375, 48.556640625, 50.87890625, 53.201171875, 55.5234375, 57.845703125, 60.16796875, 62.490234375, 64.8125]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 17.0, 94.0, 221.0, 308.0, 249.0, 102.0, 12.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-172.65196228027344, -168.05654907226562, -163.4611358642578, -158.86572265625, -154.2703094482422, -149.67489624023438, -145.07948303222656, -140.48406982421875, -135.88865661621094, -131.29324340820312, -126.69783020019531, -122.1024169921875, -117.50700378417969, -112.91159057617188, -108.31617736816406, -103.72076416015625, -99.12535095214844, -94.52993774414062, -89.93452453613281, -85.339111328125, -80.74369812011719, -76.14828491210938, -71.55287170410156, -66.95745849609375, -62.36204528808594, -57.766632080078125, -53.17121887207031, -48.5758056640625, -43.98039245605469, -39.384979248046875, -34.78956604003906, -30.19415283203125, -25.59874725341797, -21.003334045410156, -16.407920837402344, -11.812507629394531, -7.217094421386719, -2.6216812133789062, 1.9737319946289062, 6.569145202636719, 11.164558410644531, 15.759971618652344, 20.355384826660156, 24.95079803466797, 29.54621124267578, 34.141624450683594, 38.737037658691406, 43.33245086669922, 47.92786407470703, 52.523277282714844, 57.118690490722656, 61.71410369873047, 66.30951690673828, 70.9049301147461, 75.5003433227539, 80.09575653076172, 84.69116973876953, 89.28658294677734, 93.88199615478516, 98.47740936279297, 103.07282257080078, 107.6682357788086, 112.2636489868164, 116.85906219482422, 121.45447540283203]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 5.0, 3.0, 1.0, 7.0, 9.0, 6.0, 13.0, 10.0, 9.0, 11.0, 20.0, 13.0, 25.0, 29.0, 13.0, 30.0, 29.0, 26.0, 20.0, 37.0, 25.0, 24.0, 44.0, 37.0, 35.0, 35.0, 35.0, 32.0, 31.0, 38.0, 29.0, 28.0, 25.0, 29.0, 25.0, 27.0, 21.0, 19.0, 34.0, 21.0, 15.0, 17.0, 9.0, 9.0, 8.0, 9.0, 9.0, 4.0, 6.0, 3.0, 2.0, 6.0, 4.0, 0.0, 1.0, 0.0, 2.0], "bins": [-40.26152038574219, -39.01441955566406, -37.76731872558594, -36.52022171020508, -35.27312088012695, -34.02602005004883, -32.77892303466797, -31.531822204589844, -30.28472137451172, -29.037620544433594, -27.7905216217041, -26.54342269897461, -25.296321868896484, -24.04922103881836, -22.802122116088867, -21.555023193359375, -20.30792236328125, -19.060821533203125, -17.813722610473633, -16.56662368774414, -15.319522857666016, -14.072422981262207, -12.825323104858398, -11.57822322845459, -10.331123352050781, -9.084023475646973, -7.836923599243164, -6.5898237228393555, -5.342723846435547, -4.095623970031738, -2.8485240936279297, -1.601424217224121, -0.3543243408203125, 0.8927755355834961, 2.1398754119873047, 3.3869752883911133, 4.634075164794922, 5.8811750411987305, 7.128274917602539, 8.375374794006348, 9.622474670410156, 10.869574546813965, 12.116674423217773, 13.363774299621582, 14.61087417602539, 15.8579740524292, 17.105073928833008, 18.3521728515625, 19.599273681640625, 20.84637451171875, 22.093473434448242, 23.340572357177734, 24.58767318725586, 25.834774017333984, 27.081872940063477, 28.32897186279297, 29.576072692871094, 30.82317352294922, 32.070274353027344, 33.3173713684082, 34.56447219848633, 35.81157302856445, 37.05867004394531, 38.30577087402344, 39.55287170410156]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 5.0, 4.0, 10.0, 4.0, 13.0, 22.0, 19.0, 18.0, 26.0, 29.0, 36.0, 28.0, 40.0, 27.0, 37.0, 52.0, 60.0, 50.0, 46.0, 52.0, 52.0, 41.0, 34.0, 43.0, 38.0, 26.0, 35.0, 32.0, 17.0, 20.0, 20.0, 16.0, 11.0, 14.0, 4.0, 7.0, 7.0, 5.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.390625, -8.1251220703125, -7.859619140625, -7.5941162109375, -7.32861328125, -7.0631103515625, -6.797607421875, -6.5321044921875, -6.2666015625, -6.0010986328125, -5.735595703125, -5.4700927734375, -5.20458984375, -4.9390869140625, -4.673583984375, -4.4080810546875, -4.142578125, -3.8770751953125, -3.611572265625, -3.3460693359375, -3.08056640625, -2.8150634765625, -2.549560546875, -2.2840576171875, -2.0185546875, -1.7530517578125, -1.487548828125, -1.2220458984375, -0.95654296875, -0.6910400390625, -0.425537109375, -0.1600341796875, 0.10546875, 0.3709716796875, 0.636474609375, 0.9019775390625, 1.16748046875, 1.4329833984375, 1.698486328125, 1.9639892578125, 2.2294921875, 2.4949951171875, 2.760498046875, 3.0260009765625, 3.29150390625, 3.5570068359375, 3.822509765625, 4.0880126953125, 4.353515625, 4.6190185546875, 4.884521484375, 5.1500244140625, 5.41552734375, 5.6810302734375, 5.946533203125, 6.2120361328125, 6.4775390625, 6.7430419921875, 7.008544921875, 7.2740478515625, 7.53955078125, 7.8050537109375, 8.070556640625, 8.3360595703125, 8.6015625]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 0.0, 2.0, 3.0, 7.0, 8.0, 12.0, 17.0, 23.0, 35.0, 58.0, 90.0, 106.0, 164.0, 199.0, 294.0, 469.0, 700.0, 982.0, 1487.0, 2244.0, 3464.0, 5486.0, 8428.0, 12647.0, 19975.0, 30603.0, 48223.0, 80141.0, 164656.0, 318036.0, 147060.0, 74595.0, 45243.0, 29313.0, 18864.0, 11998.0, 7745.0, 5200.0, 3293.0, 2160.0, 1484.0, 1028.0, 652.0, 425.0, 272.0, 222.0, 136.0, 93.0, 69.0, 47.0, 31.0, 15.0, 19.0, 7.0, 10.0, 12.0, 6.0, 3.0, 4.0, 2.0, 2.0], "bins": [-1.451171875, -1.40643310546875, -1.3616943359375, -1.31695556640625, -1.272216796875, -1.22747802734375, -1.1827392578125, -1.13800048828125, -1.09326171875, -1.04852294921875, -1.0037841796875, -0.95904541015625, -0.914306640625, -0.86956787109375, -0.8248291015625, -0.78009033203125, -0.7353515625, -0.69061279296875, -0.6458740234375, -0.60113525390625, -0.556396484375, -0.51165771484375, -0.4669189453125, -0.42218017578125, -0.37744140625, -0.33270263671875, -0.2879638671875, -0.24322509765625, -0.198486328125, -0.15374755859375, -0.1090087890625, -0.06427001953125, -0.01953125, 0.02520751953125, 0.0699462890625, 0.11468505859375, 0.159423828125, 0.20416259765625, 0.2489013671875, 0.29364013671875, 0.33837890625, 0.38311767578125, 0.4278564453125, 0.47259521484375, 0.517333984375, 0.56207275390625, 0.6068115234375, 0.65155029296875, 0.6962890625, 0.74102783203125, 0.7857666015625, 0.83050537109375, 0.875244140625, 0.91998291015625, 0.9647216796875, 1.00946044921875, 1.05419921875, 1.09893798828125, 1.1436767578125, 1.18841552734375, 1.233154296875, 1.27789306640625, 1.3226318359375, 1.36737060546875, 1.412109375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 4.0, 9.0, 9.0, 11.0, 12.0, 12.0, 20.0, 17.0, 16.0, 21.0, 21.0, 19.0, 29.0, 35.0, 22.0, 53.0, 24.0, 38.0, 30.0, 36.0, 1071.0, 32.0, 37.0, 46.0, 30.0, 38.0, 38.0, 26.0, 28.0, 23.0, 32.0, 29.0, 17.0, 23.0, 25.0, 16.0, 11.0, 10.0, 12.0, 10.0, 6.0, 3.0, 1.0, 5.0, 7.0, 0.0, 5.0, 3.0, 1.0, 3.0, 1.0], "bins": [-4.703125, -4.56304931640625, -4.4229736328125, -4.28289794921875, -4.142822265625, -4.00274658203125, -3.8626708984375, -3.72259521484375, -3.58251953125, -3.44244384765625, -3.3023681640625, -3.16229248046875, -3.022216796875, -2.88214111328125, -2.7420654296875, -2.60198974609375, -2.4619140625, -2.32183837890625, -2.1817626953125, -2.04168701171875, -1.901611328125, -1.76153564453125, -1.6214599609375, -1.48138427734375, -1.34130859375, -1.20123291015625, -1.0611572265625, -0.92108154296875, -0.781005859375, -0.64093017578125, -0.5008544921875, -0.36077880859375, -0.220703125, -0.08062744140625, 0.0594482421875, 0.19952392578125, 0.339599609375, 0.47967529296875, 0.6197509765625, 0.75982666015625, 0.89990234375, 1.03997802734375, 1.1800537109375, 1.32012939453125, 1.460205078125, 1.60028076171875, 1.7403564453125, 1.88043212890625, 2.0205078125, 2.16058349609375, 2.3006591796875, 2.44073486328125, 2.580810546875, 2.72088623046875, 2.8609619140625, 3.00103759765625, 3.14111328125, 3.28118896484375, 3.4212646484375, 3.56134033203125, 3.701416015625, 3.84149169921875, 3.9815673828125, 4.12164306640625, 4.26171875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 0.0, 4.0, 7.0, 4.0, 12.0, 10.0, 24.0, 29.0, 51.0, 89.0, 96.0, 182.0, 245.0, 340.0, 459.0, 656.0, 1009.0, 1416.0, 2082.0, 2929.0, 4324.0, 6432.0, 9486.0, 13889.0, 21268.0, 32786.0, 51429.0, 83490.0, 154352.0, 1342536.0, 144546.0, 80185.0, 49437.0, 31292.0, 20057.0, 13422.0, 9043.0, 6078.0, 4198.0, 2804.0, 1967.0, 1357.0, 945.0, 685.0, 410.0, 305.0, 232.0, 151.0, 112.0, 69.0, 49.0, 56.0, 39.0, 17.0, 21.0, 12.0, 5.0, 8.0, 3.0, 1.0, 2.0], "bins": [-1.31640625, -1.275848388671875, -1.23529052734375, -1.194732666015625, -1.1541748046875, -1.113616943359375, -1.07305908203125, -1.032501220703125, -0.991943359375, -0.951385498046875, -0.91082763671875, -0.870269775390625, -0.8297119140625, -0.789154052734375, -0.74859619140625, -0.708038330078125, -0.66748046875, -0.626922607421875, -0.58636474609375, -0.545806884765625, -0.5052490234375, -0.464691162109375, -0.42413330078125, -0.383575439453125, -0.343017578125, -0.302459716796875, -0.26190185546875, -0.221343994140625, -0.1807861328125, -0.140228271484375, -0.09967041015625, -0.059112548828125, -0.0185546875, 0.022003173828125, 0.06256103515625, 0.103118896484375, 0.1436767578125, 0.184234619140625, 0.22479248046875, 0.265350341796875, 0.305908203125, 0.346466064453125, 0.38702392578125, 0.427581787109375, 0.4681396484375, 0.508697509765625, 0.54925537109375, 0.589813232421875, 0.63037109375, 0.670928955078125, 0.71148681640625, 0.752044677734375, 0.7926025390625, 0.833160400390625, 0.87371826171875, 0.914276123046875, 0.954833984375, 0.995391845703125, 1.03594970703125, 1.076507568359375, 1.1170654296875, 1.157623291015625, 1.19818115234375, 1.238739013671875, 1.279296875]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 9.0, 7.0, 16.0, 6.0, 17.0, 19.0, 11.0, 13.0, 28.0, 31.0, 57.0, 58.0, 76.0, 98.0, 113.0, 106.0, 83.0, 73.0, 39.0, 27.0, 22.0, 15.0, 11.0, 13.0, 20.0, 6.0, 9.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0010442733764648438, -0.0010156482458114624, -0.000987023115158081, -0.0009583979845046997, -0.0009297728538513184, -0.000901147723197937, -0.0008725225925445557, -0.0008438974618911743, -0.000815272331237793, -0.0007866472005844116, -0.0007580220699310303, -0.0007293969392776489, -0.0007007718086242676, -0.0006721466779708862, -0.0006435215473175049, -0.0006148964166641235, -0.0005862712860107422, -0.0005576461553573608, -0.0005290210247039795, -0.0005003958940505981, -0.0004717707633972168, -0.00044314563274383545, -0.0004145205020904541, -0.00038589537143707275, -0.0003572702407836914, -0.00032864511013031006, -0.0003000199794769287, -0.00027139484882354736, -0.00024276971817016602, -0.00021414458751678467, -0.00018551945686340332, -0.00015689432621002197, -0.00012826919555664062, -9.964406490325928e-05, -7.101893424987793e-05, -4.239380359649658e-05, -1.3768672943115234e-05, 1.4856457710266113e-05, 4.348158836364746e-05, 7.210671901702881e-05, 0.00010073184967041016, 0.0001293569803237915, 0.00015798211097717285, 0.0001866072416305542, 0.00021523237228393555, 0.0002438575029373169, 0.00027248263359069824, 0.0003011077642440796, 0.00032973289489746094, 0.0003583580255508423, 0.00038698315620422363, 0.000415608286857605, 0.00044423341751098633, 0.0004728585481643677, 0.000501483678817749, 0.0005301088094711304, 0.0005587339401245117, 0.0005873590707778931, 0.0006159842014312744, 0.0006446093320846558, 0.0006732344627380371, 0.0007018595933914185, 0.0007304847240447998, 0.0007591098546981812, 0.0007877349853515625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 1.0, 2.0, 4.0, 9.0, 12.0, 15.0, 12.0, 18.0, 23.0, 36.0, 50.0, 81.0, 188.0, 445.0, 4089.0, 1040957.0, 1780.0, 366.0, 170.0, 76.0, 57.0, 32.0, 28.0, 18.0, 34.0, 15.0, 11.0, 4.0, 3.0, 6.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.020538330078125, -0.01978898048400879, -0.019039630889892578, -0.018290281295776367, -0.017540931701660156, -0.016791582107543945, -0.016042232513427734, -0.015292882919311523, -0.014543533325195312, -0.013794183731079102, -0.01304483413696289, -0.01229548454284668, -0.011546134948730469, -0.010796785354614258, -0.010047435760498047, -0.009298086166381836, -0.008548736572265625, -0.007799386978149414, -0.007050037384033203, -0.006300687789916992, -0.005551338195800781, -0.00480198860168457, -0.004052639007568359, -0.0033032894134521484, -0.0025539398193359375, -0.0018045902252197266, -0.0010552406311035156, -0.0003058910369873047, 0.00044345855712890625, 0.0011928081512451172, 0.0019421577453613281, 0.002691507339477539, 0.00344085693359375, 0.004190206527709961, 0.004939556121826172, 0.005688905715942383, 0.006438255310058594, 0.007187604904174805, 0.007936954498291016, 0.008686304092407227, 0.009435653686523438, 0.010185003280639648, 0.01093435287475586, 0.01168370246887207, 0.012433052062988281, 0.013182401657104492, 0.013931751251220703, 0.014681100845336914, 0.015430450439453125, 0.016179800033569336, 0.016929149627685547, 0.017678499221801758, 0.01842784881591797, 0.01917719841003418, 0.01992654800415039, 0.0206758975982666, 0.021425247192382812, 0.022174596786499023, 0.022923946380615234, 0.023673295974731445, 0.024422645568847656, 0.025171995162963867, 0.025921344757080078, 0.02667069435119629, 0.0274200439453125]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 11.0, 277.0, 651.0, 75.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00207805004902184, -0.001988771138712764, -0.0018994922284036875, -0.001810213434509933, -0.0017209345242008567, -0.0016316556138917804, -0.001542376819998026, -0.0014530979096889496, -0.0013638189993798733, -0.001274540089070797, -0.0011852611787617207, -0.0010959823848679662, -0.0010067034745588899, -0.0009174245642498136, -0.0008281457121483982, -0.0007388668600469828, -0.0006495879497379065, -0.0005603090394288301, -0.00047103018732741475, -0.0003817513061221689, -0.00029247242491692305, -0.0002031935437116772, -0.00011391466250643134, -2.4635810405015945e-05, 6.464309990406036e-05, 0.00015392198110930622, 0.00024320086231455207, 0.0003324797435197979, 0.0004217586247250438, 0.0005110375350341201, 0.0006003163871355355, 0.0006895952392369509, 0.0007788743823766708, 0.0008681532926857471, 0.0009574321447871625, 0.001046710996888578, 0.0011359899071976542, 0.0012252688175067306, 0.001314547611400485, 0.0014038265217095613, 0.0014931054320186377, 0.001582384342327714, 0.0016716632526367903, 0.0017609420465305448, 0.001850220956839621, 0.0019394998671486974, 0.002028778661042452, 0.002118057571351528, 0.0022073364816606045, 0.002296615391969681, 0.002385894302278757, 0.0024751732125878334, 0.0025644521228969097, 0.0026537308003753424, 0.0027430097106844187, 0.002832288620993495, 0.0029215675313025713, 0.0030108464416116476, 0.003100125351920724, 0.0031894042622298002, 0.003278682939708233, 0.003367961850017309, 0.0034572407603263855, 0.003546519670635462, 0.003635798580944538]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 6.0, 3.0, 6.0, 11.0, 16.0, 9.0, 13.0, 18.0, 17.0, 21.0, 27.0, 29.0, 30.0, 28.0, 32.0, 30.0, 30.0, 30.0, 40.0, 29.0, 32.0, 47.0, 45.0, 38.0, 29.0, 21.0, 30.0, 42.0, 26.0, 26.0, 26.0, 27.0, 24.0, 18.0, 16.0, 17.0, 23.0, 14.0, 18.0, 13.0, 9.0, 6.0, 7.0, 7.0, 5.0, 5.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0003203749656677246, -0.00031030457466840744, -0.00030023418366909027, -0.0002901637926697731, -0.00028009340167045593, -0.00027002301067113876, -0.0002599526196718216, -0.0002498822286725044, -0.00023981183767318726, -0.0002297414466738701, -0.00021967105567455292, -0.00020960066467523575, -0.00019953027367591858, -0.0001894598826766014, -0.00017938949167728424, -0.00016931910067796707, -0.0001592487096786499, -0.00014917831867933273, -0.00013910792768001556, -0.0001290375366806984, -0.00011896714568138123, -0.00010889675468206406, -9.882636368274689e-05, -8.875597268342972e-05, -7.868558168411255e-05, -6.861519068479538e-05, -5.854479968547821e-05, -4.847440868616104e-05, -3.840401768684387e-05, -2.8333626687526703e-05, -1.8263235688209534e-05, -8.192844688892365e-06, 1.8775463104248047e-06, 1.1947937309741974e-05, 2.2018328309059143e-05, 3.208871930837631e-05, 4.215911030769348e-05, 5.222950130701065e-05, 6.229989230632782e-05, 7.237028330564499e-05, 8.244067430496216e-05, 9.251106530427933e-05, 0.0001025814563035965, 0.00011265184730291367, 0.00012272223830223083, 0.000132792629301548, 0.00014286302030086517, 0.00015293341130018234, 0.0001630038022994995, 0.00017307419329881668, 0.00018314458429813385, 0.00019321497529745102, 0.0002032853662967682, 0.00021335575729608536, 0.00022342614829540253, 0.0002334965392947197, 0.00024356693029403687, 0.00025363732129335403, 0.0002637077122926712, 0.00027377810329198837, 0.00028384849429130554, 0.0002939188852906227, 0.0003039892762899399, 0.00031405966728925705, 0.0003241300582885742]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 5.0, 4.0, 10.0, 4.0, 13.0, 22.0, 19.0, 18.0, 26.0, 29.0, 36.0, 28.0, 40.0, 27.0, 37.0, 52.0, 60.0, 50.0, 46.0, 52.0, 52.0, 41.0, 34.0, 43.0, 38.0, 26.0, 35.0, 32.0, 17.0, 20.0, 20.0, 16.0, 11.0, 14.0, 4.0, 7.0, 7.0, 5.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.390625, -8.1251220703125, -7.859619140625, -7.5941162109375, -7.32861328125, -7.0631103515625, -6.797607421875, -6.5321044921875, -6.2666015625, -6.0010986328125, -5.735595703125, -5.4700927734375, -5.20458984375, -4.9390869140625, -4.673583984375, -4.4080810546875, -4.142578125, -3.8770751953125, -3.611572265625, -3.3460693359375, -3.08056640625, -2.8150634765625, -2.549560546875, -2.2840576171875, -2.0185546875, -1.7530517578125, -1.487548828125, -1.2220458984375, -0.95654296875, -0.6910400390625, -0.425537109375, -0.1600341796875, 0.10546875, 0.3709716796875, 0.636474609375, 0.9019775390625, 1.16748046875, 1.4329833984375, 1.698486328125, 1.9639892578125, 2.2294921875, 2.4949951171875, 2.760498046875, 3.0260009765625, 3.29150390625, 3.5570068359375, 3.822509765625, 4.0880126953125, 4.353515625, 4.6190185546875, 4.884521484375, 5.1500244140625, 5.41552734375, 5.6810302734375, 5.946533203125, 6.2120361328125, 6.4775390625, 6.7430419921875, 7.008544921875, 7.2740478515625, 7.53955078125, 7.8050537109375, 8.070556640625, 8.3360595703125, 8.6015625]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 2.0, 4.0, 7.0, 3.0, 7.0, 17.0, 21.0, 24.0, 38.0, 67.0, 111.0, 144.0, 264.0, 395.0, 702.0, 1303.0, 2369.0, 4628.0, 9473.0, 19906.0, 44483.0, 106852.0, 296657.0, 343922.0, 123068.0, 50087.0, 22274.0, 10467.0, 5243.0, 2652.0, 1357.0, 764.0, 434.0, 267.0, 185.0, 127.0, 75.0, 53.0, 32.0, 27.0, 11.0, 11.0, 9.0, 3.0, 6.0, 0.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-4.9921875, -4.849853515625, -4.70751953125, -4.565185546875, -4.4228515625, -4.280517578125, -4.13818359375, -3.995849609375, -3.853515625, -3.711181640625, -3.56884765625, -3.426513671875, -3.2841796875, -3.141845703125, -2.99951171875, -2.857177734375, -2.71484375, -2.572509765625, -2.43017578125, -2.287841796875, -2.1455078125, -2.003173828125, -1.86083984375, -1.718505859375, -1.576171875, -1.433837890625, -1.29150390625, -1.149169921875, -1.0068359375, -0.864501953125, -0.72216796875, -0.579833984375, -0.4375, -0.295166015625, -0.15283203125, -0.010498046875, 0.1318359375, 0.274169921875, 0.41650390625, 0.558837890625, 0.701171875, 0.843505859375, 0.98583984375, 1.128173828125, 1.2705078125, 1.412841796875, 1.55517578125, 1.697509765625, 1.83984375, 1.982177734375, 2.12451171875, 2.266845703125, 2.4091796875, 2.551513671875, 2.69384765625, 2.836181640625, 2.978515625, 3.120849609375, 3.26318359375, 3.405517578125, 3.5478515625, 3.690185546875, 3.83251953125, 3.974853515625, 4.1171875]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 8.0, 7.0, 3.0, 8.0, 7.0, 17.0, 23.0, 20.0, 18.0, 30.0, 29.0, 28.0, 33.0, 39.0, 41.0, 48.0, 56.0, 85.0, 386.0, 1597.0, 109.0, 60.0, 52.0, 51.0, 38.0, 44.0, 27.0, 33.0, 20.0, 33.0, 18.0, 16.0, 14.0, 12.0, 10.0, 12.0, 6.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.984375, -28.134765625, -27.28515625, -26.435546875, -25.5859375, -24.736328125, -23.88671875, -23.037109375, -22.1875, -21.337890625, -20.48828125, -19.638671875, -18.7890625, -17.939453125, -17.08984375, -16.240234375, -15.390625, -14.541015625, -13.69140625, -12.841796875, -11.9921875, -11.142578125, -10.29296875, -9.443359375, -8.59375, -7.744140625, -6.89453125, -6.044921875, -5.1953125, -4.345703125, -3.49609375, -2.646484375, -1.796875, -0.947265625, -0.09765625, 0.751953125, 1.6015625, 2.451171875, 3.30078125, 4.150390625, 5.0, 5.849609375, 6.69921875, 7.548828125, 8.3984375, 9.248046875, 10.09765625, 10.947265625, 11.796875, 12.646484375, 13.49609375, 14.345703125, 15.1953125, 16.044921875, 16.89453125, 17.744140625, 18.59375, 19.443359375, 20.29296875, 21.142578125, 21.9921875, 22.841796875, 23.69140625, 24.541015625, 25.390625]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 5.0, 5.0, 13.0, 20.0, 11.0, 19.0, 20.0, 27.0, 45.0, 43.0, 74.0, 82.0, 120.0, 152.0, 214.0, 336.0, 590.0, 3365.0, 3014183.0, 123498.0, 1416.0, 423.0, 254.0, 199.0, 147.0, 97.0, 82.0, 51.0, 59.0, 30.0, 27.0, 26.0, 14.0, 13.0, 7.0, 6.0, 10.0, 10.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-60.75, -58.712890625, -56.67578125, -54.638671875, -52.6015625, -50.564453125, -48.52734375, -46.490234375, -44.453125, -42.416015625, -40.37890625, -38.341796875, -36.3046875, -34.267578125, -32.23046875, -30.193359375, -28.15625, -26.119140625, -24.08203125, -22.044921875, -20.0078125, -17.970703125, -15.93359375, -13.896484375, -11.859375, -9.822265625, -7.78515625, -5.748046875, -3.7109375, -1.673828125, 0.36328125, 2.400390625, 4.4375, 6.474609375, 8.51171875, 10.548828125, 12.5859375, 14.623046875, 16.66015625, 18.697265625, 20.734375, 22.771484375, 24.80859375, 26.845703125, 28.8828125, 30.919921875, 32.95703125, 34.994140625, 37.03125, 39.068359375, 41.10546875, 43.142578125, 45.1796875, 47.216796875, 49.25390625, 51.291015625, 53.328125, 55.365234375, 57.40234375, 59.439453125, 61.4765625, 63.513671875, 65.55078125, 67.587890625, 69.625]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [8.0, 468.0, 539.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.97726821899414, -6.076019763946533, -0.17477130889892578, 5.726476669311523, 11.627725601196289, 17.528974533081055, 23.430221557617188, 29.331470489501953, 35.23271942138672, 41.133968353271484, 47.03521728515625, 52.93646240234375, 58.83771514892578, 64.73896026611328, 70.64021301269531, 76.54145812988281, 82.44270324707031, 88.34394836425781, 94.24520111083984, 100.14644622802734, 106.04769897460938, 111.94894409179688, 117.85018920898438, 123.7514419555664, 129.65269470214844, 135.55393981933594, 141.45518493652344, 147.3564453125, 153.2576904296875, 159.158935546875, 165.0601806640625, 170.96142578125, 176.86268615722656, 182.76393127441406, 188.66517639160156, 194.56643676757812, 200.46768188476562, 206.36892700195312, 212.27017211914062, 218.17141723632812, 224.0726776123047, 229.9739227294922, 235.8751678466797, 241.77642822265625, 247.67767333984375, 253.57891845703125, 259.48016357421875, 265.38140869140625, 271.28265380859375, 277.18389892578125, 283.08514404296875, 288.98638916015625, 294.88763427734375, 300.7889099121094, 306.6901550292969, 312.5914001464844, 318.4926452636719, 324.3938903808594, 330.2951354980469, 336.1963806152344, 342.0976257324219, 347.9989013671875, 353.900146484375, 359.8013916015625, 365.70263671875]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 9.0, 10.0, 9.0, 9.0, 9.0, 11.0, 18.0, 23.0, 21.0, 28.0, 28.0, 40.0, 36.0, 44.0, 45.0, 38.0, 45.0, 37.0, 51.0, 44.0, 28.0, 41.0, 41.0, 44.0, 31.0, 38.0, 24.0, 25.0, 23.0, 26.0, 24.0, 22.0, 12.0, 9.0, 14.0, 14.0, 6.0, 5.0, 3.0, 2.0, 4.0, 7.0, 0.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.768829345703125, -59.7972297668457, -57.82563018798828, -55.85403060913086, -53.88243103027344, -51.910831451416016, -49.939231872558594, -47.96763229370117, -45.99603271484375, -44.02443313598633, -42.052833557128906, -40.081233978271484, -38.10963439941406, -36.13803482055664, -34.16643524169922, -32.1948356628418, -30.223234176635742, -28.25163459777832, -26.2800350189209, -24.308435440063477, -22.336835861206055, -20.365234375, -18.393634796142578, -16.422035217285156, -14.45043659210205, -12.478837013244629, -10.507237434387207, -8.535636901855469, -6.564037799835205, -4.592437744140625, -2.620838165283203, -0.6492385864257812, 1.3223609924316406, 3.2939605712890625, 5.265560150146484, 7.2371602058410645, 9.208759307861328, 11.180359840393066, 13.151959419250488, 15.12355899810791, 17.095157623291016, 19.066757202148438, 21.03835678100586, 23.00995635986328, 24.981555938720703, 26.953155517578125, 28.924755096435547, 30.89635467529297, 32.867958068847656, 34.83955764770508, 36.8111572265625, 38.78275680541992, 40.754356384277344, 42.725955963134766, 44.69755554199219, 46.66915512084961, 48.64075469970703, 50.61235427856445, 52.583953857421875, 54.5555534362793, 56.52715301513672, 58.49875259399414, 60.47035217285156, 62.441951751708984, 64.4135513305664]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 9.0, 6.0, 6.0, 10.0, 11.0, 21.0, 19.0, 27.0, 17.0, 35.0, 38.0, 34.0, 34.0, 39.0, 44.0, 55.0, 55.0, 51.0, 43.0, 47.0, 38.0, 41.0, 49.0, 40.0, 32.0, 19.0, 35.0, 26.0, 28.0, 17.0, 13.0, 17.0, 13.0, 8.0, 10.0, 1.0, 3.0, 3.0, 5.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.1015625, -8.825927734375, -8.55029296875, -8.274658203125, -7.9990234375, -7.723388671875, -7.44775390625, -7.172119140625, -6.896484375, -6.620849609375, -6.34521484375, -6.069580078125, -5.7939453125, -5.518310546875, -5.24267578125, -4.967041015625, -4.69140625, -4.415771484375, -4.14013671875, -3.864501953125, -3.5888671875, -3.313232421875, -3.03759765625, -2.761962890625, -2.486328125, -2.210693359375, -1.93505859375, -1.659423828125, -1.3837890625, -1.108154296875, -0.83251953125, -0.556884765625, -0.28125, -0.005615234375, 0.27001953125, 0.545654296875, 0.8212890625, 1.096923828125, 1.37255859375, 1.648193359375, 1.923828125, 2.199462890625, 2.47509765625, 2.750732421875, 3.0263671875, 3.302001953125, 3.57763671875, 3.853271484375, 4.12890625, 4.404541015625, 4.68017578125, 4.955810546875, 5.2314453125, 5.507080078125, 5.78271484375, 6.058349609375, 6.333984375, 6.609619140625, 6.88525390625, 7.160888671875, 7.4365234375, 7.712158203125, 7.98779296875, 8.263427734375, 8.5390625]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 3.0, 7.0, 6.0, 7.0, 18.0, 11.0, 17.0, 23.0, 25.0, 36.0, 26.0, 49.0, 54.0, 110.0, 218.0, 556.0, 1990.0, 13505.0, 757283.0, 3307535.0, 105667.0, 5095.0, 1163.0, 382.0, 137.0, 85.0, 47.0, 51.0, 24.0, 22.0, 24.0, 20.0, 13.0, 15.0, 12.0, 11.0, 6.0, 7.0, 3.0, 8.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-27.359375, -26.511962890625, -25.66455078125, -24.817138671875, -23.9697265625, -23.122314453125, -22.27490234375, -21.427490234375, -20.580078125, -19.732666015625, -18.88525390625, -18.037841796875, -17.1904296875, -16.343017578125, -15.49560546875, -14.648193359375, -13.80078125, -12.953369140625, -12.10595703125, -11.258544921875, -10.4111328125, -9.563720703125, -8.71630859375, -7.868896484375, -7.021484375, -6.174072265625, -5.32666015625, -4.479248046875, -3.6318359375, -2.784423828125, -1.93701171875, -1.089599609375, -0.2421875, 0.605224609375, 1.45263671875, 2.300048828125, 3.1474609375, 3.994873046875, 4.84228515625, 5.689697265625, 6.537109375, 7.384521484375, 8.23193359375, 9.079345703125, 9.9267578125, 10.774169921875, 11.62158203125, 12.468994140625, 13.31640625, 14.163818359375, 15.01123046875, 15.858642578125, 16.7060546875, 17.553466796875, 18.40087890625, 19.248291015625, 20.095703125, 20.943115234375, 21.79052734375, 22.637939453125, 23.4853515625, 24.332763671875, 25.18017578125, 26.027587890625, 26.875]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 10.0, 11.0, 13.0, 22.0, 25.0, 36.0, 52.0, 68.0, 98.0, 155.0, 190.0, 292.0, 441.0, 537.0, 575.0, 443.0, 309.0, 229.0, 152.0, 101.0, 85.0, 77.0, 48.0, 28.0, 30.0, 15.0, 12.0, 5.0, 11.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.046875, -17.5479736328125, -17.049072265625, -16.5501708984375, -16.05126953125, -15.5523681640625, -15.053466796875, -14.5545654296875, -14.0556640625, -13.5567626953125, -13.057861328125, -12.5589599609375, -12.06005859375, -11.5611572265625, -11.062255859375, -10.5633544921875, -10.064453125, -9.5655517578125, -9.066650390625, -8.5677490234375, -8.06884765625, -7.5699462890625, -7.071044921875, -6.5721435546875, -6.0732421875, -5.5743408203125, -5.075439453125, -4.5765380859375, -4.07763671875, -3.5787353515625, -3.079833984375, -2.5809326171875, -2.08203125, -1.5831298828125, -1.084228515625, -0.5853271484375, -0.08642578125, 0.4124755859375, 0.911376953125, 1.4102783203125, 1.9091796875, 2.4080810546875, 2.906982421875, 3.4058837890625, 3.90478515625, 4.4036865234375, 4.902587890625, 5.4014892578125, 5.900390625, 6.3992919921875, 6.898193359375, 7.3970947265625, 7.89599609375, 8.3948974609375, 8.893798828125, 9.3927001953125, 9.8916015625, 10.3905029296875, 10.889404296875, 11.3883056640625, 11.88720703125, 12.3861083984375, 12.885009765625, 13.3839111328125, 13.8828125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 6.0, 9.0, 15.0, 18.0, 21.0, 24.0, 27.0, 49.0, 44.0, 55.0, 72.0, 77.0, 117.0, 118.0, 138.0, 198.0, 314.0, 520.0, 1164.0, 25790.0, 4123332.0, 39022.0, 1308.0, 526.0, 308.0, 222.0, 150.0, 132.0, 90.0, 88.0, 65.0, 63.0, 43.0, 40.0, 25.0, 23.0, 22.0, 12.0, 8.0, 12.0, 5.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-64.6875, -62.4970703125, -60.306640625, -58.1162109375, -55.92578125, -53.7353515625, -51.544921875, -49.3544921875, -47.1640625, -44.9736328125, -42.783203125, -40.5927734375, -38.40234375, -36.2119140625, -34.021484375, -31.8310546875, -29.640625, -27.4501953125, -25.259765625, -23.0693359375, -20.87890625, -18.6884765625, -16.498046875, -14.3076171875, -12.1171875, -9.9267578125, -7.736328125, -5.5458984375, -3.35546875, -1.1650390625, 1.025390625, 3.2158203125, 5.40625, 7.5966796875, 9.787109375, 11.9775390625, 14.16796875, 16.3583984375, 18.548828125, 20.7392578125, 22.9296875, 25.1201171875, 27.310546875, 29.5009765625, 31.69140625, 33.8818359375, 36.072265625, 38.2626953125, 40.453125, 42.6435546875, 44.833984375, 47.0244140625, 49.21484375, 51.4052734375, 53.595703125, 55.7861328125, 57.9765625, 60.1669921875, 62.357421875, 64.5478515625, 66.73828125, 68.9287109375, 71.119140625, 73.3095703125, 75.5]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 24.0, 282.0, 551.0, 148.0, 9.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.84202575683594, -85.30484008789062, -77.76764678955078, -70.23045349121094, -62.693267822265625, -55.15607833862305, -47.61888885498047, -40.08169937133789, -32.54450988769531, -25.007320404052734, -17.470130920410156, -9.932941436767578, -2.395751953125, 5.141437530517578, 12.678627014160156, 20.215816497802734, 27.753005981445312, 35.29019546508789, 42.82738494873047, 50.36457443237305, 57.901763916015625, 65.43894958496094, 72.97614288330078, 80.51333618164062, 88.05052185058594, 95.58770751953125, 103.1249008178711, 110.66209411621094, 118.19927978515625, 125.73646545410156, 133.27365112304688, 140.81085205078125, 148.34805297851562, 155.88523864746094, 163.42242431640625, 170.95962524414062, 178.49681091308594, 186.03399658203125, 193.57119750976562, 201.10838317871094, 208.64556884765625, 216.18275451660156, 223.71994018554688, 231.25714111328125, 238.79432678222656, 246.33151245117188, 253.86871337890625, 261.4058837890625, 268.9430847167969, 276.48028564453125, 284.0174560546875, 291.5546569824219, 299.09185791015625, 306.6290283203125, 314.1662292480469, 321.7033996582031, 329.2406005859375, 336.7778015136719, 344.3149719238281, 351.8521728515625, 359.38934326171875, 366.9265441894531, 374.4637451171875, 382.00091552734375, 389.5381164550781]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 6.0, 3.0, 6.0, 6.0, 9.0, 10.0, 17.0, 19.0, 19.0, 23.0, 16.0, 28.0, 24.0, 33.0, 21.0, 30.0, 35.0, 48.0, 51.0, 38.0, 53.0, 35.0, 52.0, 45.0, 44.0, 45.0, 37.0, 32.0, 34.0, 26.0, 27.0, 28.0, 12.0, 21.0, 14.0, 9.0, 5.0, 14.0, 12.0, 7.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.310394287109375, -47.79655075073242, -46.282711029052734, -44.76886749267578, -43.255027770996094, -41.74118423461914, -40.22734069824219, -38.7135009765625, -37.19966125488281, -35.68581771850586, -34.17197799682617, -32.65813446044922, -31.14429473876953, -29.630451202392578, -28.116609573364258, -26.602767944335938, -25.088924407958984, -23.575082778930664, -22.061241149902344, -20.54739761352539, -19.033557891845703, -17.51971435546875, -16.00587272644043, -14.49203109741211, -12.978189468383789, -11.464347839355469, -9.950506210327148, -8.436663627624512, -6.922821998596191, -5.408980369567871, -3.8951377868652344, -2.381296157836914, -0.8674545288085938, 0.6463873386383057, 2.160229206085205, 3.6740713119506836, 5.187912940979004, 6.701754570007324, 8.215597152709961, 9.729438781738281, 11.243280410766602, 12.757122039794922, 14.270963668823242, 15.784806251525879, 17.298648834228516, 18.812488555908203, 20.326332092285156, 21.840173721313477, 23.354015350341797, 24.867856979370117, 26.381698608398438, 27.89554214477539, 29.409381866455078, 30.92322540283203, 32.43706512451172, 33.95090866088867, 35.464752197265625, 36.97859573364258, 38.492435455322266, 40.00627899169922, 41.520118713378906, 43.03396224975586, 44.54780578613281, 46.0616455078125, 47.57548522949219]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 9.0, 3.0, 5.0, 3.0, 8.0, 12.0, 13.0, 17.0, 23.0, 22.0, 24.0, 33.0, 33.0, 40.0, 42.0, 31.0, 43.0, 32.0, 43.0, 46.0, 32.0, 50.0, 35.0, 36.0, 36.0, 43.0, 35.0, 40.0, 30.0, 28.0, 26.0, 25.0, 12.0, 13.0, 17.0, 16.0, 11.0, 4.0, 7.0, 7.0, 6.0, 4.0, 6.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-8.234375, -7.9892578125, -7.744140625, -7.4990234375, -7.25390625, -7.0087890625, -6.763671875, -6.5185546875, -6.2734375, -6.0283203125, -5.783203125, -5.5380859375, -5.29296875, -5.0478515625, -4.802734375, -4.5576171875, -4.3125, -4.0673828125, -3.822265625, -3.5771484375, -3.33203125, -3.0869140625, -2.841796875, -2.5966796875, -2.3515625, -2.1064453125, -1.861328125, -1.6162109375, -1.37109375, -1.1259765625, -0.880859375, -0.6357421875, -0.390625, -0.1455078125, 0.099609375, 0.3447265625, 0.58984375, 0.8349609375, 1.080078125, 1.3251953125, 1.5703125, 1.8154296875, 2.060546875, 2.3056640625, 2.55078125, 2.7958984375, 3.041015625, 3.2861328125, 3.53125, 3.7763671875, 4.021484375, 4.2666015625, 4.51171875, 4.7568359375, 5.001953125, 5.2470703125, 5.4921875, 5.7373046875, 5.982421875, 6.2275390625, 6.47265625, 6.7177734375, 6.962890625, 7.2080078125, 7.453125]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 5.0, 9.0, 17.0, 16.0, 38.0, 66.0, 73.0, 123.0, 181.0, 312.0, 461.0, 611.0, 939.0, 1460.0, 2163.0, 3147.0, 4774.0, 7416.0, 11394.0, 17883.0, 28728.0, 46882.0, 80230.0, 155770.0, 309377.0, 162939.0, 82915.0, 48440.0, 29779.0, 18357.0, 11741.0, 7593.0, 5002.0, 3167.0, 2183.0, 1462.0, 949.0, 637.0, 456.0, 299.0, 206.0, 130.0, 70.0, 47.0, 41.0, 22.0, 20.0, 15.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3583984375, -1.31390380859375, -1.2694091796875, -1.22491455078125, -1.180419921875, -1.13592529296875, -1.0914306640625, -1.04693603515625, -1.00244140625, -0.95794677734375, -0.9134521484375, -0.86895751953125, -0.824462890625, -0.77996826171875, -0.7354736328125, -0.69097900390625, -0.646484375, -0.60198974609375, -0.5574951171875, -0.51300048828125, -0.468505859375, -0.42401123046875, -0.3795166015625, -0.33502197265625, -0.29052734375, -0.24603271484375, -0.2015380859375, -0.15704345703125, -0.112548828125, -0.06805419921875, -0.0235595703125, 0.02093505859375, 0.0654296875, 0.10992431640625, 0.1544189453125, 0.19891357421875, 0.243408203125, 0.28790283203125, 0.3323974609375, 0.37689208984375, 0.42138671875, 0.46588134765625, 0.5103759765625, 0.55487060546875, 0.599365234375, 0.64385986328125, 0.6883544921875, 0.73284912109375, 0.77734375, 0.82183837890625, 0.8663330078125, 0.91082763671875, 0.955322265625, 0.99981689453125, 1.0443115234375, 1.08880615234375, 1.13330078125, 1.17779541015625, 1.2222900390625, 1.26678466796875, 1.311279296875, 1.35577392578125, 1.4002685546875, 1.44476318359375, 1.4892578125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 3.0, 3.0, 4.0, 13.0, 9.0, 7.0, 17.0, 16.0, 17.0, 15.0, 22.0, 26.0, 32.0, 30.0, 36.0, 31.0, 27.0, 35.0, 47.0, 48.0, 37.0, 1066.0, 36.0, 31.0, 41.0, 35.0, 40.0, 36.0, 33.0, 34.0, 25.0, 19.0, 21.0, 22.0, 19.0, 15.0, 12.0, 15.0, 11.0, 9.0, 5.0, 5.0, 8.0, 3.0, 6.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.28125, -5.12994384765625, -4.9786376953125, -4.82733154296875, -4.676025390625, -4.52471923828125, -4.3734130859375, -4.22210693359375, -4.07080078125, -3.91949462890625, -3.7681884765625, -3.61688232421875, -3.465576171875, -3.31427001953125, -3.1629638671875, -3.01165771484375, -2.8603515625, -2.70904541015625, -2.5577392578125, -2.40643310546875, -2.255126953125, -2.10382080078125, -1.9525146484375, -1.80120849609375, -1.64990234375, -1.49859619140625, -1.3472900390625, -1.19598388671875, -1.044677734375, -0.89337158203125, -0.7420654296875, -0.59075927734375, -0.439453125, -0.28814697265625, -0.1368408203125, 0.01446533203125, 0.165771484375, 0.31707763671875, 0.4683837890625, 0.61968994140625, 0.77099609375, 0.92230224609375, 1.0736083984375, 1.22491455078125, 1.376220703125, 1.52752685546875, 1.6788330078125, 1.83013916015625, 1.9814453125, 2.13275146484375, 2.2840576171875, 2.43536376953125, 2.586669921875, 2.73797607421875, 2.8892822265625, 3.04058837890625, 3.19189453125, 3.34320068359375, 3.4945068359375, 3.64581298828125, 3.797119140625, 3.94842529296875, 4.0997314453125, 4.25103759765625, 4.40234375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 8.0, 5.0, 10.0, 7.0, 15.0, 36.0, 29.0, 57.0, 57.0, 103.0, 148.0, 208.0, 324.0, 456.0, 712.0, 1020.0, 1625.0, 2313.0, 3477.0, 5388.0, 8255.0, 12485.0, 19647.0, 31724.0, 52579.0, 90581.0, 184203.0, 1356565.0, 134356.0, 72712.0, 43284.0, 26562.0, 16622.0, 10650.0, 7013.0, 4569.0, 3069.0, 2059.0, 1400.0, 888.0, 634.0, 435.0, 293.0, 190.0, 127.0, 89.0, 49.0, 42.0, 23.0, 23.0, 7.0, 2.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.486328125, -1.4403228759765625, -1.394317626953125, -1.3483123779296875, -1.30230712890625, -1.2563018798828125, -1.210296630859375, -1.1642913818359375, -1.1182861328125, -1.0722808837890625, -1.026275634765625, -0.9802703857421875, -0.93426513671875, -0.8882598876953125, -0.842254638671875, -0.7962493896484375, -0.750244140625, -0.7042388916015625, -0.658233642578125, -0.6122283935546875, -0.56622314453125, -0.5202178955078125, -0.474212646484375, -0.4282073974609375, -0.3822021484375, -0.3361968994140625, -0.290191650390625, -0.2441864013671875, -0.19818115234375, -0.1521759033203125, -0.106170654296875, -0.0601654052734375, -0.01416015625, 0.0318450927734375, 0.077850341796875, 0.1238555908203125, 0.16986083984375, 0.2158660888671875, 0.261871337890625, 0.3078765869140625, 0.3538818359375, 0.3998870849609375, 0.445892333984375, 0.4918975830078125, 0.53790283203125, 0.5839080810546875, 0.629913330078125, 0.6759185791015625, 0.721923828125, 0.7679290771484375, 0.813934326171875, 0.8599395751953125, 0.90594482421875, 0.9519500732421875, 0.997955322265625, 1.0439605712890625, 1.0899658203125, 1.1359710693359375, 1.181976318359375, 1.2279815673828125, 1.27398681640625, 1.3199920654296875, 1.365997314453125, 1.4120025634765625, 1.4580078125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 8.0, 7.0, 9.0, 7.0, 4.0, 21.0, 28.0, 25.0, 30.0, 47.0, 54.0, 68.0, 71.0, 93.0, 68.0, 87.0, 81.0, 62.0, 59.0, 37.0, 32.0, 24.0, 19.0, 15.0, 8.0, 12.0, 3.0, 4.0, 3.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0009565353393554688, -0.0009300932288169861, -0.0009036511182785034, -0.0008772090077400208, -0.0008507668972015381, -0.0008243247866630554, -0.0007978826761245728, -0.0007714405655860901, -0.0007449984550476074, -0.0007185563445091248, -0.0006921142339706421, -0.0006656721234321594, -0.0006392300128936768, -0.0006127879023551941, -0.0005863457918167114, -0.0005599036812782288, -0.0005334615707397461, -0.0005070194602012634, -0.00048057734966278076, -0.0004541352391242981, -0.00042769312858581543, -0.00040125101804733276, -0.0003748089075088501, -0.00034836679697036743, -0.00032192468643188477, -0.0002954825758934021, -0.00026904046535491943, -0.00024259835481643677, -0.0002161562442779541, -0.00018971413373947144, -0.00016327202320098877, -0.0001368299126625061, -0.00011038780212402344, -8.394569158554077e-05, -5.7503581047058105e-05, -3.106147050857544e-05, -4.6193599700927734e-06, 2.1822750568389893e-05, 4.826486110687256e-05, 7.470697164535522e-05, 0.00010114908218383789, 0.00012759119272232056, 0.00015403330326080322, 0.0001804754137992859, 0.00020691752433776855, 0.00023335963487625122, 0.0002598017454147339, 0.00028624385595321655, 0.0003126859664916992, 0.0003391280770301819, 0.00036557018756866455, 0.0003920122981071472, 0.0004184544086456299, 0.00044489651918411255, 0.0004713386297225952, 0.0004977807402610779, 0.0005242228507995605, 0.0005506649613380432, 0.0005771070718765259, 0.0006035491824150085, 0.0006299912929534912, 0.0006564334034919739, 0.0006828755140304565, 0.0007093176245689392, 0.0007357597351074219]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 5.0, 5.0, 8.0, 10.0, 13.0, 12.0, 21.0, 25.0, 36.0, 53.0, 62.0, 129.0, 234.0, 588.0, 7248.0, 1037205.0, 1914.0, 426.0, 181.0, 119.0, 74.0, 59.0, 28.0, 22.0, 19.0, 12.0, 13.0, 9.0, 8.0, 5.0, 5.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0183258056640625, -0.017679929733276367, -0.017034053802490234, -0.0163881778717041, -0.01574230194091797, -0.015096426010131836, -0.014450550079345703, -0.01380467414855957, -0.013158798217773438, -0.012512922286987305, -0.011867046356201172, -0.011221170425415039, -0.010575294494628906, -0.009929418563842773, -0.00928354263305664, -0.008637666702270508, -0.007991790771484375, -0.007345914840698242, -0.006700038909912109, -0.0060541629791259766, -0.005408287048339844, -0.004762411117553711, -0.004116535186767578, -0.0034706592559814453, -0.0028247833251953125, -0.0021789073944091797, -0.0015330314636230469, -0.0008871555328369141, -0.00024127960205078125, 0.00040459632873535156, 0.0010504722595214844, 0.0016963481903076172, 0.00234222412109375, 0.002988100051879883, 0.0036339759826660156, 0.0042798519134521484, 0.004925727844238281, 0.005571603775024414, 0.006217479705810547, 0.00686335563659668, 0.0075092315673828125, 0.008155107498168945, 0.008800983428955078, 0.009446859359741211, 0.010092735290527344, 0.010738611221313477, 0.01138448715209961, 0.012030363082885742, 0.012676239013671875, 0.013322114944458008, 0.01396799087524414, 0.014613866806030273, 0.015259742736816406, 0.01590561866760254, 0.016551494598388672, 0.017197370529174805, 0.017843246459960938, 0.01848912239074707, 0.019134998321533203, 0.019780874252319336, 0.02042675018310547, 0.0210726261138916, 0.021718502044677734, 0.022364377975463867, 0.02301025390625]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 18.0, 30.0, 70.0, 106.0, 165.0, 191.0, 183.0, 124.0, 70.0, 25.0, 13.0, 4.0, 6.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006397537072189152, -0.0006200916832312942, -0.000600429717451334, -0.0005807676934637129, -0.0005611056694760919, -0.0005414436454884708, -0.0005217816215008497, -0.0005021196557208896, -0.0004824576317332685, -0.00046279560774564743, -0.0004431336128618568, -0.0004234716179780662, -0.00040380959399044514, -0.00038414757000282407, -0.00036448557511903346, -0.00034482358023524284, -0.0003251615562476218, -0.0003054995322600007, -0.0002858375373762101, -0.0002661755424924195, -0.0002465135185047984, -0.00022685150906909257, -0.00020718949963338673, -0.0001875274901976809, -0.00016786548076197505, -0.0001482034713262692, -0.00012854146189056337, -0.00010887945245485753, -8.921744301915169e-05, -6.955543358344585e-05, -4.9893424147740006e-05, -3.0231414712034166e-05, -1.0569463483989239e-05, 9.092545951716602e-06, 2.8754555387422442e-05, 4.841656482312828e-05, 6.807857425883412e-05, 8.774058369453996e-05, 0.0001074025931302458, 0.00012706460256595165, 0.00014672661200165749, 0.00016638862143736333, 0.00018605063087306917, 0.000205712640308775, 0.00022537464974448085, 0.0002450366737321019, 0.00026469866861589253, 0.00028436066349968314, 0.0003040226874873042, 0.0003236847114749253, 0.0003433467063587159, 0.0003630087012425065, 0.0003826707252301276, 0.00040233274921774864, 0.00042199474410153925, 0.00044165673898532987, 0.00046131876297295094, 0.000480980786960572, 0.0005006428109481931, 0.0005203047767281532, 0.0005399668007157743, 0.0005596288247033954, 0.0005792907904833555, 0.0005989528144709766, 0.0006186148384585977]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 12.0, 8.0, 8.0, 10.0, 9.0, 14.0, 13.0, 27.0, 18.0, 23.0, 32.0, 46.0, 33.0, 38.0, 33.0, 39.0, 39.0, 34.0, 58.0, 41.0, 51.0, 41.0, 39.0, 39.0, 38.0, 23.0, 33.0, 37.0, 23.0, 24.0, 14.0, 22.0, 15.0, 15.0, 13.0, 10.0, 6.0, 3.0, 5.0, 3.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00035965442657470703, -0.00034830905497074127, -0.0003369636833667755, -0.00032561831176280975, -0.000314272940158844, -0.00030292756855487823, -0.0002915821969509125, -0.0002802368253469467, -0.00026889145374298096, -0.0002575460821390152, -0.00024620071053504944, -0.00023485533893108368, -0.00022350996732711792, -0.00021216459572315216, -0.0002008192241191864, -0.00018947385251522064, -0.00017812848091125488, -0.00016678310930728912, -0.00015543773770332336, -0.0001440923660993576, -0.00013274699449539185, -0.00012140162289142609, -0.00011005625128746033, -9.871087968349457e-05, -8.736550807952881e-05, -7.602013647556305e-05, -6.467476487159729e-05, -5.332939326763153e-05, -4.198402166366577e-05, -3.063865005970001e-05, -1.9293278455734253e-05, -7.947906851768494e-06, 3.3974647521972656e-06, 1.4742836356163025e-05, 2.6088207960128784e-05, 3.7433579564094543e-05, 4.87789511680603e-05, 6.012432277202606e-05, 7.146969437599182e-05, 8.281506597995758e-05, 9.416043758392334e-05, 0.0001055058091878891, 0.00011685118079185486, 0.00012819655239582062, 0.00013954192399978638, 0.00015088729560375214, 0.0001622326672077179, 0.00017357803881168365, 0.00018492341041564941, 0.00019626878201961517, 0.00020761415362358093, 0.0002189595252275467, 0.00023030489683151245, 0.0002416502684354782, 0.00025299564003944397, 0.00026434101164340973, 0.0002756863832473755, 0.00028703175485134125, 0.000298377126455307, 0.00030972249805927277, 0.0003210678696632385, 0.0003324132412672043, 0.00034375861287117004, 0.0003551039844751358, 0.00036644935607910156]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 9.0, 3.0, 5.0, 3.0, 8.0, 12.0, 13.0, 17.0, 23.0, 22.0, 24.0, 33.0, 33.0, 40.0, 42.0, 31.0, 43.0, 32.0, 43.0, 46.0, 32.0, 50.0, 35.0, 36.0, 36.0, 43.0, 35.0, 40.0, 30.0, 28.0, 26.0, 25.0, 12.0, 13.0, 17.0, 16.0, 11.0, 4.0, 7.0, 7.0, 6.0, 4.0, 6.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-8.234375, -7.9892578125, -7.744140625, -7.4990234375, -7.25390625, -7.0087890625, -6.763671875, -6.5185546875, -6.2734375, -6.0283203125, -5.783203125, -5.5380859375, -5.29296875, -5.0478515625, -4.802734375, -4.5576171875, -4.3125, -4.0673828125, -3.822265625, -3.5771484375, -3.33203125, -3.0869140625, -2.841796875, -2.5966796875, -2.3515625, -2.1064453125, -1.861328125, -1.6162109375, -1.37109375, -1.1259765625, -0.880859375, -0.6357421875, -0.390625, -0.1455078125, 0.099609375, 0.3447265625, 0.58984375, 0.8349609375, 1.080078125, 1.3251953125, 1.5703125, 1.8154296875, 2.060546875, 2.3056640625, 2.55078125, 2.7958984375, 3.041015625, 3.2861328125, 3.53125, 3.7763671875, 4.021484375, 4.2666015625, 4.51171875, 4.7568359375, 5.001953125, 5.2470703125, 5.4921875, 5.7373046875, 5.982421875, 6.2275390625, 6.47265625, 6.7177734375, 6.962890625, 7.2080078125, 7.453125]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 2.0, 5.0, 9.0, 3.0, 12.0, 17.0, 22.0, 30.0, 37.0, 56.0, 62.0, 107.0, 136.0, 184.0, 360.0, 527.0, 1284.0, 2867.0, 8306.0, 26011.0, 88763.0, 396677.0, 395109.0, 88109.0, 25528.0, 8547.0, 2966.0, 1233.0, 575.0, 313.0, 203.0, 129.0, 99.0, 71.0, 47.0, 42.0, 30.0, 24.0, 18.0, 7.0, 6.0, 13.0, 5.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.21875, -7.95361328125, -7.6884765625, -7.42333984375, -7.158203125, -6.89306640625, -6.6279296875, -6.36279296875, -6.09765625, -5.83251953125, -5.5673828125, -5.30224609375, -5.037109375, -4.77197265625, -4.5068359375, -4.24169921875, -3.9765625, -3.71142578125, -3.4462890625, -3.18115234375, -2.916015625, -2.65087890625, -2.3857421875, -2.12060546875, -1.85546875, -1.59033203125, -1.3251953125, -1.06005859375, -0.794921875, -0.52978515625, -0.2646484375, 0.00048828125, 0.265625, 0.53076171875, 0.7958984375, 1.06103515625, 1.326171875, 1.59130859375, 1.8564453125, 2.12158203125, 2.38671875, 2.65185546875, 2.9169921875, 3.18212890625, 3.447265625, 3.71240234375, 3.9775390625, 4.24267578125, 4.5078125, 4.77294921875, 5.0380859375, 5.30322265625, 5.568359375, 5.83349609375, 6.0986328125, 6.36376953125, 6.62890625, 6.89404296875, 7.1591796875, 7.42431640625, 7.689453125, 7.95458984375, 8.2197265625, 8.48486328125, 8.75]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 2.0, 7.0, 7.0, 4.0, 9.0, 5.0, 9.0, 9.0, 10.0, 27.0, 17.0, 25.0, 30.0, 34.0, 32.0, 32.0, 43.0, 45.0, 41.0, 53.0, 80.0, 468.0, 1569.0, 100.0, 53.0, 44.0, 43.0, 36.0, 37.0, 24.0, 27.0, 22.0, 24.0, 17.0, 7.0, 13.0, 10.0, 8.0, 9.0, 7.0, 7.0, 4.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-21.875, -21.09423828125, -20.3134765625, -19.53271484375, -18.751953125, -17.97119140625, -17.1904296875, -16.40966796875, -15.62890625, -14.84814453125, -14.0673828125, -13.28662109375, -12.505859375, -11.72509765625, -10.9443359375, -10.16357421875, -9.3828125, -8.60205078125, -7.8212890625, -7.04052734375, -6.259765625, -5.47900390625, -4.6982421875, -3.91748046875, -3.13671875, -2.35595703125, -1.5751953125, -0.79443359375, -0.013671875, 0.76708984375, 1.5478515625, 2.32861328125, 3.109375, 3.89013671875, 4.6708984375, 5.45166015625, 6.232421875, 7.01318359375, 7.7939453125, 8.57470703125, 9.35546875, 10.13623046875, 10.9169921875, 11.69775390625, 12.478515625, 13.25927734375, 14.0400390625, 14.82080078125, 15.6015625, 16.38232421875, 17.1630859375, 17.94384765625, 18.724609375, 19.50537109375, 20.2861328125, 21.06689453125, 21.84765625, 22.62841796875, 23.4091796875, 24.18994140625, 24.970703125, 25.75146484375, 26.5322265625, 27.31298828125, 28.09375]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 6.0, 4.0, 10.0, 7.0, 19.0, 20.0, 19.0, 29.0, 26.0, 55.0, 61.0, 65.0, 97.0, 142.0, 215.0, 347.0, 855.0, 14172.0, 3116647.0, 10922.0, 752.0, 384.0, 230.0, 157.0, 118.0, 85.0, 64.0, 51.0, 41.0, 23.0, 15.0, 15.0, 16.0, 9.0, 13.0, 4.0, 2.0, 5.0, 0.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.0625, -56.0234375, -53.984375, -51.9453125, -49.90625, -47.8671875, -45.828125, -43.7890625, -41.75, -39.7109375, -37.671875, -35.6328125, -33.59375, -31.5546875, -29.515625, -27.4765625, -25.4375, -23.3984375, -21.359375, -19.3203125, -17.28125, -15.2421875, -13.203125, -11.1640625, -9.125, -7.0859375, -5.046875, -3.0078125, -0.96875, 1.0703125, 3.109375, 5.1484375, 7.1875, 9.2265625, 11.265625, 13.3046875, 15.34375, 17.3828125, 19.421875, 21.4609375, 23.5, 25.5390625, 27.578125, 29.6171875, 31.65625, 33.6953125, 35.734375, 37.7734375, 39.8125, 41.8515625, 43.890625, 45.9296875, 47.96875, 50.0078125, 52.046875, 54.0859375, 56.125, 58.1640625, 60.203125, 62.2421875, 64.28125, 66.3203125, 68.359375, 70.3984375, 72.4375]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 143.0, 745.0, 125.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.35588073730469, -49.089080810546875, -44.82228088378906, -40.55548095703125, -36.28868103027344, -32.021881103515625, -27.755077362060547, -23.488277435302734, -19.221477508544922, -14.95467758178711, -10.68787670135498, -6.421075820922852, -2.154275894165039, 2.1125240325927734, 6.379325866699219, 10.646125793457031, 14.912925720214844, 19.179725646972656, 23.44652557373047, 27.713327407836914, 31.980127334594727, 36.246925354003906, 40.513729095458984, 44.7805290222168, 49.04732894897461, 53.31412887573242, 57.580928802490234, 61.84773254394531, 66.11453247070312, 70.38133239746094, 74.64813232421875, 78.91493225097656, 83.18173217773438, 87.44853210449219, 91.71533203125, 95.98213195800781, 100.24893188476562, 104.51573181152344, 108.78253173828125, 113.04933166503906, 117.31613159179688, 121.58293151855469, 125.8497314453125, 130.1165313720703, 134.38333129882812, 138.65013122558594, 142.91693115234375, 147.18373107910156, 151.45053100585938, 155.7173309326172, 159.984130859375, 164.2509307861328, 168.51773071289062, 172.78453063964844, 177.05133056640625, 181.31813049316406, 185.58494567871094, 189.85174560546875, 194.11854553222656, 198.38534545898438, 202.6521453857422, 206.9189453125, 211.1857452392578, 215.45254516601562, 219.71934509277344]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 4.0, 8.0, 11.0, 11.0, 18.0, 22.0, 19.0, 20.0, 24.0, 21.0, 30.0, 31.0, 41.0, 38.0, 41.0, 39.0, 49.0, 51.0, 51.0, 49.0, 50.0, 46.0, 43.0, 48.0, 31.0, 36.0, 22.0, 24.0, 16.0, 22.0, 17.0, 12.0, 13.0, 8.0, 6.0, 8.0, 4.0, 4.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-70.66156005859375, -68.5843276977539, -66.50709533691406, -64.42985534667969, -62.352622985839844, -60.275390625, -58.19815444946289, -56.12091827392578, -54.04368591308594, -51.966453552246094, -49.889217376708984, -47.811981201171875, -45.73474884033203, -43.65751647949219, -41.58028030395508, -39.50304412841797, -37.425811767578125, -35.34857940673828, -33.27134323120117, -31.194108963012695, -29.11687469482422, -27.039640426635742, -24.962406158447266, -22.88517189025879, -20.807937622070312, -18.730703353881836, -16.65346908569336, -14.576234817504883, -12.499000549316406, -10.42176628112793, -8.344532012939453, -6.267297744750977, -4.190055847167969, -2.112821578979492, -0.035587310791015625, 2.041646957397461, 4.1188812255859375, 6.196115493774414, 8.27334976196289, 10.350584030151367, 12.427818298339844, 14.50505256652832, 16.582286834716797, 18.659521102905273, 20.73675537109375, 22.813989639282227, 24.891223907470703, 26.96845817565918, 29.045692443847656, 31.122926712036133, 33.20016098022461, 35.27739715576172, 37.35462951660156, 39.431861877441406, 41.509098052978516, 43.586334228515625, 45.66356658935547, 47.74079895019531, 49.81803512573242, 51.89527130126953, 53.972503662109375, 56.04973602294922, 58.12697219848633, 60.20420837402344, 62.28144073486328]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 5.0, 5.0, 6.0, 6.0, 7.0, 5.0, 4.0, 10.0, 13.0, 24.0, 20.0, 28.0, 23.0, 35.0, 33.0, 40.0, 27.0, 39.0, 37.0, 37.0, 34.0, 42.0, 54.0, 51.0, 32.0, 33.0, 33.0, 37.0, 40.0, 35.0, 35.0, 28.0, 27.0, 21.0, 16.0, 12.0, 14.0, 11.0, 12.0, 8.0, 7.0, 7.0, 2.0, 7.0, 6.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.4375, -8.18475341796875, -7.9320068359375, -7.67926025390625, -7.426513671875, -7.17376708984375, -6.9210205078125, -6.66827392578125, -6.41552734375, -6.16278076171875, -5.9100341796875, -5.65728759765625, -5.404541015625, -5.15179443359375, -4.8990478515625, -4.64630126953125, -4.3935546875, -4.14080810546875, -3.8880615234375, -3.63531494140625, -3.382568359375, -3.12982177734375, -2.8770751953125, -2.62432861328125, -2.37158203125, -2.11883544921875, -1.8660888671875, -1.61334228515625, -1.360595703125, -1.10784912109375, -0.8551025390625, -0.60235595703125, -0.349609375, -0.09686279296875, 0.1558837890625, 0.40863037109375, 0.661376953125, 0.91412353515625, 1.1668701171875, 1.41961669921875, 1.67236328125, 1.92510986328125, 2.1778564453125, 2.43060302734375, 2.683349609375, 2.93609619140625, 3.1888427734375, 3.44158935546875, 3.6943359375, 3.94708251953125, 4.1998291015625, 4.45257568359375, 4.705322265625, 4.95806884765625, 5.2108154296875, 5.46356201171875, 5.71630859375, 5.96905517578125, 6.2218017578125, 6.47454833984375, 6.727294921875, 6.98004150390625, 7.2327880859375, 7.48553466796875, 7.73828125]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 4.0, 7.0, 7.0, 6.0, 13.0, 14.0, 23.0, 18.0, 33.0, 26.0, 45.0, 51.0, 70.0, 100.0, 156.0, 223.0, 422.0, 1052.0, 4643.0, 76832.0, 2811875.0, 1270577.0, 23678.0, 2611.0, 728.0, 332.0, 190.0, 138.0, 88.0, 63.0, 49.0, 41.0, 25.0, 28.0, 20.0, 17.0, 5.0, 13.0, 6.0, 8.0, 7.0, 11.0, 6.0, 3.0, 2.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-25.15625, -24.39013671875, -23.6240234375, -22.85791015625, -22.091796875, -21.32568359375, -20.5595703125, -19.79345703125, -19.02734375, -18.26123046875, -17.4951171875, -16.72900390625, -15.962890625, -15.19677734375, -14.4306640625, -13.66455078125, -12.8984375, -12.13232421875, -11.3662109375, -10.60009765625, -9.833984375, -9.06787109375, -8.3017578125, -7.53564453125, -6.76953125, -6.00341796875, -5.2373046875, -4.47119140625, -3.705078125, -2.93896484375, -2.1728515625, -1.40673828125, -0.640625, 0.12548828125, 0.8916015625, 1.65771484375, 2.423828125, 3.18994140625, 3.9560546875, 4.72216796875, 5.48828125, 6.25439453125, 7.0205078125, 7.78662109375, 8.552734375, 9.31884765625, 10.0849609375, 10.85107421875, 11.6171875, 12.38330078125, 13.1494140625, 13.91552734375, 14.681640625, 15.44775390625, 16.2138671875, 16.97998046875, 17.74609375, 18.51220703125, 19.2783203125, 20.04443359375, 20.810546875, 21.57666015625, 22.3427734375, 23.10888671875, 23.875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 10.0, 18.0, 27.0, 34.0, 36.0, 36.0, 68.0, 121.0, 162.0, 205.0, 262.0, 388.0, 523.0, 550.0, 462.0, 322.0, 239.0, 150.0, 115.0, 79.0, 75.0, 47.0, 32.0, 31.0, 19.0, 19.0, 10.0, 8.0, 8.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-17.65625, -17.1954345703125, -16.734619140625, -16.2738037109375, -15.81298828125, -15.3521728515625, -14.891357421875, -14.4305419921875, -13.9697265625, -13.5089111328125, -13.048095703125, -12.5872802734375, -12.12646484375, -11.6656494140625, -11.204833984375, -10.7440185546875, -10.283203125, -9.8223876953125, -9.361572265625, -8.9007568359375, -8.43994140625, -7.9791259765625, -7.518310546875, -7.0574951171875, -6.5966796875, -6.1358642578125, -5.675048828125, -5.2142333984375, -4.75341796875, -4.2926025390625, -3.831787109375, -3.3709716796875, -2.91015625, -2.4493408203125, -1.988525390625, -1.5277099609375, -1.06689453125, -0.6060791015625, -0.145263671875, 0.3155517578125, 0.7763671875, 1.2371826171875, 1.697998046875, 2.1588134765625, 2.61962890625, 3.0804443359375, 3.541259765625, 4.0020751953125, 4.462890625, 4.9237060546875, 5.384521484375, 5.8453369140625, 6.30615234375, 6.7669677734375, 7.227783203125, 7.6885986328125, 8.1494140625, 8.6102294921875, 9.071044921875, 9.5318603515625, 9.99267578125, 10.4534912109375, 10.914306640625, 11.3751220703125, 11.8359375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 10.0, 6.0, 6.0, 22.0, 32.0, 27.0, 28.0, 48.0, 51.0, 69.0, 93.0, 128.0, 134.0, 182.0, 211.0, 385.0, 711.0, 8580.0, 4148277.0, 32738.0, 975.0, 442.0, 261.0, 235.0, 163.0, 108.0, 94.0, 65.0, 55.0, 40.0, 30.0, 32.0, 13.0, 16.0, 5.0, 2.0, 3.0, 7.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-88.875, -86.0625, -83.25, -80.4375, -77.625, -74.8125, -72.0, -69.1875, -66.375, -63.5625, -60.75, -57.9375, -55.125, -52.3125, -49.5, -46.6875, -43.875, -41.0625, -38.25, -35.4375, -32.625, -29.8125, -27.0, -24.1875, -21.375, -18.5625, -15.75, -12.9375, -10.125, -7.3125, -4.5, -1.6875, 1.125, 3.9375, 6.75, 9.5625, 12.375, 15.1875, 18.0, 20.8125, 23.625, 26.4375, 29.25, 32.0625, 34.875, 37.6875, 40.5, 43.3125, 46.125, 48.9375, 51.75, 54.5625, 57.375, 60.1875, 63.0, 65.8125, 68.625, 71.4375, 74.25, 77.0625, 79.875, 82.6875, 85.5, 88.3125, 91.125]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 83.0, 745.0, 182.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.27461242675781, -40.204444885253906, -29.134273529052734, -18.064102172851562, -6.993934631347656, 4.07623291015625, 15.146408081054688, 26.216575622558594, 37.2867431640625, 48.356910705566406, 59.42708206176758, 70.49725341796875, 81.56742095947266, 92.63758850097656, 103.707763671875, 114.7779312133789, 125.84809875488281, 136.91827392578125, 147.98843383789062, 159.05860900878906, 170.1287841796875, 181.19894409179688, 192.2691192626953, 203.33929443359375, 214.40945434570312, 225.47962951660156, 236.54978942871094, 247.61996459960938, 258.69012451171875, 269.76031494140625, 280.8304748535156, 291.900634765625, 302.9708251953125, 314.0409851074219, 325.1111755371094, 336.18133544921875, 347.2514953613281, 358.3216552734375, 369.391845703125, 380.4620056152344, 391.53216552734375, 402.6023254394531, 413.6725158691406, 424.74267578125, 435.8128356933594, 446.88299560546875, 457.95318603515625, 469.0233459472656, 480.0935363769531, 491.1636962890625, 502.23388671875, 513.3040771484375, 524.3742065429688, 535.4443969726562, 546.5145263671875, 557.584716796875, 568.6549072265625, 579.72509765625, 590.7952270507812, 601.8654174804688, 612.9356079101562, 624.0057373046875, 635.075927734375, 646.1461181640625, 657.2162475585938]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 3.0, 3.0, 6.0, 9.0, 6.0, 10.0, 15.0, 6.0, 17.0, 14.0, 14.0, 16.0, 24.0, 30.0, 30.0, 29.0, 36.0, 37.0, 28.0, 32.0, 41.0, 40.0, 39.0, 45.0, 37.0, 35.0, 42.0, 35.0, 38.0, 29.0, 28.0, 39.0, 39.0, 28.0, 27.0, 19.0, 15.0, 14.0, 10.0, 8.0, 8.0, 8.0, 3.0, 8.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.751800537109375, -38.419742584228516, -37.087684631347656, -35.7556266784668, -34.42356872558594, -33.091514587402344, -31.75945472717285, -30.427398681640625, -29.095340728759766, -27.763282775878906, -26.431224822998047, -25.099166870117188, -23.76711082458496, -22.4350528717041, -21.102994918823242, -19.770938873291016, -18.438879013061523, -17.106821060180664, -15.774764060974121, -14.442706108093262, -13.110649108886719, -11.77859115600586, -10.446533203125, -9.114476203918457, -7.782418251037598, -6.4503607749938965, -5.118303298950195, -3.786245346069336, -2.4541878700256348, -1.1221303939819336, 0.20992755889892578, 1.5419845581054688, 2.874042510986328, 4.206099987030029, 5.5381574630737305, 6.87021541595459, 8.202272415161133, 9.534330368041992, 10.866388320922852, 12.198445320129395, 13.530503273010254, 14.862561225891113, 16.194618225097656, 17.526676177978516, 18.858734130859375, 20.190792083740234, 21.522850036621094, 22.85490608215332, 24.18696403503418, 25.51902198791504, 26.8510799407959, 28.183135986328125, 29.515193939208984, 30.847251892089844, 32.1793098449707, 33.51136779785156, 34.84342575073242, 36.17548370361328, 37.50754165649414, 38.839599609375, 40.17165756225586, 41.50371551513672, 42.83576965332031, 44.16782760620117, 45.49988555908203]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 5.0, 3.0, 1.0, 9.0, 11.0, 12.0, 10.0, 14.0, 11.0, 18.0, 26.0, 27.0, 33.0, 28.0, 32.0, 34.0, 42.0, 34.0, 48.0, 40.0, 45.0, 31.0, 50.0, 35.0, 34.0, 46.0, 43.0, 28.0, 32.0, 34.0, 31.0, 20.0, 22.0, 23.0, 17.0, 13.0, 15.0, 5.0, 8.0, 5.0, 7.0, 5.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.2109375, -6.95849609375, -6.7060546875, -6.45361328125, -6.201171875, -5.94873046875, -5.6962890625, -5.44384765625, -5.19140625, -4.93896484375, -4.6865234375, -4.43408203125, -4.181640625, -3.92919921875, -3.6767578125, -3.42431640625, -3.171875, -2.91943359375, -2.6669921875, -2.41455078125, -2.162109375, -1.90966796875, -1.6572265625, -1.40478515625, -1.15234375, -0.89990234375, -0.6474609375, -0.39501953125, -0.142578125, 0.10986328125, 0.3623046875, 0.61474609375, 0.8671875, 1.11962890625, 1.3720703125, 1.62451171875, 1.876953125, 2.12939453125, 2.3818359375, 2.63427734375, 2.88671875, 3.13916015625, 3.3916015625, 3.64404296875, 3.896484375, 4.14892578125, 4.4013671875, 4.65380859375, 4.90625, 5.15869140625, 5.4111328125, 5.66357421875, 5.916015625, 6.16845703125, 6.4208984375, 6.67333984375, 6.92578125, 7.17822265625, 7.4306640625, 7.68310546875, 7.935546875, 8.18798828125, 8.4404296875, 8.69287109375, 8.9453125]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 5.0, 8.0, 10.0, 22.0, 21.0, 31.0, 49.0, 80.0, 100.0, 178.0, 234.0, 403.0, 557.0, 799.0, 1160.0, 1677.0, 2530.0, 3768.0, 5681.0, 8571.0, 13316.0, 20781.0, 33509.0, 56186.0, 99526.0, 220181.0, 287719.0, 119957.0, 65196.0, 38337.0, 23806.0, 15222.0, 9628.0, 6409.0, 4259.0, 2728.0, 1889.0, 1294.0, 880.0, 611.0, 421.0, 286.0, 177.0, 113.0, 93.0, 46.0, 41.0, 23.0, 21.0, 12.0, 5.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.5791015625, -1.52996826171875, -1.4808349609375, -1.43170166015625, -1.382568359375, -1.33343505859375, -1.2843017578125, -1.23516845703125, -1.18603515625, -1.13690185546875, -1.0877685546875, -1.03863525390625, -0.989501953125, -0.94036865234375, -0.8912353515625, -0.84210205078125, -0.79296875, -0.74383544921875, -0.6947021484375, -0.64556884765625, -0.596435546875, -0.54730224609375, -0.4981689453125, -0.44903564453125, -0.39990234375, -0.35076904296875, -0.3016357421875, -0.25250244140625, -0.203369140625, -0.15423583984375, -0.1051025390625, -0.05596923828125, -0.0068359375, 0.04229736328125, 0.0914306640625, 0.14056396484375, 0.189697265625, 0.23883056640625, 0.2879638671875, 0.33709716796875, 0.38623046875, 0.43536376953125, 0.4844970703125, 0.53363037109375, 0.582763671875, 0.63189697265625, 0.6810302734375, 0.73016357421875, 0.779296875, 0.82843017578125, 0.8775634765625, 0.92669677734375, 0.975830078125, 1.02496337890625, 1.0740966796875, 1.12322998046875, 1.17236328125, 1.22149658203125, 1.2706298828125, 1.31976318359375, 1.368896484375, 1.41802978515625, 1.4671630859375, 1.51629638671875, 1.5654296875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 7.0, 8.0, 5.0, 7.0, 13.0, 14.0, 9.0, 13.0, 10.0, 17.0, 30.0, 22.0, 36.0, 28.0, 26.0, 38.0, 41.0, 41.0, 37.0, 37.0, 53.0, 1064.0, 35.0, 41.0, 47.0, 47.0, 35.0, 26.0, 39.0, 33.0, 27.0, 24.0, 17.0, 16.0, 15.0, 19.0, 13.0, 10.0, 5.0, 5.0, 3.0, 8.0, 4.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.5546875, -5.38775634765625, -5.2208251953125, -5.05389404296875, -4.886962890625, -4.72003173828125, -4.5531005859375, -4.38616943359375, -4.21923828125, -4.05230712890625, -3.8853759765625, -3.71844482421875, -3.551513671875, -3.38458251953125, -3.2176513671875, -3.05072021484375, -2.8837890625, -2.71685791015625, -2.5499267578125, -2.38299560546875, -2.216064453125, -2.04913330078125, -1.8822021484375, -1.71527099609375, -1.54833984375, -1.38140869140625, -1.2144775390625, -1.04754638671875, -0.880615234375, -0.71368408203125, -0.5467529296875, -0.37982177734375, -0.212890625, -0.04595947265625, 0.1209716796875, 0.28790283203125, 0.454833984375, 0.62176513671875, 0.7886962890625, 0.95562744140625, 1.12255859375, 1.28948974609375, 1.4564208984375, 1.62335205078125, 1.790283203125, 1.95721435546875, 2.1241455078125, 2.29107666015625, 2.4580078125, 2.62493896484375, 2.7918701171875, 2.95880126953125, 3.125732421875, 3.29266357421875, 3.4595947265625, 3.62652587890625, 3.79345703125, 3.96038818359375, 4.1273193359375, 4.29425048828125, 4.461181640625, 4.62811279296875, 4.7950439453125, 4.96197509765625, 5.12890625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 2.0, 3.0, 4.0, 3.0, 8.0, 11.0, 21.0, 24.0, 36.0, 71.0, 74.0, 111.0, 170.0, 234.0, 355.0, 464.0, 724.0, 999.0, 1500.0, 2325.0, 3266.0, 5121.0, 7627.0, 11432.0, 18300.0, 29260.0, 48011.0, 81870.0, 154466.0, 1367517.0, 152529.0, 81128.0, 47689.0, 28892.0, 17964.0, 11582.0, 7693.0, 5066.0, 3343.0, 2323.0, 1567.0, 1068.0, 747.0, 493.0, 313.0, 249.0, 150.0, 89.0, 75.0, 66.0, 38.0, 17.0, 15.0, 13.0, 12.0, 4.0, 0.0, 5.0, 2.0, 2.0, 1.0], "bins": [-1.546875, -1.499267578125, -1.45166015625, -1.404052734375, -1.3564453125, -1.308837890625, -1.26123046875, -1.213623046875, -1.166015625, -1.118408203125, -1.07080078125, -1.023193359375, -0.9755859375, -0.927978515625, -0.88037109375, -0.832763671875, -0.78515625, -0.737548828125, -0.68994140625, -0.642333984375, -0.5947265625, -0.547119140625, -0.49951171875, -0.451904296875, -0.404296875, -0.356689453125, -0.30908203125, -0.261474609375, -0.2138671875, -0.166259765625, -0.11865234375, -0.071044921875, -0.0234375, 0.024169921875, 0.07177734375, 0.119384765625, 0.1669921875, 0.214599609375, 0.26220703125, 0.309814453125, 0.357421875, 0.405029296875, 0.45263671875, 0.500244140625, 0.5478515625, 0.595458984375, 0.64306640625, 0.690673828125, 0.73828125, 0.785888671875, 0.83349609375, 0.881103515625, 0.9287109375, 0.976318359375, 1.02392578125, 1.071533203125, 1.119140625, 1.166748046875, 1.21435546875, 1.261962890625, 1.3095703125, 1.357177734375, 1.40478515625, 1.452392578125, 1.5]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 7.0, 5.0, 6.0, 8.0, 13.0, 8.0, 13.0, 16.0, 11.0, 17.0, 17.0, 29.0, 26.0, 36.0, 49.0, 41.0, 54.0, 42.0, 57.0, 56.0, 56.0, 50.0, 56.0, 31.0, 44.0, 37.0, 38.0, 29.0, 19.0, 19.0, 17.0, 16.0, 12.0, 12.0, 7.0, 13.0, 6.0, 4.0, 7.0, 6.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0008029937744140625, -0.0007777810096740723, -0.000752568244934082, -0.0007273554801940918, -0.0007021427154541016, -0.0006769299507141113, -0.0006517171859741211, -0.0006265044212341309, -0.0006012916564941406, -0.0005760788917541504, -0.0005508661270141602, -0.0005256533622741699, -0.0005004405975341797, -0.00047522783279418945, -0.0004500150680541992, -0.000424802303314209, -0.00039958953857421875, -0.0003743767738342285, -0.0003491640090942383, -0.00032395124435424805, -0.0002987384796142578, -0.0002735257148742676, -0.00024831295013427734, -0.0002231001853942871, -0.00019788742065429688, -0.00017267465591430664, -0.0001474618911743164, -0.00012224912643432617, -9.703636169433594e-05, -7.18235969543457e-05, -4.661083221435547e-05, -2.1398067474365234e-05, 3.814697265625e-06, 2.9027462005615234e-05, 5.424022674560547e-05, 7.94529914855957e-05, 0.00010466575622558594, 0.00012987852096557617, 0.0001550912857055664, 0.00018030405044555664, 0.00020551681518554688, 0.0002307295799255371, 0.00025594234466552734, 0.0002811551094055176, 0.0003063678741455078, 0.00033158063888549805, 0.0003567934036254883, 0.0003820061683654785, 0.00040721893310546875, 0.000432431697845459, 0.0004576444625854492, 0.00048285722732543945, 0.0005080699920654297, 0.0005332827568054199, 0.0005584955215454102, 0.0005837082862854004, 0.0006089210510253906, 0.0006341338157653809, 0.0006593465805053711, 0.0006845593452453613, 0.0007097721099853516, 0.0007349848747253418, 0.000760197639465332, 0.0007854104042053223, 0.0008106231689453125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 7.0, 5.0, 6.0, 8.0, 13.0, 12.0, 25.0, 15.0, 28.0, 26.0, 36.0, 47.0, 58.0, 67.0, 90.0, 144.0, 324.0, 853.0, 54178.0, 989728.0, 1713.0, 455.0, 193.0, 111.0, 101.0, 64.0, 46.0, 34.0, 25.0, 21.0, 21.0, 20.0, 18.0, 15.0, 5.0, 10.0, 9.0, 1.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.018951416015625, -0.01834392547607422, -0.017736434936523438, -0.017128944396972656, -0.016521453857421875, -0.015913963317871094, -0.015306472778320312, -0.014698982238769531, -0.01409149169921875, -0.013484001159667969, -0.012876510620117188, -0.012269020080566406, -0.011661529541015625, -0.011054039001464844, -0.010446548461914062, -0.009839057922363281, -0.0092315673828125, -0.008624076843261719, -0.008016586303710938, -0.007409095764160156, -0.006801605224609375, -0.006194114685058594, -0.0055866241455078125, -0.004979133605957031, -0.00437164306640625, -0.0037641525268554688, -0.0031566619873046875, -0.0025491714477539062, -0.001941680908203125, -0.0013341903686523438, -0.0007266998291015625, -0.00011920928955078125, 0.00048828125, 0.0010957717895507812, 0.0017032623291015625, 0.0023107528686523438, 0.002918243408203125, 0.0035257339477539062, 0.0041332244873046875, 0.004740715026855469, 0.00534820556640625, 0.005955696105957031, 0.0065631866455078125, 0.007170677185058594, 0.007778167724609375, 0.008385658264160156, 0.008993148803710938, 0.009600639343261719, 0.0102081298828125, 0.010815620422363281, 0.011423110961914062, 0.012030601501464844, 0.012638092041015625, 0.013245582580566406, 0.013853073120117188, 0.014460563659667969, 0.01506805419921875, 0.01567554473876953, 0.016283035278320312, 0.016890525817871094, 0.017498016357421875, 0.018105506896972656, 0.018712997436523438, 0.01932048797607422, 0.019927978515625]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 6.0, 11.0, 19.0, 39.0, 62.0, 120.0, 114.0, 176.0, 168.0, 111.0, 78.0, 49.0, 24.0, 14.0, 8.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00031856464920565486, -0.0003005580510944128, -0.00028255145298317075, -0.0002645448548719287, -0.00024653825676068664, -0.00022853164409752935, -0.00021052503143437207, -0.00019251843332313, -0.00017451183521188796, -0.0001565052371006459, -0.00013849863898940384, -0.00012049202632624656, -0.0001024854282150045, -8.447883010376245e-05, -6.647222471656278e-05, -4.846561932936311e-05, -3.0459021218121052e-05, -1.2452419468900189e-05, 5.554182280320674e-06, 2.3560784029541537e-05, 4.15673857787624e-05, 5.9573983890004456e-05, 7.758058927720413e-05, 9.55871946644038e-05, 0.00011359379277564585, 0.0001316003908868879, 0.00014960698899812996, 0.00016761360166128725, 0.0001856201997725293, 0.00020362679788377136, 0.00022163341054692864, 0.0002396400086581707, 0.00025764660676941276, 0.0002756532048806548, 0.00029365980299189687, 0.0003116664011031389, 0.000329672999214381, 0.00034767959732562304, 0.00036568622454069555, 0.0003836928226519376, 0.00040169942076317966, 0.0004197060188744217, 0.00043771261698566377, 0.00045571921509690583, 0.00047372584231197834, 0.0004917324404232204, 0.0005097390385344625, 0.0005277456366457045, 0.0005457522347569466, 0.0005637588328681886, 0.0005817654309794307, 0.0005997720290906727, 0.0006177786272019148, 0.0006357852253131568, 0.0006537918234243989, 0.0006717984797433019, 0.000689805019646883, 0.0007078116177581251, 0.0007258182158693671, 0.0007438248139806092, 0.0007618314120918512, 0.0007798380102030933, 0.0007978446083143353, 0.0008158512646332383, 0.0008338578627444804]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 4.0, 8.0, 8.0, 9.0, 7.0, 9.0, 12.0, 20.0, 21.0, 30.0, 30.0, 31.0, 33.0, 23.0, 28.0, 35.0, 33.0, 42.0, 40.0, 43.0, 35.0, 46.0, 33.0, 45.0, 38.0, 30.0, 36.0, 36.0, 25.0, 30.0, 21.0, 23.0, 20.0, 15.0, 17.0, 8.0, 16.0, 14.0, 10.0, 9.0, 9.0, 5.0, 3.0, 4.0, 8.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004393458366394043, -0.00042517390102148056, -0.0004110019654035568, -0.0003968300297856331, -0.00038265809416770935, -0.0003684861585497856, -0.0003543142229318619, -0.00034014228731393814, -0.0003259703516960144, -0.00031179841607809067, -0.00029762648046016693, -0.0002834545448422432, -0.00026928260922431946, -0.0002551106736063957, -0.00024093873798847198, -0.00022676680237054825, -0.0002125948667526245, -0.00019842293113470078, -0.00018425099551677704, -0.0001700790598988533, -0.00015590712428092957, -0.00014173518866300583, -0.0001275632530450821, -0.00011339131742715836, -9.921938180923462e-05, -8.504744619131088e-05, -7.087551057338715e-05, -5.670357495546341e-05, -4.253163933753967e-05, -2.8359703719615936e-05, -1.41877681016922e-05, -1.5832483768463135e-08, 1.4156103134155273e-05, 2.832803875207901e-05, 4.2499974370002747e-05, 5.667190998792648e-05, 7.084384560585022e-05, 8.501578122377396e-05, 9.918771684169769e-05, 0.00011335965245962143, 0.00012753158807754517, 0.0001417035236954689, 0.00015587545931339264, 0.00017004739493131638, 0.0001842193305492401, 0.00019839126616716385, 0.00021256320178508759, 0.00022673513740301132, 0.00024090707302093506, 0.0002550790086388588, 0.00026925094425678253, 0.00028342287987470627, 0.00029759481549263, 0.00031176675111055374, 0.0003259386867284775, 0.0003401106223464012, 0.00035428255796432495, 0.0003684544935822487, 0.0003826264292001724, 0.00039679836481809616, 0.0004109703004360199, 0.00042514223605394363, 0.00043931417167186737, 0.0004534861072897911, 0.00046765804290771484]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 5.0, 3.0, 1.0, 9.0, 11.0, 12.0, 10.0, 14.0, 10.0, 19.0, 26.0, 27.0, 33.0, 28.0, 32.0, 34.0, 42.0, 34.0, 48.0, 40.0, 45.0, 31.0, 50.0, 35.0, 34.0, 46.0, 43.0, 28.0, 32.0, 34.0, 31.0, 20.0, 22.0, 23.0, 17.0, 13.0, 15.0, 5.0, 8.0, 5.0, 7.0, 5.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.2109375, -6.95849609375, -6.7060546875, -6.45361328125, -6.201171875, -5.94873046875, -5.6962890625, -5.44384765625, -5.19140625, -4.93896484375, -4.6865234375, -4.43408203125, -4.181640625, -3.92919921875, -3.6767578125, -3.42431640625, -3.171875, -2.91943359375, -2.6669921875, -2.41455078125, -2.162109375, -1.90966796875, -1.6572265625, -1.40478515625, -1.15234375, -0.89990234375, -0.6474609375, -0.39501953125, -0.142578125, 0.10986328125, 0.3623046875, 0.61474609375, 0.8671875, 1.11962890625, 1.3720703125, 1.62451171875, 1.876953125, 2.12939453125, 2.3818359375, 2.63427734375, 2.88671875, 3.13916015625, 3.3916015625, 3.64404296875, 3.896484375, 4.14892578125, 4.4013671875, 4.65380859375, 4.90625, 5.15869140625, 5.4111328125, 5.66357421875, 5.916015625, 6.16845703125, 6.4208984375, 6.67333984375, 6.92578125, 7.17822265625, 7.4306640625, 7.68310546875, 7.935546875, 8.18798828125, 8.4404296875, 8.69287109375, 8.9453125]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 1.0, 7.0, 5.0, 9.0, 15.0, 17.0, 20.0, 24.0, 19.0, 44.0, 54.0, 64.0, 109.0, 141.0, 221.0, 352.0, 584.0, 1146.0, 2849.0, 10364.0, 66836.0, 727810.0, 205763.0, 23388.0, 4848.0, 1751.0, 793.0, 441.0, 270.0, 160.0, 110.0, 87.0, 52.0, 49.0, 33.0, 25.0, 24.0, 18.0, 9.0, 10.0, 7.0, 7.0, 5.0, 5.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.40625, -12.939697265625, -12.47314453125, -12.006591796875, -11.5400390625, -11.073486328125, -10.60693359375, -10.140380859375, -9.673828125, -9.207275390625, -8.74072265625, -8.274169921875, -7.8076171875, -7.341064453125, -6.87451171875, -6.407958984375, -5.94140625, -5.474853515625, -5.00830078125, -4.541748046875, -4.0751953125, -3.608642578125, -3.14208984375, -2.675537109375, -2.208984375, -1.742431640625, -1.27587890625, -0.809326171875, -0.3427734375, 0.123779296875, 0.59033203125, 1.056884765625, 1.5234375, 1.989990234375, 2.45654296875, 2.923095703125, 3.3896484375, 3.856201171875, 4.32275390625, 4.789306640625, 5.255859375, 5.722412109375, 6.18896484375, 6.655517578125, 7.1220703125, 7.588623046875, 8.05517578125, 8.521728515625, 8.98828125, 9.454833984375, 9.92138671875, 10.387939453125, 10.8544921875, 11.321044921875, 11.78759765625, 12.254150390625, 12.720703125, 13.187255859375, 13.65380859375, 14.120361328125, 14.5869140625, 15.053466796875, 15.52001953125, 15.986572265625, 16.453125]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 8.0, 4.0, 8.0, 11.0, 16.0, 15.0, 14.0, 20.0, 22.0, 30.0, 36.0, 48.0, 55.0, 54.0, 61.0, 64.0, 189.0, 1834.0, 146.0, 55.0, 45.0, 39.0, 50.0, 48.0, 39.0, 30.0, 9.0, 25.0, 20.0, 11.0, 11.0, 8.0, 7.0, 4.0, 4.0, 6.0, 2.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.171875, -23.181396484375, -22.19091796875, -21.200439453125, -20.2099609375, -19.219482421875, -18.22900390625, -17.238525390625, -16.248046875, -15.257568359375, -14.26708984375, -13.276611328125, -12.2861328125, -11.295654296875, -10.30517578125, -9.314697265625, -8.32421875, -7.333740234375, -6.34326171875, -5.352783203125, -4.3623046875, -3.371826171875, -2.38134765625, -1.390869140625, -0.400390625, 0.590087890625, 1.58056640625, 2.571044921875, 3.5615234375, 4.552001953125, 5.54248046875, 6.532958984375, 7.5234375, 8.513916015625, 9.50439453125, 10.494873046875, 11.4853515625, 12.475830078125, 13.46630859375, 14.456787109375, 15.447265625, 16.437744140625, 17.42822265625, 18.418701171875, 19.4091796875, 20.399658203125, 21.39013671875, 22.380615234375, 23.37109375, 24.361572265625, 25.35205078125, 26.342529296875, 27.3330078125, 28.323486328125, 29.31396484375, 30.304443359375, 31.294921875, 32.285400390625, 33.27587890625, 34.266357421875, 35.2568359375, 36.247314453125, 37.23779296875, 38.228271484375, 39.21875]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 9.0, 5.0, 6.0, 8.0, 10.0, 14.0, 18.0, 17.0, 22.0, 27.0, 39.0, 46.0, 71.0, 93.0, 168.0, 260.0, 880.0, 18017.0, 3120481.0, 4276.0, 511.0, 223.0, 139.0, 96.0, 68.0, 40.0, 36.0, 29.0, 20.0, 12.0, 18.0, 12.0, 12.0, 11.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0], "bins": [-116.5625, -113.5986328125, -110.634765625, -107.6708984375, -104.70703125, -101.7431640625, -98.779296875, -95.8154296875, -92.8515625, -89.8876953125, -86.923828125, -83.9599609375, -80.99609375, -78.0322265625, -75.068359375, -72.1044921875, -69.140625, -66.1767578125, -63.212890625, -60.2490234375, -57.28515625, -54.3212890625, -51.357421875, -48.3935546875, -45.4296875, -42.4658203125, -39.501953125, -36.5380859375, -33.57421875, -30.6103515625, -27.646484375, -24.6826171875, -21.71875, -18.7548828125, -15.791015625, -12.8271484375, -9.86328125, -6.8994140625, -3.935546875, -0.9716796875, 1.9921875, 4.9560546875, 7.919921875, 10.8837890625, 13.84765625, 16.8115234375, 19.775390625, 22.7392578125, 25.703125, 28.6669921875, 31.630859375, 34.5947265625, 37.55859375, 40.5224609375, 43.486328125, 46.4501953125, 49.4140625, 52.3779296875, 55.341796875, 58.3056640625, 61.26953125, 64.2333984375, 67.197265625, 70.1611328125, 73.125]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 47.0, 563.0, 383.0, 23.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.39124298095703, -23.571990966796875, -18.75273895263672, -13.93348503112793, -9.114233016967773, -4.294981002807617, 0.5242729187011719, 5.343524932861328, 10.162776947021484, 14.98202896118164, 19.801280975341797, 24.620534896850586, 29.439786911010742, 34.25904083251953, 39.07829284667969, 43.897544860839844, 48.716796875, 53.536048889160156, 58.35530090332031, 63.17455291748047, 67.99380493164062, 72.81305694580078, 77.63230895996094, 82.45156860351562, 87.27081298828125, 92.0900650024414, 96.90931701660156, 101.72856903076172, 106.54782104492188, 111.36707305908203, 116.18632507324219, 121.00558471679688, 125.82484436035156, 130.64410400390625, 135.46334838867188, 140.28260803222656, 145.1018524169922, 149.92111206054688, 154.7403564453125, 159.5596160888672, 164.3788604736328, 169.1981201171875, 174.01736450195312, 178.8366241455078, 183.65586853027344, 188.47512817382812, 193.29437255859375, 198.11363220214844, 202.93289184570312, 207.7521514892578, 212.57139587402344, 217.39065551757812, 222.20989990234375, 227.02915954589844, 231.84840393066406, 236.66766357421875, 241.48690795898438, 246.30616760253906, 251.1254119873047, 255.94467163085938, 260.763916015625, 265.5831604003906, 270.4024353027344, 275.2216796875, 280.0409240722656]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 3.0, 6.0, 4.0, 6.0, 5.0, 9.0, 12.0, 13.0, 17.0, 12.0, 18.0, 24.0, 23.0, 27.0, 28.0, 32.0, 25.0, 23.0, 38.0, 43.0, 31.0, 41.0, 40.0, 43.0, 29.0, 43.0, 48.0, 37.0, 47.0, 26.0, 29.0, 33.0, 31.0, 20.0, 19.0, 25.0, 22.0, 12.0, 12.0, 10.0, 2.0, 4.0, 5.0, 5.0, 6.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-78.53504943847656, -76.17727661132812, -73.81950378417969, -71.46173095703125, -69.10395812988281, -66.74617767333984, -64.3884048461914, -62.03063201904297, -59.67285919189453, -57.315086364746094, -54.957313537597656, -52.59953689575195, -50.241764068603516, -47.88399124145508, -45.526214599609375, -43.16844177246094, -40.8106689453125, -38.45289611816406, -36.095123291015625, -33.73734664916992, -31.379573822021484, -29.021800994873047, -26.664026260375977, -24.306251525878906, -21.94847869873047, -19.59070587158203, -17.23293113708496, -14.875157356262207, -12.517383575439453, -10.1596097946167, -7.801836013793945, -5.444061279296875, -3.0862884521484375, -0.7285146713256836, 1.6292591094970703, 3.987032890319824, 6.344806671142578, 8.702580451965332, 11.060354232788086, 13.418128967285156, 15.775901794433594, 18.13367462158203, 20.4914493560791, 22.849224090576172, 25.20699691772461, 27.564769744873047, 29.922544479370117, 32.28031921386719, 34.638092041015625, 36.99586486816406, 39.3536376953125, 41.7114143371582, 44.06918716430664, 46.42695999145508, 48.78473663330078, 51.14250946044922, 53.500282287597656, 55.858055114746094, 58.21582794189453, 60.573604583740234, 62.93137741088867, 65.28915405273438, 67.64692687988281, 70.00469970703125, 72.36247253417969]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 4.0, 4.0, 2.0, 2.0, 3.0, 3.0, 5.0, 8.0, 8.0, 14.0, 9.0, 8.0, 12.0, 14.0, 31.0, 32.0, 26.0, 29.0, 34.0, 31.0, 40.0, 40.0, 36.0, 35.0, 31.0, 51.0, 45.0, 39.0, 38.0, 37.0, 32.0, 35.0, 42.0, 31.0, 26.0, 28.0, 27.0, 19.0, 17.0, 13.0, 18.0, 8.0, 6.0, 9.0, 7.0, 7.0, 1.0, 3.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.89453125, -7.63104248046875, -7.3675537109375, -7.10406494140625, -6.840576171875, -6.57708740234375, -6.3135986328125, -6.05010986328125, -5.78662109375, -5.52313232421875, -5.2596435546875, -4.99615478515625, -4.732666015625, -4.46917724609375, -4.2056884765625, -3.94219970703125, -3.6787109375, -3.41522216796875, -3.1517333984375, -2.88824462890625, -2.624755859375, -2.36126708984375, -2.0977783203125, -1.83428955078125, -1.57080078125, -1.30731201171875, -1.0438232421875, -0.78033447265625, -0.516845703125, -0.25335693359375, 0.0101318359375, 0.27362060546875, 0.537109375, 0.80059814453125, 1.0640869140625, 1.32757568359375, 1.591064453125, 1.85455322265625, 2.1180419921875, 2.38153076171875, 2.64501953125, 2.90850830078125, 3.1719970703125, 3.43548583984375, 3.698974609375, 3.96246337890625, 4.2259521484375, 4.48944091796875, 4.7529296875, 5.01641845703125, 5.2799072265625, 5.54339599609375, 5.806884765625, 6.07037353515625, 6.3338623046875, 6.59735107421875, 6.86083984375, 7.12432861328125, 7.3878173828125, 7.65130615234375, 7.914794921875, 8.17828369140625, 8.4417724609375, 8.70526123046875, 8.96875]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 5.0, 4.0, 5.0, 5.0, 5.0, 6.0, 16.0, 9.0, 10.0, 25.0, 33.0, 38.0, 42.0, 50.0, 80.0, 119.0, 127.0, 203.0, 307.0, 469.0, 919.0, 1708.0, 3551.0, 8965.0, 28523.0, 112309.0, 446083.0, 1215584.0, 1447833.0, 675357.0, 185081.0, 44107.0, 12812.0, 4717.0, 2185.0, 1069.0, 677.0, 373.0, 228.0, 167.0, 123.0, 74.0, 64.0, 50.0, 30.0, 29.0, 26.0, 10.0, 12.0, 21.0, 13.0, 7.0, 6.0, 6.0, 7.0, 2.0, 1.0, 5.0], "bins": [-9.6484375, -9.3660888671875, -9.083740234375, -8.8013916015625, -8.51904296875, -8.2366943359375, -7.954345703125, -7.6719970703125, -7.3896484375, -7.1072998046875, -6.824951171875, -6.5426025390625, -6.26025390625, -5.9779052734375, -5.695556640625, -5.4132080078125, -5.130859375, -4.8485107421875, -4.566162109375, -4.2838134765625, -4.00146484375, -3.7191162109375, -3.436767578125, -3.1544189453125, -2.8720703125, -2.5897216796875, -2.307373046875, -2.0250244140625, -1.74267578125, -1.4603271484375, -1.177978515625, -0.8956298828125, -0.61328125, -0.3309326171875, -0.048583984375, 0.2337646484375, 0.51611328125, 0.7984619140625, 1.080810546875, 1.3631591796875, 1.6455078125, 1.9278564453125, 2.210205078125, 2.4925537109375, 2.77490234375, 3.0572509765625, 3.339599609375, 3.6219482421875, 3.904296875, 4.1866455078125, 4.468994140625, 4.7513427734375, 5.03369140625, 5.3160400390625, 5.598388671875, 5.8807373046875, 6.1630859375, 6.4454345703125, 6.727783203125, 7.0101318359375, 7.29248046875, 7.5748291015625, 7.857177734375, 8.1395263671875, 8.421875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 7.0, 11.0, 11.0, 10.0, 14.0, 19.0, 36.0, 40.0, 54.0, 73.0, 84.0, 133.0, 150.0, 190.0, 265.0, 350.0, 406.0, 425.0, 380.0, 364.0, 240.0, 180.0, 146.0, 115.0, 92.0, 77.0, 44.0, 44.0, 21.0, 30.0, 14.0, 10.0, 15.0, 9.0, 5.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.3984375, -12.9422607421875, -12.486083984375, -12.0299072265625, -11.57373046875, -11.1175537109375, -10.661376953125, -10.2052001953125, -9.7490234375, -9.2928466796875, -8.836669921875, -8.3804931640625, -7.92431640625, -7.4681396484375, -7.011962890625, -6.5557861328125, -6.099609375, -5.6434326171875, -5.187255859375, -4.7310791015625, -4.27490234375, -3.8187255859375, -3.362548828125, -2.9063720703125, -2.4501953125, -1.9940185546875, -1.537841796875, -1.0816650390625, -0.62548828125, -0.1693115234375, 0.286865234375, 0.7430419921875, 1.19921875, 1.6553955078125, 2.111572265625, 2.5677490234375, 3.02392578125, 3.4801025390625, 3.936279296875, 4.3924560546875, 4.8486328125, 5.3048095703125, 5.760986328125, 6.2171630859375, 6.67333984375, 7.1295166015625, 7.585693359375, 8.0418701171875, 8.498046875, 8.9542236328125, 9.410400390625, 9.8665771484375, 10.32275390625, 10.7789306640625, 11.235107421875, 11.6912841796875, 12.1474609375, 12.6036376953125, 13.059814453125, 13.5159912109375, 13.97216796875, 14.4283447265625, 14.884521484375, 15.3406982421875, 15.796875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 2.0, 8.0, 16.0, 13.0, 27.0, 22.0, 37.0, 53.0, 76.0, 84.0, 94.0, 130.0, 199.0, 218.0, 296.0, 432.0, 866.0, 5894.0, 3563987.0, 616856.0, 2812.0, 637.0, 368.0, 274.0, 213.0, 144.0, 105.0, 115.0, 64.0, 77.0, 48.0, 27.0, 21.0, 22.0, 8.0, 9.0, 5.0, 6.0, 7.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-73.625, -71.3154296875, -69.005859375, -66.6962890625, -64.38671875, -62.0771484375, -59.767578125, -57.4580078125, -55.1484375, -52.8388671875, -50.529296875, -48.2197265625, -45.91015625, -43.6005859375, -41.291015625, -38.9814453125, -36.671875, -34.3623046875, -32.052734375, -29.7431640625, -27.43359375, -25.1240234375, -22.814453125, -20.5048828125, -18.1953125, -15.8857421875, -13.576171875, -11.2666015625, -8.95703125, -6.6474609375, -4.337890625, -2.0283203125, 0.28125, 2.5908203125, 4.900390625, 7.2099609375, 9.51953125, 11.8291015625, 14.138671875, 16.4482421875, 18.7578125, 21.0673828125, 23.376953125, 25.6865234375, 27.99609375, 30.3056640625, 32.615234375, 34.9248046875, 37.234375, 39.5439453125, 41.853515625, 44.1630859375, 46.47265625, 48.7822265625, 51.091796875, 53.4013671875, 55.7109375, 58.0205078125, 60.330078125, 62.6396484375, 64.94921875, 67.2587890625, 69.568359375, 71.8779296875, 74.1875]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 14.0, 332.0, 604.0, 64.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.36856842041016, -83.17698669433594, -72.98539733886719, -62.79381561279297, -52.602230072021484, -42.41064453125, -32.21906280517578, -22.02747344970703, -11.835891723632812, -1.6443071365356445, 8.547277450561523, 18.738861083984375, 28.93044662475586, 39.122032165527344, 49.31361389160156, 59.50520324707031, 69.69678497314453, 79.88836669921875, 90.0799560546875, 100.27153778076172, 110.46311950683594, 120.65470886230469, 130.84628295898438, 141.03787231445312, 151.22946166992188, 161.42105102539062, 171.6126251220703, 181.80421447753906, 191.9958038330078, 202.1873779296875, 212.37896728515625, 222.570556640625, 232.76211547851562, 242.95370483398438, 253.14527893066406, 263.33685302734375, 273.5284423828125, 283.72003173828125, 293.91162109375, 304.10321044921875, 314.2947998046875, 324.48638916015625, 334.677978515625, 344.86956787109375, 355.0611267089844, 365.2527160644531, 375.4443054199219, 385.6358947753906, 395.82745361328125, 406.01904296875, 416.21063232421875, 426.4022216796875, 436.5937805175781, 446.7853698730469, 456.9769592285156, 467.1685485839844, 477.3601379394531, 487.5517272949219, 497.7433166503906, 507.93487548828125, 518.12646484375, 528.3180541992188, 538.5096435546875, 548.7012329101562, 558.892822265625]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 1.0, 5.0, 7.0, 11.0, 8.0, 7.0, 24.0, 21.0, 15.0, 20.0, 23.0, 24.0, 29.0, 27.0, 40.0, 50.0, 47.0, 43.0, 43.0, 46.0, 51.0, 43.0, 47.0, 42.0, 43.0, 40.0, 34.0, 32.0, 23.0, 23.0, 26.0, 17.0, 17.0, 13.0, 13.0, 13.0, 7.0, 9.0, 5.0, 7.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.166202545166016, -54.38456344604492, -52.60292434692383, -50.8212890625, -49.039649963378906, -47.25801086425781, -45.47637176513672, -43.694732666015625, -41.91309356689453, -40.13145446777344, -38.349815368652344, -36.56817626953125, -34.78654098510742, -33.00490188598633, -31.223262786865234, -29.44162368774414, -27.659988403320312, -25.87834930419922, -24.096712112426758, -22.315073013305664, -20.533435821533203, -18.75179672241211, -16.970157623291016, -15.188519477844238, -13.406881332397461, -11.625243186950684, -9.843605041503906, -8.061965942382812, -6.280327796936035, -4.498689651489258, -2.717050552368164, -0.9354124069213867, 0.8462295532226562, 2.6278679370880127, 4.409506320953369, 6.191144943237305, 7.972783088684082, 9.75442123413086, 11.536060333251953, 13.31769847869873, 15.099336624145508, 16.8809757232666, 18.662612915039062, 20.444252014160156, 22.22589111328125, 24.00752830505371, 25.789167404174805, 27.570804595947266, 29.35244369506836, 31.134082794189453, 32.91572189331055, 34.697357177734375, 36.47899627685547, 38.26063537597656, 40.042274475097656, 41.82391357421875, 43.605552673339844, 45.38719177246094, 47.16883087158203, 48.950469970703125, 50.73210525512695, 52.51374435424805, 54.29538345336914, 56.077022552490234, 57.85865783691406]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 8.0, 7.0, 3.0, 4.0, 8.0, 12.0, 9.0, 9.0, 10.0, 11.0, 18.0, 24.0, 16.0, 18.0, 25.0, 35.0, 31.0, 40.0, 32.0, 30.0, 32.0, 38.0, 34.0, 42.0, 36.0, 33.0, 25.0, 43.0, 34.0, 30.0, 39.0, 31.0, 32.0, 29.0, 22.0, 25.0, 25.0, 24.0, 14.0, 16.0, 5.0, 7.0, 11.0, 6.0, 5.0, 9.0, 3.0, 0.0, 3.0, 0.0, 6.0, 1.0, 2.0, 1.0, 2.0, 3.0], "bins": [-7.50390625, -7.27252197265625, -7.0411376953125, -6.80975341796875, -6.578369140625, -6.34698486328125, -6.1156005859375, -5.88421630859375, -5.65283203125, -5.42144775390625, -5.1900634765625, -4.95867919921875, -4.727294921875, -4.49591064453125, -4.2645263671875, -4.03314208984375, -3.8017578125, -3.57037353515625, -3.3389892578125, -3.10760498046875, -2.876220703125, -2.64483642578125, -2.4134521484375, -2.18206787109375, -1.95068359375, -1.71929931640625, -1.4879150390625, -1.25653076171875, -1.025146484375, -0.79376220703125, -0.5623779296875, -0.33099365234375, -0.099609375, 0.13177490234375, 0.3631591796875, 0.59454345703125, 0.825927734375, 1.05731201171875, 1.2886962890625, 1.52008056640625, 1.75146484375, 1.98284912109375, 2.2142333984375, 2.44561767578125, 2.677001953125, 2.90838623046875, 3.1397705078125, 3.37115478515625, 3.6025390625, 3.83392333984375, 4.0653076171875, 4.29669189453125, 4.528076171875, 4.75946044921875, 4.9908447265625, 5.22222900390625, 5.45361328125, 5.68499755859375, 5.9163818359375, 6.14776611328125, 6.379150390625, 6.61053466796875, 6.8419189453125, 7.07330322265625, 7.3046875]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 0.0, 5.0, 2.0, 3.0, 2.0, 1.0, 15.0, 27.0, 28.0, 48.0, 83.0, 124.0, 153.0, 271.0, 443.0, 699.0, 1107.0, 1579.0, 2450.0, 3855.0, 5826.0, 9051.0, 14919.0, 24567.0, 41244.0, 69347.0, 129414.0, 322161.0, 195211.0, 91581.0, 52648.0, 30528.0, 19065.0, 11599.0, 7412.0, 4734.0, 2865.0, 1811.0, 1302.0, 809.0, 522.0, 342.0, 257.0, 140.0, 113.0, 72.0, 51.0, 31.0, 15.0, 12.0, 8.0, 10.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-1.6376953125, -1.586090087890625, -1.53448486328125, -1.482879638671875, -1.4312744140625, -1.379669189453125, -1.32806396484375, -1.276458740234375, -1.224853515625, -1.173248291015625, -1.12164306640625, -1.070037841796875, -1.0184326171875, -0.966827392578125, -0.91522216796875, -0.863616943359375, -0.81201171875, -0.760406494140625, -0.70880126953125, -0.657196044921875, -0.6055908203125, -0.553985595703125, -0.50238037109375, -0.450775146484375, -0.399169921875, -0.347564697265625, -0.29595947265625, -0.244354248046875, -0.1927490234375, -0.141143798828125, -0.08953857421875, -0.037933349609375, 0.013671875, 0.065277099609375, 0.11688232421875, 0.168487548828125, 0.2200927734375, 0.271697998046875, 0.32330322265625, 0.374908447265625, 0.426513671875, 0.478118896484375, 0.52972412109375, 0.581329345703125, 0.6329345703125, 0.684539794921875, 0.73614501953125, 0.787750244140625, 0.83935546875, 0.890960693359375, 0.94256591796875, 0.994171142578125, 1.0457763671875, 1.097381591796875, 1.14898681640625, 1.200592041015625, 1.252197265625, 1.303802490234375, 1.35540771484375, 1.407012939453125, 1.4586181640625, 1.510223388671875, 1.56182861328125, 1.613433837890625, 1.6650390625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 6.0, 3.0, 1.0, 11.0, 9.0, 8.0, 14.0, 19.0, 21.0, 20.0, 18.0, 23.0, 34.0, 28.0, 34.0, 31.0, 45.0, 37.0, 42.0, 43.0, 44.0, 1068.0, 52.0, 44.0, 43.0, 41.0, 31.0, 26.0, 26.0, 26.0, 23.0, 29.0, 25.0, 24.0, 11.0, 10.0, 14.0, 9.0, 6.0, 9.0, 5.0, 3.0, 3.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.04296875, -4.8790283203125, -4.715087890625, -4.5511474609375, -4.38720703125, -4.2232666015625, -4.059326171875, -3.8953857421875, -3.7314453125, -3.5675048828125, -3.403564453125, -3.2396240234375, -3.07568359375, -2.9117431640625, -2.747802734375, -2.5838623046875, -2.419921875, -2.2559814453125, -2.092041015625, -1.9281005859375, -1.76416015625, -1.6002197265625, -1.436279296875, -1.2723388671875, -1.1083984375, -0.9444580078125, -0.780517578125, -0.6165771484375, -0.45263671875, -0.2886962890625, -0.124755859375, 0.0391845703125, 0.203125, 0.3670654296875, 0.531005859375, 0.6949462890625, 0.85888671875, 1.0228271484375, 1.186767578125, 1.3507080078125, 1.5146484375, 1.6785888671875, 1.842529296875, 2.0064697265625, 2.17041015625, 2.3343505859375, 2.498291015625, 2.6622314453125, 2.826171875, 2.9901123046875, 3.154052734375, 3.3179931640625, 3.48193359375, 3.6458740234375, 3.809814453125, 3.9737548828125, 4.1376953125, 4.3016357421875, 4.465576171875, 4.6295166015625, 4.79345703125, 4.9573974609375, 5.121337890625, 5.2852783203125, 5.44921875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 7.0, 3.0, 4.0, 5.0, 8.0, 17.0, 20.0, 32.0, 33.0, 49.0, 72.0, 85.0, 174.0, 214.0, 279.0, 475.0, 663.0, 952.0, 1433.0, 1995.0, 3053.0, 4498.0, 6943.0, 10632.0, 16518.0, 25977.0, 42145.0, 71027.0, 132457.0, 1365994.0, 182847.0, 88124.0, 51508.0, 31535.0, 19836.0, 12748.0, 8280.0, 5324.0, 3687.0, 2343.0, 1640.0, 1122.0, 717.0, 517.0, 353.0, 240.0, 189.0, 113.0, 73.0, 59.0, 50.0, 24.0, 18.0, 17.0, 9.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0], "bins": [-1.4931640625, -1.446044921875, -1.39892578125, -1.351806640625, -1.3046875, -1.257568359375, -1.21044921875, -1.163330078125, -1.1162109375, -1.069091796875, -1.02197265625, -0.974853515625, -0.927734375, -0.880615234375, -0.83349609375, -0.786376953125, -0.7392578125, -0.692138671875, -0.64501953125, -0.597900390625, -0.55078125, -0.503662109375, -0.45654296875, -0.409423828125, -0.3623046875, -0.315185546875, -0.26806640625, -0.220947265625, -0.173828125, -0.126708984375, -0.07958984375, -0.032470703125, 0.0146484375, 0.061767578125, 0.10888671875, 0.156005859375, 0.203125, 0.250244140625, 0.29736328125, 0.344482421875, 0.3916015625, 0.438720703125, 0.48583984375, 0.532958984375, 0.580078125, 0.627197265625, 0.67431640625, 0.721435546875, 0.7685546875, 0.815673828125, 0.86279296875, 0.909912109375, 0.95703125, 1.004150390625, 1.05126953125, 1.098388671875, 1.1455078125, 1.192626953125, 1.23974609375, 1.286865234375, 1.333984375, 1.381103515625, 1.42822265625, 1.475341796875, 1.5224609375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 9.0, 6.0, 6.0, 8.0, 14.0, 18.0, 23.0, 36.0, 25.0, 38.0, 47.0, 66.0, 80.0, 90.0, 87.0, 85.0, 66.0, 52.0, 50.0, 37.0, 33.0, 25.0, 31.0, 17.0, 12.0, 6.0, 8.0, 14.0, 3.0, 6.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007677078247070312, -0.0007363408803939819, -0.0007049739360809326, -0.0006736069917678833, -0.000642240047454834, -0.0006108731031417847, -0.0005795061588287354, -0.000548139214515686, -0.0005167722702026367, -0.0004854053258895874, -0.0004540383815765381, -0.00042267143726348877, -0.00039130449295043945, -0.00035993754863739014, -0.0003285706043243408, -0.0002972036600112915, -0.0002658367156982422, -0.00023446977138519287, -0.00020310282707214355, -0.00017173588275909424, -0.00014036893844604492, -0.0001090019941329956, -7.763504981994629e-05, -4.626810550689697e-05, -1.4901161193847656e-05, 1.646578311920166e-05, 4.7832727432250977e-05, 7.919967174530029e-05, 0.00011056661605834961, 0.00014193356037139893, 0.00017330050468444824, 0.00020466744899749756, 0.00023603439331054688, 0.0002674013376235962, 0.0002987682819366455, 0.0003301352262496948, 0.00036150217056274414, 0.00039286911487579346, 0.0004242360591888428, 0.0004556030035018921, 0.0004869699478149414, 0.0005183368921279907, 0.00054970383644104, 0.0005810707807540894, 0.0006124377250671387, 0.000643804669380188, 0.0006751716136932373, 0.0007065385580062866, 0.0007379055023193359, 0.0007692724466323853, 0.0008006393909454346, 0.0008320063352584839, 0.0008633732795715332, 0.0008947402238845825, 0.0009261071681976318, 0.0009574741125106812, 0.0009888410568237305, 0.0010202080011367798, 0.001051574945449829, 0.0010829418897628784, 0.0011143088340759277, 0.001145675778388977, 0.0011770427227020264, 0.0012084096670150757, 0.001239776611328125]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 9.0, 3.0, 6.0, 5.0, 6.0, 13.0, 17.0, 15.0, 16.0, 32.0, 36.0, 63.0, 63.0, 96.0, 133.0, 334.0, 1154.0, 995323.0, 49814.0, 731.0, 231.0, 119.0, 94.0, 54.0, 50.0, 35.0, 32.0, 21.0, 9.0, 8.0, 10.0, 8.0, 7.0, 2.0, 4.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.023101806640625, -0.022418975830078125, -0.02173614501953125, -0.021053314208984375, -0.0203704833984375, -0.019687652587890625, -0.01900482177734375, -0.018321990966796875, -0.01763916015625, -0.016956329345703125, -0.01627349853515625, -0.015590667724609375, -0.0149078369140625, -0.014225006103515625, -0.01354217529296875, -0.012859344482421875, -0.012176513671875, -0.011493682861328125, -0.01081085205078125, -0.010128021240234375, -0.0094451904296875, -0.008762359619140625, -0.00807952880859375, -0.007396697998046875, -0.0067138671875, -0.006031036376953125, -0.00534820556640625, -0.004665374755859375, -0.0039825439453125, -0.003299713134765625, -0.00261688232421875, -0.001934051513671875, -0.001251220703125, -0.000568389892578125, 0.00011444091796875, 0.000797271728515625, 0.0014801025390625, 0.002162933349609375, 0.00284576416015625, 0.003528594970703125, 0.00421142578125, 0.004894256591796875, 0.00557708740234375, 0.006259918212890625, 0.0069427490234375, 0.007625579833984375, 0.00830841064453125, 0.008991241455078125, 0.009674072265625, 0.010356903076171875, 0.01103973388671875, 0.011722564697265625, 0.0124053955078125, 0.013088226318359375, 0.01377105712890625, 0.014453887939453125, 0.01513671875, 0.015819549560546875, 0.01650238037109375, 0.017185211181640625, 0.0178680419921875, 0.018550872802734375, 0.01923370361328125, 0.019916534423828125, 0.020599365234375]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 32.0, 169.0, 530.0, 253.0, 27.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0032556939404457808, -0.0031960508786141872, -0.00313640758395195, -0.0030767645221203566, -0.003017121460288763, -0.002957478165626526, -0.0028978351037949324, -0.002838192041963339, -0.0027785487473011017, -0.002718905685469508, -0.002659262390807271, -0.0025996193289756775, -0.002539976267144084, -0.002480332972481847, -0.0024206899106502533, -0.002361046615988016, -0.0023014035541564226, -0.002241760492324829, -0.002182117197662592, -0.0021224741358309984, -0.002062831073999405, -0.0020031877793371677, -0.0019435447175055742, -0.0018839015392586589, -0.0018242584774270654, -0.00176461529918015, -0.0017049722373485565, -0.0016453290591016412, -0.0015856858808547258, -0.0015260428190231323, -0.001466399640776217, -0.0014067564625293016, -0.0013471131678670645, -0.0012874699896201491, -0.0012278269277885556, -0.0011681837495416403, -0.001108540571294725, -0.0010488973930478096, -0.000989254331216216, -0.0009296111529693007, -0.0008699680911377072, -0.0008103249710984528, -0.0007506817928515375, -0.000691038672812283, -0.0006313954945653677, -0.0005717523745261133, -0.0005121092544868588, -0.0004524660762399435, -0.00039282289799302816, -0.0003331797488499433, -0.0002735365997068584, -0.00021389346511568874, -0.00015425031597260386, -9.46071813814342e-05, -3.496403223834932e-05, 2.4679116904735565e-05, 8.432226604782045e-05, 0.00014396541519090533, 0.00020360856433399022, 0.0002632517134770751, 0.0003228948335163295, 0.0003825379826594144, 0.0004421811318024993, 0.0005018243100494146, 0.0005614674300886691]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 3.0, 8.0, 14.0, 9.0, 9.0, 15.0, 12.0, 13.0, 11.0, 19.0, 24.0, 21.0, 28.0, 26.0, 29.0, 29.0, 25.0, 44.0, 38.0, 34.0, 47.0, 35.0, 33.0, 41.0, 41.0, 27.0, 33.0, 33.0, 42.0, 28.0, 26.0, 20.0, 26.0, 25.0, 23.0, 18.0, 19.0, 8.0, 11.0, 20.0, 6.0, 8.0, 9.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0], "bins": [-0.0003854036331176758, -0.00037386640906333923, -0.0003623291850090027, -0.00035079196095466614, -0.0003392547369003296, -0.00032771751284599304, -0.0003161802887916565, -0.00030464306473731995, -0.0002931058406829834, -0.00028156861662864685, -0.0002700313925743103, -0.00025849416851997375, -0.0002469569444656372, -0.00023541972041130066, -0.0002238824963569641, -0.00021234527230262756, -0.00020080804824829102, -0.00018927082419395447, -0.00017773360013961792, -0.00016619637608528137, -0.00015465915203094482, -0.00014312192797660828, -0.00013158470392227173, -0.00012004747986793518, -0.00010851025581359863, -9.697303175926208e-05, -8.543580770492554e-05, -7.389858365058899e-05, -6.236135959625244e-05, -5.0824135541915894e-05, -3.9286911487579346e-05, -2.7749687433242798e-05, -1.621246337890625e-05, -4.675239324569702e-06, 6.861984729766846e-06, 1.8399208784103394e-05, 2.993643283843994e-05, 4.147365689277649e-05, 5.301088094711304e-05, 6.454810500144958e-05, 7.608532905578613e-05, 8.762255311012268e-05, 9.915977716445923e-05, 0.00011069700121879578, 0.00012223422527313232, 0.00013377144932746887, 0.00014530867338180542, 0.00015684589743614197, 0.00016838312149047852, 0.00017992034554481506, 0.0001914575695991516, 0.00020299479365348816, 0.0002145320177078247, 0.00022606924176216125, 0.0002376064658164978, 0.00024914368987083435, 0.0002606809139251709, 0.00027221813797950745, 0.000283755362033844, 0.00029529258608818054, 0.0003068298101425171, 0.00031836703419685364, 0.0003299042582511902, 0.00034144148230552673, 0.0003529787063598633]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 8.0, 7.0, 3.0, 4.0, 8.0, 12.0, 9.0, 9.0, 10.0, 11.0, 18.0, 24.0, 16.0, 18.0, 25.0, 35.0, 31.0, 40.0, 32.0, 30.0, 32.0, 38.0, 34.0, 42.0, 36.0, 33.0, 25.0, 43.0, 34.0, 30.0, 39.0, 31.0, 32.0, 29.0, 22.0, 25.0, 25.0, 24.0, 14.0, 16.0, 5.0, 7.0, 11.0, 6.0, 5.0, 9.0, 3.0, 0.0, 3.0, 0.0, 6.0, 1.0, 2.0, 1.0, 2.0, 3.0], "bins": [-7.50390625, -7.27252197265625, -7.0411376953125, -6.80975341796875, -6.578369140625, -6.34698486328125, -6.1156005859375, -5.88421630859375, -5.65283203125, -5.42144775390625, -5.1900634765625, -4.95867919921875, -4.727294921875, -4.49591064453125, -4.2645263671875, -4.03314208984375, -3.8017578125, -3.57037353515625, -3.3389892578125, -3.10760498046875, -2.876220703125, -2.64483642578125, -2.4134521484375, -2.18206787109375, -1.95068359375, -1.71929931640625, -1.4879150390625, -1.25653076171875, -1.025146484375, -0.79376220703125, -0.5623779296875, -0.33099365234375, -0.099609375, 0.13177490234375, 0.3631591796875, 0.59454345703125, 0.825927734375, 1.05731201171875, 1.2886962890625, 1.52008056640625, 1.75146484375, 1.98284912109375, 2.2142333984375, 2.44561767578125, 2.677001953125, 2.90838623046875, 3.1397705078125, 3.37115478515625, 3.6025390625, 3.83392333984375, 4.0653076171875, 4.29669189453125, 4.528076171875, 4.75946044921875, 4.9908447265625, 5.22222900390625, 5.45361328125, 5.68499755859375, 5.9163818359375, 6.14776611328125, 6.379150390625, 6.61053466796875, 6.8419189453125, 7.07330322265625, 7.3046875]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 12.0, 5.0, 9.0, 7.0, 18.0, 14.0, 27.0, 25.0, 32.0, 45.0, 59.0, 72.0, 140.0, 183.0, 306.0, 541.0, 937.0, 1814.0, 3365.0, 6513.0, 13250.0, 27490.0, 62414.0, 159513.0, 364860.0, 241245.0, 90987.0, 38251.0, 17661.0, 8752.0, 4511.0, 2374.0, 1254.0, 683.0, 418.0, 245.0, 152.0, 108.0, 63.0, 53.0, 39.0, 17.0, 14.0, 15.0, 15.0, 15.0, 7.0, 8.0, 5.0, 3.0, 5.0, 1.0, 3.0, 3.0, 2.0, 4.0, 1.0], "bins": [-5.7578125, -5.57623291015625, -5.3946533203125, -5.21307373046875, -5.031494140625, -4.84991455078125, -4.6683349609375, -4.48675537109375, -4.30517578125, -4.12359619140625, -3.9420166015625, -3.76043701171875, -3.578857421875, -3.39727783203125, -3.2156982421875, -3.03411865234375, -2.8525390625, -2.67095947265625, -2.4893798828125, -2.30780029296875, -2.126220703125, -1.94464111328125, -1.7630615234375, -1.58148193359375, -1.39990234375, -1.21832275390625, -1.0367431640625, -0.85516357421875, -0.673583984375, -0.49200439453125, -0.3104248046875, -0.12884521484375, 0.052734375, 0.23431396484375, 0.4158935546875, 0.59747314453125, 0.779052734375, 0.96063232421875, 1.1422119140625, 1.32379150390625, 1.50537109375, 1.68695068359375, 1.8685302734375, 2.05010986328125, 2.231689453125, 2.41326904296875, 2.5948486328125, 2.77642822265625, 2.9580078125, 3.13958740234375, 3.3211669921875, 3.50274658203125, 3.684326171875, 3.86590576171875, 4.0474853515625, 4.22906494140625, 4.41064453125, 4.59222412109375, 4.7738037109375, 4.95538330078125, 5.136962890625, 5.31854248046875, 5.5001220703125, 5.68170166015625, 5.86328125]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 3.0, 6.0, 6.0, 4.0, 2.0, 5.0, 5.0, 6.0, 7.0, 12.0, 17.0, 22.0, 17.0, 20.0, 26.0, 21.0, 29.0, 28.0, 32.0, 26.0, 34.0, 47.0, 45.0, 80.0, 227.0, 1647.0, 191.0, 56.0, 45.0, 50.0, 44.0, 37.0, 33.0, 35.0, 21.0, 25.0, 21.0, 22.0, 10.0, 16.0, 8.0, 13.0, 8.0, 10.0, 10.0, 4.0, 11.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.140625, -20.422119140625, -19.70361328125, -18.985107421875, -18.2666015625, -17.548095703125, -16.82958984375, -16.111083984375, -15.392578125, -14.674072265625, -13.95556640625, -13.237060546875, -12.5185546875, -11.800048828125, -11.08154296875, -10.363037109375, -9.64453125, -8.926025390625, -8.20751953125, -7.489013671875, -6.7705078125, -6.052001953125, -5.33349609375, -4.614990234375, -3.896484375, -3.177978515625, -2.45947265625, -1.740966796875, -1.0224609375, -0.303955078125, 0.41455078125, 1.133056640625, 1.8515625, 2.570068359375, 3.28857421875, 4.007080078125, 4.7255859375, 5.444091796875, 6.16259765625, 6.881103515625, 7.599609375, 8.318115234375, 9.03662109375, 9.755126953125, 10.4736328125, 11.192138671875, 11.91064453125, 12.629150390625, 13.34765625, 14.066162109375, 14.78466796875, 15.503173828125, 16.2216796875, 16.940185546875, 17.65869140625, 18.377197265625, 19.095703125, 19.814208984375, 20.53271484375, 21.251220703125, 21.9697265625, 22.688232421875, 23.40673828125, 24.125244140625, 24.84375]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 3.0, 2.0, 8.0, 6.0, 10.0, 11.0, 9.0, 11.0, 15.0, 13.0, 25.0, 18.0, 31.0, 37.0, 64.0, 76.0, 98.0, 109.0, 118.0, 189.0, 276.0, 466.0, 907.0, 7739.0, 1910025.0, 1216385.0, 6531.0, 969.0, 429.0, 257.0, 192.0, 140.0, 101.0, 80.0, 53.0, 59.0, 54.0, 44.0, 31.0, 27.0, 21.0, 10.0, 11.0, 4.0, 10.0, 7.0, 6.0, 5.0, 7.0, 5.0, 1.0, 4.0, 1.0, 4.0, 2.0], "bins": [-39.5, -38.33740234375, -37.1748046875, -36.01220703125, -34.849609375, -33.68701171875, -32.5244140625, -31.36181640625, -30.19921875, -29.03662109375, -27.8740234375, -26.71142578125, -25.548828125, -24.38623046875, -23.2236328125, -22.06103515625, -20.8984375, -19.73583984375, -18.5732421875, -17.41064453125, -16.248046875, -15.08544921875, -13.9228515625, -12.76025390625, -11.59765625, -10.43505859375, -9.2724609375, -8.10986328125, -6.947265625, -5.78466796875, -4.6220703125, -3.45947265625, -2.296875, -1.13427734375, 0.0283203125, 1.19091796875, 2.353515625, 3.51611328125, 4.6787109375, 5.84130859375, 7.00390625, 8.16650390625, 9.3291015625, 10.49169921875, 11.654296875, 12.81689453125, 13.9794921875, 15.14208984375, 16.3046875, 17.46728515625, 18.6298828125, 19.79248046875, 20.955078125, 22.11767578125, 23.2802734375, 24.44287109375, 25.60546875, 26.76806640625, 27.9306640625, 29.09326171875, 30.255859375, 31.41845703125, 32.5810546875, 33.74365234375, 34.90625]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 9.0, 61.0, 299.0, 440.0, 175.0, 28.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.195556640625, -71.82279205322266, -69.45002746582031, -67.07726287841797, -64.70449829101562, -62.33173370361328, -59.95896911621094, -57.586204528808594, -55.21343994140625, -52.840675354003906, -50.46791076660156, -48.09514617919922, -45.722381591796875, -43.34961700439453, -40.97685241699219, -38.604087829589844, -36.231319427490234, -33.85855484008789, -31.485790252685547, -29.113025665283203, -26.74026107788086, -24.367496490478516, -21.99472999572754, -19.621965408325195, -17.24920082092285, -14.876436233520508, -12.503671646118164, -10.130906105041504, -7.75814151763916, -5.385376930236816, -3.0126113891601562, -0.6398468017578125, 1.7329177856445312, 4.105682373046875, 6.478447437286377, 8.851212501525879, 11.223977088928223, 13.596741676330566, 15.969507217407227, 18.34227180480957, 20.715036392211914, 23.087800979614258, 25.4605655670166, 27.833332061767578, 30.206096649169922, 32.578861236572266, 34.95162582397461, 37.32439041137695, 39.6971549987793, 42.06991958618164, 44.442684173583984, 46.81544876098633, 49.18821334838867, 51.560977935791016, 53.933746337890625, 56.30651092529297, 58.67927551269531, 61.052040100097656, 63.4248046875, 65.79756927490234, 68.17033386230469, 70.54309844970703, 72.91586303710938, 75.28862762451172, 77.66139221191406]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 8.0, 13.0, 18.0, 12.0, 15.0, 20.0, 23.0, 24.0, 31.0, 29.0, 41.0, 48.0, 39.0, 50.0, 39.0, 50.0, 32.0, 50.0, 49.0, 55.0, 49.0, 45.0, 34.0, 21.0, 37.0, 31.0, 28.0, 17.0, 17.0, 12.0, 15.0, 8.0, 8.0, 8.0, 8.0, 8.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.954627990722656, -59.82500076293945, -57.695377349853516, -55.56575012207031, -53.436126708984375, -51.30649948120117, -49.17687225341797, -47.04724884033203, -44.91762161254883, -42.787994384765625, -40.65837097167969, -38.528743743896484, -36.39911651611328, -34.269493103027344, -32.13986587524414, -30.01024055480957, -27.880615234375, -25.75098991394043, -23.62136459350586, -21.491737365722656, -19.362112045288086, -17.232486724853516, -15.102860450744629, -12.973234176635742, -10.843608856201172, -8.713983535766602, -6.584357261657715, -4.454731464385986, -2.325105667114258, -0.1954803466796875, 1.9341459274291992, 4.063772201538086, 6.193397521972656, 8.323022842407227, 10.452649116516113, 12.582275390625, 14.71190071105957, 16.84152603149414, 18.971153259277344, 21.100778579711914, 23.230403900146484, 25.360029220581055, 27.489654541015625, 29.619281768798828, 31.7489070892334, 33.87853240966797, 36.00815963745117, 38.137786865234375, 40.26741027832031, 42.397037506103516, 44.52666091918945, 46.656288146972656, 48.785911560058594, 50.9155387878418, 53.045166015625, 55.17478942871094, 57.30441665649414, 59.434043884277344, 61.56366729736328, 63.693294525146484, 65.82292175292969, 67.95254516601562, 70.08216857910156, 72.21179962158203, 74.34142303466797]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 6.0, 6.0, 10.0, 10.0, 10.0, 15.0, 14.0, 16.0, 7.0, 27.0, 22.0, 28.0, 28.0, 31.0, 32.0, 40.0, 39.0, 29.0, 29.0, 41.0, 43.0, 33.0, 28.0, 43.0, 41.0, 38.0, 34.0, 35.0, 31.0, 28.0, 29.0, 21.0, 19.0, 24.0, 33.0, 14.0, 12.0, 6.0, 7.0, 4.0, 9.0, 4.0, 6.0, 3.0, 3.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-7.76171875, -7.52093505859375, -7.2801513671875, -7.03936767578125, -6.798583984375, -6.55780029296875, -6.3170166015625, -6.07623291015625, -5.83544921875, -5.59466552734375, -5.3538818359375, -5.11309814453125, -4.872314453125, -4.63153076171875, -4.3907470703125, -4.14996337890625, -3.9091796875, -3.66839599609375, -3.4276123046875, -3.18682861328125, -2.946044921875, -2.70526123046875, -2.4644775390625, -2.22369384765625, -1.98291015625, -1.74212646484375, -1.5013427734375, -1.26055908203125, -1.019775390625, -0.77899169921875, -0.5382080078125, -0.29742431640625, -0.056640625, 0.18414306640625, 0.4249267578125, 0.66571044921875, 0.906494140625, 1.14727783203125, 1.3880615234375, 1.62884521484375, 1.86962890625, 2.11041259765625, 2.3511962890625, 2.59197998046875, 2.832763671875, 3.07354736328125, 3.3143310546875, 3.55511474609375, 3.7958984375, 4.03668212890625, 4.2774658203125, 4.51824951171875, 4.759033203125, 4.99981689453125, 5.2406005859375, 5.48138427734375, 5.72216796875, 5.96295166015625, 6.2037353515625, 6.44451904296875, 6.685302734375, 6.92608642578125, 7.1668701171875, 7.40765380859375, 7.6484375]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 1.0, 6.0, 7.0, 4.0, 18.0, 11.0, 14.0, 28.0, 29.0, 25.0, 32.0, 45.0, 60.0, 84.0, 114.0, 230.0, 558.0, 2414.0, 26896.0, 1737650.0, 2382529.0, 39120.0, 3028.0, 623.0, 231.0, 126.0, 101.0, 70.0, 49.0, 29.0, 31.0, 28.0, 13.0, 18.0, 15.0, 12.0, 8.0, 6.0, 6.0, 5.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-32.71875, -31.785400390625, -30.85205078125, -29.918701171875, -28.9853515625, -28.052001953125, -27.11865234375, -26.185302734375, -25.251953125, -24.318603515625, -23.38525390625, -22.451904296875, -21.5185546875, -20.585205078125, -19.65185546875, -18.718505859375, -17.78515625, -16.851806640625, -15.91845703125, -14.985107421875, -14.0517578125, -13.118408203125, -12.18505859375, -11.251708984375, -10.318359375, -9.385009765625, -8.45166015625, -7.518310546875, -6.5849609375, -5.651611328125, -4.71826171875, -3.784912109375, -2.8515625, -1.918212890625, -0.98486328125, -0.051513671875, 0.8818359375, 1.815185546875, 2.74853515625, 3.681884765625, 4.615234375, 5.548583984375, 6.48193359375, 7.415283203125, 8.3486328125, 9.281982421875, 10.21533203125, 11.148681640625, 12.08203125, 13.015380859375, 13.94873046875, 14.882080078125, 15.8154296875, 16.748779296875, 17.68212890625, 18.615478515625, 19.548828125, 20.482177734375, 21.41552734375, 22.348876953125, 23.2822265625, 24.215576171875, 25.14892578125, 26.082275390625, 27.015625]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 0.0, 2.0, 6.0, 4.0, 6.0, 10.0, 11.0, 6.0, 15.0, 25.0, 20.0, 33.0, 45.0, 57.0, 64.0, 89.0, 126.0, 176.0, 203.0, 273.0, 354.0, 444.0, 424.0, 376.0, 321.0, 232.0, 174.0, 133.0, 95.0, 72.0, 63.0, 54.0, 44.0, 39.0, 24.0, 20.0, 15.0, 10.0, 8.0, 1.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.125, -9.7252197265625, -9.325439453125, -8.9256591796875, -8.52587890625, -8.1260986328125, -7.726318359375, -7.3265380859375, -6.9267578125, -6.5269775390625, -6.127197265625, -5.7274169921875, -5.32763671875, -4.9278564453125, -4.528076171875, -4.1282958984375, -3.728515625, -3.3287353515625, -2.928955078125, -2.5291748046875, -2.12939453125, -1.7296142578125, -1.329833984375, -0.9300537109375, -0.5302734375, -0.1304931640625, 0.269287109375, 0.6690673828125, 1.06884765625, 1.4686279296875, 1.868408203125, 2.2681884765625, 2.66796875, 3.0677490234375, 3.467529296875, 3.8673095703125, 4.26708984375, 4.6668701171875, 5.066650390625, 5.4664306640625, 5.8662109375, 6.2659912109375, 6.665771484375, 7.0655517578125, 7.46533203125, 7.8651123046875, 8.264892578125, 8.6646728515625, 9.064453125, 9.4642333984375, 9.864013671875, 10.2637939453125, 10.66357421875, 11.0633544921875, 11.463134765625, 11.8629150390625, 12.2626953125, 12.6624755859375, 13.062255859375, 13.4620361328125, 13.86181640625, 14.2615966796875, 14.661376953125, 15.0611572265625, 15.4609375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 4.0, 8.0, 8.0, 7.0, 12.0, 12.0, 15.0, 24.0, 26.0, 37.0, 58.0, 56.0, 73.0, 111.0, 126.0, 138.0, 199.0, 240.0, 384.0, 1096.0, 25311.0, 4108963.0, 54236.0, 1394.0, 506.0, 335.0, 196.0, 156.0, 115.0, 99.0, 71.0, 62.0, 46.0, 36.0, 30.0, 28.0, 11.0, 14.0, 8.0, 10.0, 4.0, 4.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-75.0, -72.6240234375, -70.248046875, -67.8720703125, -65.49609375, -63.1201171875, -60.744140625, -58.3681640625, -55.9921875, -53.6162109375, -51.240234375, -48.8642578125, -46.48828125, -44.1123046875, -41.736328125, -39.3603515625, -36.984375, -34.6083984375, -32.232421875, -29.8564453125, -27.48046875, -25.1044921875, -22.728515625, -20.3525390625, -17.9765625, -15.6005859375, -13.224609375, -10.8486328125, -8.47265625, -6.0966796875, -3.720703125, -1.3447265625, 1.03125, 3.4072265625, 5.783203125, 8.1591796875, 10.53515625, 12.9111328125, 15.287109375, 17.6630859375, 20.0390625, 22.4150390625, 24.791015625, 27.1669921875, 29.54296875, 31.9189453125, 34.294921875, 36.6708984375, 39.046875, 41.4228515625, 43.798828125, 46.1748046875, 48.55078125, 50.9267578125, 53.302734375, 55.6787109375, 58.0546875, 60.4306640625, 62.806640625, 65.1826171875, 67.55859375, 69.9345703125, 72.310546875, 74.6865234375, 77.0625]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 60.0, 646.0, 292.0, 19.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.8647232055664, -63.52165985107422, -54.178592681884766, -44.83552551269531, -35.492462158203125, -26.149398803710938, -16.806331634521484, -7.463264465332031, 1.8797988891601562, 11.222864151000977, 20.565929412841797, 29.908994674682617, 39.25205993652344, 48.595123291015625, 57.93819046020508, 67.28125762939453, 76.62432098388672, 85.9673843383789, 95.31045532226562, 104.65351867675781, 113.99658203125, 123.33964538574219, 132.68270874023438, 142.02578735351562, 151.36883544921875, 160.71189880371094, 170.05496215820312, 179.3980255126953, 188.7410888671875, 198.08416748046875, 207.42723083496094, 216.77029418945312, 226.11334228515625, 235.45640563964844, 244.79946899414062, 254.1425323486328, 263.485595703125, 272.82867431640625, 282.1717224121094, 291.5148010253906, 300.85784912109375, 310.200927734375, 319.5439758300781, 328.8870544433594, 338.2301025390625, 347.57318115234375, 356.9162292480469, 366.2593078613281, 375.6023864746094, 384.9454650878906, 394.28851318359375, 403.631591796875, 412.9746398925781, 422.3177185058594, 431.6607666015625, 441.00384521484375, 450.346923828125, 459.69000244140625, 469.0330505371094, 478.3761291503906, 487.71917724609375, 497.062255859375, 506.4053039550781, 515.7484130859375, 525.0914306640625]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 4.0, 6.0, 11.0, 2.0, 6.0, 9.0, 18.0, 19.0, 18.0, 25.0, 31.0, 31.0, 23.0, 34.0, 41.0, 26.0, 28.0, 34.0, 31.0, 47.0, 42.0, 51.0, 42.0, 42.0, 45.0, 41.0, 45.0, 35.0, 31.0, 28.0, 31.0, 20.0, 17.0, 16.0, 18.0, 10.0, 13.0, 5.0, 6.0, 5.0, 3.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-44.88072204589844, -43.396484375, -41.91224670410156, -40.428009033203125, -38.94377136230469, -37.45953369140625, -35.97529602050781, -34.491058349609375, -33.00682067871094, -31.5225830078125, -30.038345336914062, -28.554107666015625, -27.069869995117188, -25.58563232421875, -24.101394653320312, -22.617156982421875, -21.132919311523438, -19.648681640625, -18.164443969726562, -16.680206298828125, -15.195968627929688, -13.71173095703125, -12.227493286132812, -10.743255615234375, -9.259017944335938, -7.7747802734375, -6.2905426025390625, -4.806304931640625, -3.3220672607421875, -1.83782958984375, -0.3535919189453125, 1.130645751953125, 2.614879608154297, 4.099117279052734, 5.583354949951172, 7.067592620849609, 8.551830291748047, 10.036067962646484, 11.520305633544922, 13.00454330444336, 14.488780975341797, 15.973018646240234, 17.457256317138672, 18.94149398803711, 20.425731658935547, 21.909969329833984, 23.394207000732422, 24.87844467163086, 26.362682342529297, 27.846920013427734, 29.331157684326172, 30.81539535522461, 32.29963302612305, 33.783870697021484, 35.26810836791992, 36.75234603881836, 38.2365837097168, 39.720821380615234, 41.20505905151367, 42.68929672241211, 44.17353439331055, 45.657772064208984, 47.14200973510742, 48.62624740600586, 50.1104850769043]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 8.0, 4.0, 6.0, 12.0, 20.0, 12.0, 12.0, 15.0, 19.0, 25.0, 20.0, 25.0, 33.0, 29.0, 26.0, 37.0, 38.0, 47.0, 41.0, 29.0, 35.0, 33.0, 40.0, 40.0, 26.0, 40.0, 37.0, 34.0, 29.0, 28.0, 23.0, 27.0, 35.0, 10.0, 17.0, 13.0, 15.0, 14.0, 7.0, 9.0, 7.0, 7.0, 4.0, 5.0, 4.0, 1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.26171875, -7.02142333984375, -6.7811279296875, -6.54083251953125, -6.300537109375, -6.06024169921875, -5.8199462890625, -5.57965087890625, -5.33935546875, -5.09906005859375, -4.8587646484375, -4.61846923828125, -4.378173828125, -4.13787841796875, -3.8975830078125, -3.65728759765625, -3.4169921875, -3.17669677734375, -2.9364013671875, -2.69610595703125, -2.455810546875, -2.21551513671875, -1.9752197265625, -1.73492431640625, -1.49462890625, -1.25433349609375, -1.0140380859375, -0.77374267578125, -0.533447265625, -0.29315185546875, -0.0528564453125, 0.18743896484375, 0.427734375, 0.66802978515625, 0.9083251953125, 1.14862060546875, 1.388916015625, 1.62921142578125, 1.8695068359375, 2.10980224609375, 2.35009765625, 2.59039306640625, 2.8306884765625, 3.07098388671875, 3.311279296875, 3.55157470703125, 3.7918701171875, 4.03216552734375, 4.2724609375, 4.51275634765625, 4.7530517578125, 4.99334716796875, 5.233642578125, 5.47393798828125, 5.7142333984375, 5.95452880859375, 6.19482421875, 6.43511962890625, 6.6754150390625, 6.91571044921875, 7.156005859375, 7.39630126953125, 7.6365966796875, 7.87689208984375, 8.1171875]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 3.0, 6.0, 10.0, 16.0, 21.0, 28.0, 29.0, 48.0, 83.0, 107.0, 148.0, 203.0, 321.0, 403.0, 638.0, 880.0, 1178.0, 1726.0, 2538.0, 3521.0, 5135.0, 7258.0, 10423.0, 15495.0, 22814.0, 34347.0, 53577.0, 88104.0, 169772.0, 285359.0, 131464.0, 72880.0, 46109.0, 29934.0, 19890.0, 13586.0, 9093.0, 6340.0, 4523.0, 3043.0, 2228.0, 1649.0, 1019.0, 722.0, 578.0, 436.0, 275.0, 161.0, 139.0, 102.0, 59.0, 44.0, 33.0, 24.0, 16.0, 6.0, 9.0, 7.0, 3.0, 5.0], "bins": [-1.396484375, -1.354583740234375, -1.31268310546875, -1.270782470703125, -1.2288818359375, -1.186981201171875, -1.14508056640625, -1.103179931640625, -1.061279296875, -1.019378662109375, -0.97747802734375, -0.935577392578125, -0.8936767578125, -0.851776123046875, -0.80987548828125, -0.767974853515625, -0.72607421875, -0.684173583984375, -0.64227294921875, -0.600372314453125, -0.5584716796875, -0.516571044921875, -0.47467041015625, -0.432769775390625, -0.390869140625, -0.348968505859375, -0.30706787109375, -0.265167236328125, -0.2232666015625, -0.181365966796875, -0.13946533203125, -0.097564697265625, -0.0556640625, -0.013763427734375, 0.02813720703125, 0.070037841796875, 0.1119384765625, 0.153839111328125, 0.19573974609375, 0.237640380859375, 0.279541015625, 0.321441650390625, 0.36334228515625, 0.405242919921875, 0.4471435546875, 0.489044189453125, 0.53094482421875, 0.572845458984375, 0.61474609375, 0.656646728515625, 0.69854736328125, 0.740447998046875, 0.7823486328125, 0.824249267578125, 0.86614990234375, 0.908050537109375, 0.949951171875, 0.991851806640625, 1.03375244140625, 1.075653076171875, 1.1175537109375, 1.159454345703125, 1.20135498046875, 1.243255615234375, 1.28515625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 4.0, 9.0, 5.0, 4.0, 2.0, 5.0, 10.0, 12.0, 19.0, 20.0, 10.0, 20.0, 22.0, 26.0, 23.0, 33.0, 38.0, 40.0, 34.0, 36.0, 34.0, 26.0, 1075.0, 44.0, 49.0, 37.0, 41.0, 43.0, 33.0, 30.0, 25.0, 32.0, 29.0, 25.0, 16.0, 13.0, 27.0, 14.0, 10.0, 6.0, 13.0, 5.0, 12.0, 6.0, 4.0, 2.0, 4.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0], "bins": [-5.25, -5.0946044921875, -4.939208984375, -4.7838134765625, -4.62841796875, -4.4730224609375, -4.317626953125, -4.1622314453125, -4.0068359375, -3.8514404296875, -3.696044921875, -3.5406494140625, -3.38525390625, -3.2298583984375, -3.074462890625, -2.9190673828125, -2.763671875, -2.6082763671875, -2.452880859375, -2.2974853515625, -2.14208984375, -1.9866943359375, -1.831298828125, -1.6759033203125, -1.5205078125, -1.3651123046875, -1.209716796875, -1.0543212890625, -0.89892578125, -0.7435302734375, -0.588134765625, -0.4327392578125, -0.27734375, -0.1219482421875, 0.033447265625, 0.1888427734375, 0.34423828125, 0.4996337890625, 0.655029296875, 0.8104248046875, 0.9658203125, 1.1212158203125, 1.276611328125, 1.4320068359375, 1.58740234375, 1.7427978515625, 1.898193359375, 2.0535888671875, 2.208984375, 2.3643798828125, 2.519775390625, 2.6751708984375, 2.83056640625, 2.9859619140625, 3.141357421875, 3.2967529296875, 3.4521484375, 3.6075439453125, 3.762939453125, 3.9183349609375, 4.07373046875, 4.2291259765625, 4.384521484375, 4.5399169921875, 4.6953125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 4.0, 1.0, 2.0, 6.0, 8.0, 13.0, 22.0, 23.0, 48.0, 76.0, 90.0, 144.0, 166.0, 297.0, 404.0, 623.0, 890.0, 1275.0, 1779.0, 2811.0, 3851.0, 5676.0, 8687.0, 13040.0, 19900.0, 31542.0, 50910.0, 86635.0, 169445.0, 1357638.0, 138647.0, 76003.0, 45042.0, 28008.0, 17751.0, 11594.0, 7672.0, 5094.0, 3507.0, 2435.0, 1650.0, 1099.0, 821.0, 550.0, 383.0, 274.0, 191.0, 102.0, 104.0, 74.0, 44.0, 22.0, 28.0, 14.0, 16.0, 11.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-1.462890625, -1.4177093505859375, -1.372528076171875, -1.3273468017578125, -1.28216552734375, -1.2369842529296875, -1.191802978515625, -1.1466217041015625, -1.1014404296875, -1.0562591552734375, -1.011077880859375, -0.9658966064453125, -0.92071533203125, -0.8755340576171875, -0.830352783203125, -0.7851715087890625, -0.739990234375, -0.6948089599609375, -0.649627685546875, -0.6044464111328125, -0.55926513671875, -0.5140838623046875, -0.468902587890625, -0.4237213134765625, -0.3785400390625, -0.3333587646484375, -0.288177490234375, -0.2429962158203125, -0.19781494140625, -0.1526336669921875, -0.107452392578125, -0.0622711181640625, -0.01708984375, 0.0280914306640625, 0.073272705078125, 0.1184539794921875, 0.16363525390625, 0.2088165283203125, 0.253997802734375, 0.2991790771484375, 0.3443603515625, 0.3895416259765625, 0.434722900390625, 0.4799041748046875, 0.52508544921875, 0.5702667236328125, 0.615447998046875, 0.6606292724609375, 0.705810546875, 0.7509918212890625, 0.796173095703125, 0.8413543701171875, 0.88653564453125, 0.9317169189453125, 0.976898193359375, 1.0220794677734375, 1.0672607421875, 1.1124420166015625, 1.157623291015625, 1.2028045654296875, 1.24798583984375, 1.2931671142578125, 1.338348388671875, 1.3835296630859375, 1.4287109375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 4.0, 0.0, 1.0, 4.0, 2.0, 5.0, 7.0, 12.0, 13.0, 9.0, 21.0, 34.0, 39.0, 53.0, 70.0, 92.0, 103.0, 89.0, 117.0, 81.0, 76.0, 43.0, 39.0, 25.0, 15.0, 14.0, 9.0, 4.0, 4.0, 1.0, 4.0, 8.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00116729736328125, -0.0011277049779891968, -0.0010881125926971436, -0.0010485202074050903, -0.0010089278221130371, -0.0009693354368209839, -0.0009297430515289307, -0.0008901506662368774, -0.0008505582809448242, -0.000810965895652771, -0.0007713735103607178, -0.0007317811250686646, -0.0006921887397766113, -0.0006525963544845581, -0.0006130039691925049, -0.0005734115839004517, -0.0005338191986083984, -0.0004942268133163452, -0.000454634428024292, -0.00041504204273223877, -0.00037544965744018555, -0.0003358572721481323, -0.0002962648868560791, -0.0002566725015640259, -0.00021708011627197266, -0.00017748773097991943, -0.0001378953456878662, -9.830296039581299e-05, -5.8710575103759766e-05, -1.9118189811706543e-05, 2.047419548034668e-05, 6.00665807723999e-05, 9.965896606445312e-05, 0.00013925135135650635, 0.00017884373664855957, 0.0002184361219406128, 0.000258028507232666, 0.00029762089252471924, 0.00033721327781677246, 0.0003768056631088257, 0.0004163980484008789, 0.00045599043369293213, 0.0004955828189849854, 0.0005351752042770386, 0.0005747675895690918, 0.000614359974861145, 0.0006539523601531982, 0.0006935447454452515, 0.0007331371307373047, 0.0007727295160293579, 0.0008123219013214111, 0.0008519142866134644, 0.0008915066719055176, 0.0009310990571975708, 0.000970691442489624, 0.0010102838277816772, 0.0010498762130737305, 0.0010894685983657837, 0.001129060983657837, 0.0011686533689498901, 0.0012082457542419434, 0.0012478381395339966, 0.0012874305248260498, 0.001327022910118103, 0.0013666152954101562]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 6.0, 3.0, 7.0, 4.0, 7.0, 7.0, 5.0, 7.0, 13.0, 18.0, 38.0, 27.0, 51.0, 87.0, 132.0, 255.0, 602.0, 153361.0, 892369.0, 799.0, 305.0, 145.0, 79.0, 60.0, 53.0, 37.0, 20.0, 11.0, 14.0, 12.0, 11.0, 1.0, 3.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02978515625, -0.028935909271240234, -0.02808666229248047, -0.027237415313720703, -0.026388168334960938, -0.025538921356201172, -0.024689674377441406, -0.02384042739868164, -0.022991180419921875, -0.02214193344116211, -0.021292686462402344, -0.020443439483642578, -0.019594192504882812, -0.018744945526123047, -0.01789569854736328, -0.017046451568603516, -0.01619720458984375, -0.015347957611083984, -0.014498710632324219, -0.013649463653564453, -0.012800216674804688, -0.011950969696044922, -0.011101722717285156, -0.01025247573852539, -0.009403228759765625, -0.00855398178100586, -0.007704734802246094, -0.006855487823486328, -0.0060062408447265625, -0.005156993865966797, -0.004307746887207031, -0.0034584999084472656, -0.0026092529296875, -0.0017600059509277344, -0.0009107589721679688, -6.151199340820312e-05, 0.0007877349853515625, 0.0016369819641113281, 0.0024862289428710938, 0.0033354759216308594, 0.004184722900390625, 0.005033969879150391, 0.005883216857910156, 0.006732463836669922, 0.0075817108154296875, 0.008430957794189453, 0.009280204772949219, 0.010129451751708984, 0.01097869873046875, 0.011827945709228516, 0.012677192687988281, 0.013526439666748047, 0.014375686645507812, 0.015224933624267578, 0.016074180603027344, 0.01692342758178711, 0.017772674560546875, 0.01862192153930664, 0.019471168518066406, 0.020320415496826172, 0.021169662475585938, 0.022018909454345703, 0.02286815643310547, 0.023717403411865234, 0.024566650390625]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 91.0, 635.0, 269.0, 15.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.004511009901762009, -0.004430022556334734, -0.004349035210907459, -0.004268048331141472, -0.004187060985714197, -0.0041060736402869225, -0.004025086294859648, -0.00394409941509366, -0.0038631120696663857, -0.003782124724239111, -0.00370113761164248, -0.003620150266215205, -0.003539163153618574, -0.0034581758081912994, -0.0033771886955946684, -0.0032962013501673937, -0.0032152142375707626, -0.003134226892143488, -0.003053239779546857, -0.002972252434119582, -0.002891265321522951, -0.0028102779760956764, -0.0027292908634990454, -0.0026483035180717707, -0.002567316172644496, -0.0024863288272172213, -0.00240534171462059, -0.0023243543691933155, -0.0022433672565966845, -0.0021623799111694098, -0.0020813927985727787, -0.002000405453145504, -0.0019194182241335511, -0.0018384309951215982, -0.0017574437661096454, -0.0016764565370976925, -0.0015954693080857396, -0.0015144820790737867, -0.001433494733646512, -0.001352507621049881, -0.0012715202756226063, -0.0011905330466106534, -0.0011095458175987005, -0.0010285585885867476, -0.0009475713595747948, -0.0008665841305628419, -0.0007855968433432281, -0.0007046096143312752, -0.0006236224435269833, -0.0005426352145150304, -0.0004616479855030775, -0.0003806607273872942, -0.0002996734983753413, -0.00021868626936338842, -0.00013769901124760509, -5.671178223565221e-05, 2.427544677630067e-05, 0.00010526268306421116, 0.00018624991935212165, 0.00026723716291598976, 0.00034822439192794263, 0.0004292116209398955, 0.0005101988790556788, 0.0005911861080676317, 0.0006721733370795846]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 5.0, 6.0, 7.0, 8.0, 6.0, 7.0, 11.0, 11.0, 26.0, 15.0, 17.0, 25.0, 23.0, 26.0, 30.0, 27.0, 35.0, 39.0, 35.0, 50.0, 33.0, 48.0, 36.0, 33.0, 41.0, 28.0, 47.0, 32.0, 39.0, 36.0, 34.0, 29.0, 27.0, 23.0, 10.0, 16.0, 16.0, 14.0, 10.0, 10.0, 6.0, 11.0, 11.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003864765167236328, -0.000372045673429966, -0.00035761483013629913, -0.0003431839868426323, -0.00032875314354896545, -0.0003143223002552986, -0.0002998914569616318, -0.00028546061366796494, -0.0002710297703742981, -0.00025659892708063126, -0.00024216808378696442, -0.00022773724049329758, -0.00021330639719963074, -0.0001988755539059639, -0.00018444471061229706, -0.00017001386731863022, -0.00015558302402496338, -0.00014115218073129654, -0.0001267213374376297, -0.00011229049414396286, -9.785965085029602e-05, -8.342880755662918e-05, -6.899796426296234e-05, -5.45671209692955e-05, -4.013627767562866e-05, -2.5705434381961823e-05, -1.1274591088294983e-05, 3.1562522053718567e-06, 1.7587095499038696e-05, 3.2017938792705536e-05, 4.6448782086372375e-05, 6.0879625380039215e-05, 7.531046867370605e-05, 8.97413119673729e-05, 0.00010417215526103973, 0.00011860299855470657, 0.0001330338418483734, 0.00014746468514204025, 0.0001618955284357071, 0.00017632637172937393, 0.00019075721502304077, 0.0002051880583167076, 0.00021961890161037445, 0.0002340497449040413, 0.00024848058819770813, 0.00026291143149137497, 0.0002773422747850418, 0.00029177311807870865, 0.0003062039613723755, 0.00032063480466604233, 0.00033506564795970917, 0.000349496491253376, 0.00036392733454704285, 0.0003783581778407097, 0.0003927890211343765, 0.00040721986442804337, 0.0004216507077217102, 0.00043608155101537704, 0.0004505123943090439, 0.0004649432376027107, 0.00047937408089637756, 0.0004938049241900444, 0.0005082357674837112, 0.0005226666107773781, 0.0005370974540710449]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 8.0, 4.0, 6.0, 12.0, 20.0, 12.0, 12.0, 15.0, 19.0, 25.0, 20.0, 25.0, 33.0, 29.0, 26.0, 37.0, 38.0, 47.0, 41.0, 29.0, 35.0, 33.0, 40.0, 40.0, 26.0, 40.0, 37.0, 34.0, 29.0, 28.0, 23.0, 27.0, 35.0, 10.0, 17.0, 13.0, 15.0, 14.0, 7.0, 9.0, 7.0, 7.0, 4.0, 5.0, 4.0, 1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.26171875, -7.02142333984375, -6.7811279296875, -6.54083251953125, -6.300537109375, -6.06024169921875, -5.8199462890625, -5.57965087890625, -5.33935546875, -5.09906005859375, -4.8587646484375, -4.61846923828125, -4.378173828125, -4.13787841796875, -3.8975830078125, -3.65728759765625, -3.4169921875, -3.17669677734375, -2.9364013671875, -2.69610595703125, -2.455810546875, -2.21551513671875, -1.9752197265625, -1.73492431640625, -1.49462890625, -1.25433349609375, -1.0140380859375, -0.77374267578125, -0.533447265625, -0.29315185546875, -0.0528564453125, 0.18743896484375, 0.427734375, 0.66802978515625, 0.9083251953125, 1.14862060546875, 1.388916015625, 1.62921142578125, 1.8695068359375, 2.10980224609375, 2.35009765625, 2.59039306640625, 2.8306884765625, 3.07098388671875, 3.311279296875, 3.55157470703125, 3.7918701171875, 4.03216552734375, 4.2724609375, 4.51275634765625, 4.7530517578125, 4.99334716796875, 5.233642578125, 5.47393798828125, 5.7142333984375, 5.95452880859375, 6.19482421875, 6.43511962890625, 6.6754150390625, 6.91571044921875, 7.156005859375, 7.39630126953125, 7.6365966796875, 7.87689208984375, 8.1171875]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 8.0, 6.0, 4.0, 16.0, 23.0, 18.0, 14.0, 26.0, 42.0, 38.0, 39.0, 74.0, 96.0, 129.0, 179.0, 283.0, 501.0, 1184.0, 4496.0, 29551.0, 314677.0, 631551.0, 54741.0, 7579.0, 1567.0, 570.0, 313.0, 209.0, 160.0, 101.0, 77.0, 71.0, 53.0, 23.0, 26.0, 23.0, 19.0, 15.0, 7.0, 12.0, 8.0, 8.0, 3.0, 4.0, 5.0, 0.0, 1.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.34375, -13.867919921875, -13.39208984375, -12.916259765625, -12.4404296875, -11.964599609375, -11.48876953125, -11.012939453125, -10.537109375, -10.061279296875, -9.58544921875, -9.109619140625, -8.6337890625, -8.157958984375, -7.68212890625, -7.206298828125, -6.73046875, -6.254638671875, -5.77880859375, -5.302978515625, -4.8271484375, -4.351318359375, -3.87548828125, -3.399658203125, -2.923828125, -2.447998046875, -1.97216796875, -1.496337890625, -1.0205078125, -0.544677734375, -0.06884765625, 0.406982421875, 0.8828125, 1.358642578125, 1.83447265625, 2.310302734375, 2.7861328125, 3.261962890625, 3.73779296875, 4.213623046875, 4.689453125, 5.165283203125, 5.64111328125, 6.116943359375, 6.5927734375, 7.068603515625, 7.54443359375, 8.020263671875, 8.49609375, 8.971923828125, 9.44775390625, 9.923583984375, 10.3994140625, 10.875244140625, 11.35107421875, 11.826904296875, 12.302734375, 12.778564453125, 13.25439453125, 13.730224609375, 14.2060546875, 14.681884765625, 15.15771484375, 15.633544921875, 16.109375]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 2.0, 3.0, 9.0, 4.0, 6.0, 13.0, 10.0, 17.0, 19.0, 19.0, 25.0, 21.0, 25.0, 27.0, 36.0, 42.0, 35.0, 35.0, 46.0, 67.0, 101.0, 348.0, 1519.0, 146.0, 61.0, 52.0, 39.0, 44.0, 36.0, 34.0, 31.0, 18.0, 25.0, 18.0, 14.0, 12.0, 18.0, 5.0, 10.0, 12.0, 15.0, 6.0, 6.0, 8.0, 5.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.671875, -20.953369140625, -20.23486328125, -19.516357421875, -18.7978515625, -18.079345703125, -17.36083984375, -16.642333984375, -15.923828125, -15.205322265625, -14.48681640625, -13.768310546875, -13.0498046875, -12.331298828125, -11.61279296875, -10.894287109375, -10.17578125, -9.457275390625, -8.73876953125, -8.020263671875, -7.3017578125, -6.583251953125, -5.86474609375, -5.146240234375, -4.427734375, -3.709228515625, -2.99072265625, -2.272216796875, -1.5537109375, -0.835205078125, -0.11669921875, 0.601806640625, 1.3203125, 2.038818359375, 2.75732421875, 3.475830078125, 4.1943359375, 4.912841796875, 5.63134765625, 6.349853515625, 7.068359375, 7.786865234375, 8.50537109375, 9.223876953125, 9.9423828125, 10.660888671875, 11.37939453125, 12.097900390625, 12.81640625, 13.534912109375, 14.25341796875, 14.971923828125, 15.6904296875, 16.408935546875, 17.12744140625, 17.845947265625, 18.564453125, 19.282958984375, 20.00146484375, 20.719970703125, 21.4384765625, 22.156982421875, 22.87548828125, 23.593994140625, 24.3125]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 6.0, 4.0, 7.0, 7.0, 6.0, 9.0, 16.0, 13.0, 9.0, 18.0, 17.0, 16.0, 22.0, 34.0, 33.0, 56.0, 60.0, 100.0, 147.0, 194.0, 371.0, 1020.0, 7822.0, 2972903.0, 158355.0, 2807.0, 661.0, 295.0, 193.0, 126.0, 89.0, 56.0, 43.0, 24.0, 28.0, 27.0, 25.0, 21.0, 19.0, 14.0, 10.0, 7.0, 6.0, 9.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.46875, -54.7978515625, -53.126953125, -51.4560546875, -49.78515625, -48.1142578125, -46.443359375, -44.7724609375, -43.1015625, -41.4306640625, -39.759765625, -38.0888671875, -36.41796875, -34.7470703125, -33.076171875, -31.4052734375, -29.734375, -28.0634765625, -26.392578125, -24.7216796875, -23.05078125, -21.3798828125, -19.708984375, -18.0380859375, -16.3671875, -14.6962890625, -13.025390625, -11.3544921875, -9.68359375, -8.0126953125, -6.341796875, -4.6708984375, -3.0, -1.3291015625, 0.341796875, 2.0126953125, 3.68359375, 5.3544921875, 7.025390625, 8.6962890625, 10.3671875, 12.0380859375, 13.708984375, 15.3798828125, 17.05078125, 18.7216796875, 20.392578125, 22.0634765625, 23.734375, 25.4052734375, 27.076171875, 28.7470703125, 30.41796875, 32.0888671875, 33.759765625, 35.4306640625, 37.1015625, 38.7724609375, 40.443359375, 42.1142578125, 43.78515625, 45.4560546875, 47.126953125, 48.7978515625, 50.46875]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 13.0, 60.0, 434.0, 419.0, 74.0, 15.0], "bins": [-216.2816619873047, -212.73399353027344, -209.1863250732422, -205.638671875, -202.09100341796875, -198.5433349609375, -194.99566650390625, -191.447998046875, -187.90032958984375, -184.3526611328125, -180.80499267578125, -177.25733947753906, -173.7096710205078, -170.16200256347656, -166.6143341064453, -163.06666564941406, -159.51901245117188, -155.97134399414062, -152.42367553710938, -148.8760223388672, -145.32835388183594, -141.7806854248047, -138.23301696777344, -134.6853485107422, -131.1376953125, -127.59002685546875, -124.04236602783203, -120.49469757080078, -116.94703674316406, -113.39936828613281, -109.85169982910156, -106.30403137207031, -102.7563705444336, -99.20870208740234, -95.66104125976562, -92.11337280273438, -88.56570434570312, -85.0180435180664, -81.47037506103516, -77.92271423339844, -74.37504577636719, -70.82737731933594, -67.27971649169922, -63.73204803466797, -60.184383392333984, -56.63671875, -53.08905029296875, -49.541385650634766, -45.99372100830078, -42.4460563659668, -38.89839172363281, -35.35072326660156, -31.803058624267578, -28.255393981933594, -24.707727432250977, -21.16006088256836, -17.612394332885742, -14.064728736877441, -10.51706314086914, -6.96939754486084, -3.421731948852539, 0.1259326934814453, 3.6735992431640625, 7.22126579284668, 10.768930435180664]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 3.0, 1.0, 9.0, 4.0, 11.0, 9.0, 10.0, 5.0, 7.0, 9.0, 15.0, 21.0, 24.0, 18.0, 21.0, 25.0, 31.0, 27.0, 34.0, 45.0, 36.0, 38.0, 36.0, 43.0, 43.0, 46.0, 43.0, 38.0, 44.0, 34.0, 33.0, 30.0, 31.0, 17.0, 28.0, 17.0, 20.0, 10.0, 22.0, 11.0, 11.0, 8.0, 5.0, 7.0, 6.0, 8.0, 3.0, 4.0, 3.0, 6.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-60.735069274902344, -58.828399658203125, -56.921730041503906, -55.01506042480469, -53.10839080810547, -51.20172119140625, -49.29505157470703, -47.38838195800781, -45.481712341308594, -43.575042724609375, -41.668373107910156, -39.76170349121094, -37.85503387451172, -35.9483642578125, -34.04169464111328, -32.13502502441406, -30.22835922241211, -28.32168960571289, -26.415019989013672, -24.508350372314453, -22.601680755615234, -20.695011138916016, -18.78834342956543, -16.88167381286621, -14.975004196166992, -13.068334579467773, -11.161664962768555, -9.254996299743652, -7.348326683044434, -5.441657066345215, -3.5349884033203125, -1.6283187866210938, 0.278350830078125, 2.1850202083587646, 4.091689586639404, 5.998358726501465, 7.905028343200684, 9.811697959899902, 11.718366622924805, 13.625036239624023, 15.531705856323242, 17.43837547302246, 19.34504508972168, 21.251712799072266, 23.158382415771484, 25.065052032470703, 26.971721649169922, 28.87839126586914, 30.78506088256836, 32.69173049926758, 34.5984001159668, 36.505069732666016, 38.411739349365234, 40.31840896606445, 42.225074768066406, 44.131744384765625, 46.038414001464844, 47.94508361816406, 49.85175323486328, 51.7584228515625, 53.66509246826172, 55.57176208496094, 57.478431701660156, 59.385101318359375, 61.291770935058594]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 6.0, 9.0, 8.0, 9.0, 21.0, 21.0, 17.0, 7.0, 21.0, 20.0, 30.0, 26.0, 34.0, 29.0, 43.0, 36.0, 27.0, 31.0, 32.0, 44.0, 35.0, 36.0, 39.0, 23.0, 43.0, 36.0, 34.0, 38.0, 33.0, 23.0, 30.0, 16.0, 21.0, 19.0, 12.0, 11.0, 16.0, 12.0, 13.0, 6.0, 7.0, 4.0, 4.0, 7.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-7.9140625, -7.6708984375, -7.427734375, -7.1845703125, -6.94140625, -6.6982421875, -6.455078125, -6.2119140625, -5.96875, -5.7255859375, -5.482421875, -5.2392578125, -4.99609375, -4.7529296875, -4.509765625, -4.2666015625, -4.0234375, -3.7802734375, -3.537109375, -3.2939453125, -3.05078125, -2.8076171875, -2.564453125, -2.3212890625, -2.078125, -1.8349609375, -1.591796875, -1.3486328125, -1.10546875, -0.8623046875, -0.619140625, -0.3759765625, -0.1328125, 0.1103515625, 0.353515625, 0.5966796875, 0.83984375, 1.0830078125, 1.326171875, 1.5693359375, 1.8125, 2.0556640625, 2.298828125, 2.5419921875, 2.78515625, 3.0283203125, 3.271484375, 3.5146484375, 3.7578125, 4.0009765625, 4.244140625, 4.4873046875, 4.73046875, 4.9736328125, 5.216796875, 5.4599609375, 5.703125, 5.9462890625, 6.189453125, 6.4326171875, 6.67578125, 6.9189453125, 7.162109375, 7.4052734375, 7.6484375]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 9.0, 4.0, 6.0, 7.0, 12.0, 17.0, 15.0, 17.0, 27.0, 24.0, 42.0, 62.0, 70.0, 109.0, 155.0, 363.0, 681.0, 1668.0, 6980.0, 80822.0, 2229830.0, 1806054.0, 58252.0, 5979.0, 1564.0, 610.0, 322.0, 172.0, 117.0, 85.0, 38.0, 24.0, 26.0, 17.0, 21.0, 13.0, 19.0, 11.0, 10.0, 8.0, 4.0, 3.0, 3.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.734375, -22.967529296875, -22.20068359375, -21.433837890625, -20.6669921875, -19.900146484375, -19.13330078125, -18.366455078125, -17.599609375, -16.832763671875, -16.06591796875, -15.299072265625, -14.5322265625, -13.765380859375, -12.99853515625, -12.231689453125, -11.46484375, -10.697998046875, -9.93115234375, -9.164306640625, -8.3974609375, -7.630615234375, -6.86376953125, -6.096923828125, -5.330078125, -4.563232421875, -3.79638671875, -3.029541015625, -2.2626953125, -1.495849609375, -0.72900390625, 0.037841796875, 0.8046875, 1.571533203125, 2.33837890625, 3.105224609375, 3.8720703125, 4.638916015625, 5.40576171875, 6.172607421875, 6.939453125, 7.706298828125, 8.47314453125, 9.239990234375, 10.0068359375, 10.773681640625, 11.54052734375, 12.307373046875, 13.07421875, 13.841064453125, 14.60791015625, 15.374755859375, 16.1416015625, 16.908447265625, 17.67529296875, 18.442138671875, 19.208984375, 19.975830078125, 20.74267578125, 21.509521484375, 22.2763671875, 23.043212890625, 23.81005859375, 24.576904296875, 25.34375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 13.0, 9.0, 12.0, 11.0, 12.0, 24.0, 45.0, 51.0, 67.0, 75.0, 108.0, 139.0, 174.0, 244.0, 296.0, 370.0, 408.0, 465.0, 350.0, 287.0, 228.0, 145.0, 148.0, 97.0, 61.0, 68.0, 45.0, 34.0, 21.0, 16.0, 9.0, 10.0, 8.0, 4.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-14.5546875, -14.1494140625, -13.744140625, -13.3388671875, -12.93359375, -12.5283203125, -12.123046875, -11.7177734375, -11.3125, -10.9072265625, -10.501953125, -10.0966796875, -9.69140625, -9.2861328125, -8.880859375, -8.4755859375, -8.0703125, -7.6650390625, -7.259765625, -6.8544921875, -6.44921875, -6.0439453125, -5.638671875, -5.2333984375, -4.828125, -4.4228515625, -4.017578125, -3.6123046875, -3.20703125, -2.8017578125, -2.396484375, -1.9912109375, -1.5859375, -1.1806640625, -0.775390625, -0.3701171875, 0.03515625, 0.4404296875, 0.845703125, 1.2509765625, 1.65625, 2.0615234375, 2.466796875, 2.8720703125, 3.27734375, 3.6826171875, 4.087890625, 4.4931640625, 4.8984375, 5.3037109375, 5.708984375, 6.1142578125, 6.51953125, 6.9248046875, 7.330078125, 7.7353515625, 8.140625, 8.5458984375, 8.951171875, 9.3564453125, 9.76171875, 10.1669921875, 10.572265625, 10.9775390625, 11.3828125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 6.0, 4.0, 6.0, 12.0, 10.0, 11.0, 18.0, 28.0, 32.0, 44.0, 44.0, 62.0, 75.0, 96.0, 102.0, 175.0, 221.0, 465.0, 1033.0, 7537.0, 2455691.0, 1719792.0, 6375.0, 1022.0, 438.0, 247.0, 178.0, 127.0, 98.0, 60.0, 57.0, 44.0, 35.0, 32.0, 23.0, 21.0, 14.0, 16.0, 8.0, 8.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-67.0, -64.96826171875, -62.9365234375, -60.90478515625, -58.873046875, -56.84130859375, -54.8095703125, -52.77783203125, -50.74609375, -48.71435546875, -46.6826171875, -44.65087890625, -42.619140625, -40.58740234375, -38.5556640625, -36.52392578125, -34.4921875, -32.46044921875, -30.4287109375, -28.39697265625, -26.365234375, -24.33349609375, -22.3017578125, -20.27001953125, -18.23828125, -16.20654296875, -14.1748046875, -12.14306640625, -10.111328125, -8.07958984375, -6.0478515625, -4.01611328125, -1.984375, 0.04736328125, 2.0791015625, 4.11083984375, 6.142578125, 8.17431640625, 10.2060546875, 12.23779296875, 14.26953125, 16.30126953125, 18.3330078125, 20.36474609375, 22.396484375, 24.42822265625, 26.4599609375, 28.49169921875, 30.5234375, 32.55517578125, 34.5869140625, 36.61865234375, 38.650390625, 40.68212890625, 42.7138671875, 44.74560546875, 46.77734375, 48.80908203125, 50.8408203125, 52.87255859375, 54.904296875, 56.93603515625, 58.9677734375, 60.99951171875, 63.03125]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 21.0, 256.0, 587.0, 143.0, 7.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-235.29290771484375, -227.54730224609375, -219.80169677734375, -212.05609130859375, -204.31048583984375, -196.56488037109375, -188.81927490234375, -181.07366943359375, -173.32806396484375, -165.58245849609375, -157.83685302734375, -150.09124755859375, -142.34564208984375, -134.60003662109375, -126.85443115234375, -119.10882568359375, -111.36322021484375, -103.61761474609375, -95.87200927734375, -88.12640380859375, -80.38079833984375, -72.63519287109375, -64.88958740234375, -57.14398193359375, -49.39837646484375, -41.65277099609375, -33.90716552734375, -26.16156005859375, -18.41595458984375, -10.67034912109375, -2.92474365234375, 4.82086181640625, 12.56646728515625, 20.31207275390625, 28.05767822265625, 35.80328369140625, 43.54888916015625, 51.29449462890625, 59.04010009765625, 66.78570556640625, 74.53131103515625, 82.27691650390625, 90.02252197265625, 97.76812744140625, 105.51373291015625, 113.25933837890625, 121.00494384765625, 128.75054931640625, 136.49615478515625, 144.24176025390625, 151.98736572265625, 159.73297119140625, 167.47857666015625, 175.22418212890625, 182.96978759765625, 190.71539306640625, 198.46099853515625, 206.20660400390625, 213.95220947265625, 221.69781494140625, 229.44342041015625, 237.18902587890625, 244.93463134765625, 252.68023681640625, 260.42584228515625]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 0.0, 5.0, 5.0, 10.0, 12.0, 15.0, 10.0, 16.0, 13.0, 18.0, 19.0, 24.0, 28.0, 25.0, 29.0, 33.0, 28.0, 44.0, 37.0, 31.0, 49.0, 39.0, 49.0, 34.0, 42.0, 26.0, 45.0, 39.0, 24.0, 31.0, 23.0, 25.0, 25.0, 25.0, 25.0, 14.0, 18.0, 11.0, 12.0, 13.0, 4.0, 9.0, 7.0, 5.0, 1.0, 3.0, 3.0, 2.0, 1.0, 3.0], "bins": [-52.00878143310547, -50.58837127685547, -49.16796112060547, -47.74755096435547, -46.32714080810547, -44.90673065185547, -43.48632049560547, -42.06591033935547, -40.64550018310547, -39.22509002685547, -37.80467987060547, -36.38426971435547, -34.96385955810547, -33.54344940185547, -32.12303924560547, -30.70262908935547, -29.28221893310547, -27.86180877685547, -26.44139862060547, -25.02098846435547, -23.60057830810547, -22.18016815185547, -20.75975799560547, -19.33934783935547, -17.91893768310547, -16.49852752685547, -15.078117370605469, -13.657707214355469, -12.237297058105469, -10.816886901855469, -9.396476745605469, -7.976066589355469, -6.555656433105469, -5.135246276855469, -3.7148361206054688, -2.2944259643554688, -0.8740158081054688, 0.5463943481445312, 1.9668045043945312, 3.3872146606445312, 4.807624816894531, 6.228034973144531, 7.648445129394531, 9.068855285644531, 10.489265441894531, 11.909675598144531, 13.330085754394531, 14.750495910644531, 16.17090606689453, 17.59131622314453, 19.01172637939453, 20.43213653564453, 21.85254669189453, 23.27295684814453, 24.69336700439453, 26.11377716064453, 27.53418731689453, 28.95459747314453, 30.37500762939453, 31.79541778564453, 33.21582794189453, 34.63623809814453, 36.05664825439453, 37.47705841064453, 38.89746856689453]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 8.0, 3.0, 9.0, 8.0, 8.0, 11.0, 12.0, 15.0, 15.0, 27.0, 19.0, 21.0, 22.0, 28.0, 28.0, 37.0, 23.0, 31.0, 39.0, 38.0, 46.0, 49.0, 31.0, 36.0, 31.0, 37.0, 49.0, 36.0, 31.0, 37.0, 26.0, 25.0, 25.0, 27.0, 19.0, 7.0, 18.0, 11.0, 12.0, 8.0, 8.0, 6.0, 7.0, 3.0, 1.0, 1.0, 6.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0], "bins": [-8.234375, -7.9849853515625, -7.735595703125, -7.4862060546875, -7.23681640625, -6.9874267578125, -6.738037109375, -6.4886474609375, -6.2392578125, -5.9898681640625, -5.740478515625, -5.4910888671875, -5.24169921875, -4.9923095703125, -4.742919921875, -4.4935302734375, -4.244140625, -3.9947509765625, -3.745361328125, -3.4959716796875, -3.24658203125, -2.9971923828125, -2.747802734375, -2.4984130859375, -2.2490234375, -1.9996337890625, -1.750244140625, -1.5008544921875, -1.25146484375, -1.0020751953125, -0.752685546875, -0.5032958984375, -0.25390625, -0.0045166015625, 0.244873046875, 0.4942626953125, 0.74365234375, 0.9930419921875, 1.242431640625, 1.4918212890625, 1.7412109375, 1.9906005859375, 2.239990234375, 2.4893798828125, 2.73876953125, 2.9881591796875, 3.237548828125, 3.4869384765625, 3.736328125, 3.9857177734375, 4.235107421875, 4.4844970703125, 4.73388671875, 4.9832763671875, 5.232666015625, 5.4820556640625, 5.7314453125, 5.9808349609375, 6.230224609375, 6.4796142578125, 6.72900390625, 6.9783935546875, 7.227783203125, 7.4771728515625, 7.7265625]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 4.0, 5.0, 3.0, 1.0, 7.0, 10.0, 16.0, 25.0, 32.0, 49.0, 65.0, 103.0, 148.0, 198.0, 292.0, 503.0, 806.0, 1154.0, 1748.0, 2619.0, 3979.0, 6218.0, 9787.0, 14920.0, 24021.0, 39294.0, 68080.0, 133280.0, 346729.0, 184190.0, 84446.0, 47563.0, 28426.0, 17754.0, 11317.0, 7099.0, 4725.0, 3071.0, 1993.0, 1325.0, 832.0, 575.0, 364.0, 271.0, 171.0, 121.0, 73.0, 44.0, 27.0, 25.0, 12.0, 15.0, 16.0, 6.0, 1.0, 5.0, 3.0, 0.0, 1.0, 2.0, 2.0], "bins": [-1.7158203125, -1.661651611328125, -1.60748291015625, -1.553314208984375, -1.4991455078125, -1.444976806640625, -1.39080810546875, -1.336639404296875, -1.282470703125, -1.228302001953125, -1.17413330078125, -1.119964599609375, -1.0657958984375, -1.011627197265625, -0.95745849609375, -0.903289794921875, -0.84912109375, -0.794952392578125, -0.74078369140625, -0.686614990234375, -0.6324462890625, -0.578277587890625, -0.52410888671875, -0.469940185546875, -0.415771484375, -0.361602783203125, -0.30743408203125, -0.253265380859375, -0.1990966796875, -0.144927978515625, -0.09075927734375, -0.036590576171875, 0.017578125, 0.071746826171875, 0.12591552734375, 0.180084228515625, 0.2342529296875, 0.288421630859375, 0.34259033203125, 0.396759033203125, 0.450927734375, 0.505096435546875, 0.55926513671875, 0.613433837890625, 0.6676025390625, 0.721771240234375, 0.77593994140625, 0.830108642578125, 0.88427734375, 0.938446044921875, 0.99261474609375, 1.046783447265625, 1.1009521484375, 1.155120849609375, 1.20928955078125, 1.263458251953125, 1.317626953125, 1.371795654296875, 1.42596435546875, 1.480133056640625, 1.5343017578125, 1.588470458984375, 1.64263916015625, 1.696807861328125, 1.7509765625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 0.0, 0.0, 4.0, 3.0, 2.0, 4.0, 6.0, 6.0, 7.0, 3.0, 11.0, 18.0, 13.0, 14.0, 16.0, 23.0, 24.0, 22.0, 40.0, 32.0, 36.0, 41.0, 35.0, 42.0, 41.0, 35.0, 29.0, 1062.0, 43.0, 32.0, 32.0, 39.0, 35.0, 38.0, 27.0, 23.0, 29.0, 21.0, 19.0, 16.0, 15.0, 21.0, 10.0, 15.0, 11.0, 6.0, 7.0, 5.0, 3.0, 5.0, 7.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.89453125, -4.7332763671875, -4.572021484375, -4.4107666015625, -4.24951171875, -4.0882568359375, -3.927001953125, -3.7657470703125, -3.6044921875, -3.4432373046875, -3.281982421875, -3.1207275390625, -2.95947265625, -2.7982177734375, -2.636962890625, -2.4757080078125, -2.314453125, -2.1531982421875, -1.991943359375, -1.8306884765625, -1.66943359375, -1.5081787109375, -1.346923828125, -1.1856689453125, -1.0244140625, -0.8631591796875, -0.701904296875, -0.5406494140625, -0.37939453125, -0.2181396484375, -0.056884765625, 0.1043701171875, 0.265625, 0.4268798828125, 0.588134765625, 0.7493896484375, 0.91064453125, 1.0718994140625, 1.233154296875, 1.3944091796875, 1.5556640625, 1.7169189453125, 1.878173828125, 2.0394287109375, 2.20068359375, 2.3619384765625, 2.523193359375, 2.6844482421875, 2.845703125, 3.0069580078125, 3.168212890625, 3.3294677734375, 3.49072265625, 3.6519775390625, 3.813232421875, 3.9744873046875, 4.1357421875, 4.2969970703125, 4.458251953125, 4.6195068359375, 4.78076171875, 4.9420166015625, 5.103271484375, 5.2645263671875, 5.42578125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 9.0, 11.0, 9.0, 13.0, 32.0, 32.0, 47.0, 66.0, 91.0, 157.0, 190.0, 277.0, 455.0, 572.0, 871.0, 1235.0, 1767.0, 2571.0, 3735.0, 5401.0, 8205.0, 11949.0, 18275.0, 28510.0, 45361.0, 75993.0, 135381.0, 1338591.0, 174302.0, 91029.0, 54434.0, 33591.0, 21157.0, 14007.0, 9027.0, 6189.0, 4123.0, 2909.0, 1962.0, 1377.0, 970.0, 659.0, 510.0, 312.0, 225.0, 166.0, 120.0, 77.0, 53.0, 52.0, 26.0, 25.0, 8.0, 12.0, 5.0, 2.0, 3.0, 3.0, 0.0, 3.0], "bins": [-1.486328125, -1.43939208984375, -1.3924560546875, -1.34552001953125, -1.298583984375, -1.25164794921875, -1.2047119140625, -1.15777587890625, -1.11083984375, -1.06390380859375, -1.0169677734375, -0.97003173828125, -0.923095703125, -0.87615966796875, -0.8292236328125, -0.78228759765625, -0.7353515625, -0.68841552734375, -0.6414794921875, -0.59454345703125, -0.547607421875, -0.50067138671875, -0.4537353515625, -0.40679931640625, -0.35986328125, -0.31292724609375, -0.2659912109375, -0.21905517578125, -0.172119140625, -0.12518310546875, -0.0782470703125, -0.03131103515625, 0.015625, 0.06256103515625, 0.1094970703125, 0.15643310546875, 0.203369140625, 0.25030517578125, 0.2972412109375, 0.34417724609375, 0.39111328125, 0.43804931640625, 0.4849853515625, 0.53192138671875, 0.578857421875, 0.62579345703125, 0.6727294921875, 0.71966552734375, 0.7666015625, 0.81353759765625, 0.8604736328125, 0.90740966796875, 0.954345703125, 1.00128173828125, 1.0482177734375, 1.09515380859375, 1.14208984375, 1.18902587890625, 1.2359619140625, 1.28289794921875, 1.329833984375, 1.37677001953125, 1.4237060546875, 1.47064208984375, 1.517578125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 5.0, 9.0, 8.0, 5.0, 21.0, 17.0, 17.0, 23.0, 38.0, 42.0, 63.0, 67.0, 70.0, 93.0, 99.0, 77.0, 69.0, 58.0, 40.0, 45.0, 31.0, 24.0, 18.0, 15.0, 8.0, 12.0, 3.0, 6.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000896453857421875, -0.0008655339479446411, -0.0008346140384674072, -0.0008036941289901733, -0.0007727742195129395, -0.0007418543100357056, -0.0007109344005584717, -0.0006800144910812378, -0.0006490945816040039, -0.00061817467212677, -0.0005872547626495361, -0.0005563348531723022, -0.0005254149436950684, -0.0004944950342178345, -0.0004635751247406006, -0.0004326552152633667, -0.0004017353057861328, -0.0003708153963088989, -0.00033989548683166504, -0.00030897557735443115, -0.00027805566787719727, -0.0002471357583999634, -0.0002162158489227295, -0.0001852959394454956, -0.00015437602996826172, -0.00012345612049102783, -9.253621101379395e-05, -6.161630153656006e-05, -3.069639205932617e-05, 2.2351741790771484e-07, 3.11434268951416e-05, 6.206333637237549e-05, 9.298324584960938e-05, 0.00012390315532684326, 0.00015482306480407715, 0.00018574297428131104, 0.00021666288375854492, 0.0002475827932357788, 0.0002785027027130127, 0.0003094226121902466, 0.00034034252166748047, 0.00037126243114471436, 0.00040218234062194824, 0.00043310225009918213, 0.000464022159576416, 0.0004949420690536499, 0.0005258619785308838, 0.0005567818880081177, 0.0005877017974853516, 0.0006186217069625854, 0.0006495416164398193, 0.0006804615259170532, 0.0007113814353942871, 0.000742301344871521, 0.0007732212543487549, 0.0008041411638259888, 0.0008350610733032227, 0.0008659809827804565, 0.0008969008922576904, 0.0009278208017349243, 0.0009587407112121582, 0.000989660620689392, 0.001020580530166626, 0.0010515004396438599, 0.0010824203491210938]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 2.0, 10.0, 11.0, 17.0, 23.0, 27.0, 32.0, 61.0, 90.0, 141.0, 276.0, 751.0, 732384.0, 313414.0, 690.0, 236.0, 125.0, 80.0, 42.0, 43.0, 23.0, 23.0, 8.0, 11.0, 9.0, 2.0, 3.0, 10.0, 3.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0291900634765625, -0.02837848663330078, -0.027566909790039062, -0.026755332946777344, -0.025943756103515625, -0.025132179260253906, -0.024320602416992188, -0.02350902557373047, -0.02269744873046875, -0.02188587188720703, -0.021074295043945312, -0.020262718200683594, -0.019451141357421875, -0.018639564514160156, -0.017827987670898438, -0.01701641082763672, -0.016204833984375, -0.015393257141113281, -0.014581680297851562, -0.013770103454589844, -0.012958526611328125, -0.012146949768066406, -0.011335372924804688, -0.010523796081542969, -0.00971221923828125, -0.008900642395019531, -0.008089065551757812, -0.007277488708496094, -0.006465911865234375, -0.005654335021972656, -0.0048427581787109375, -0.004031181335449219, -0.0032196044921875, -0.0024080276489257812, -0.0015964508056640625, -0.0007848739624023438, 2.6702880859375e-05, 0.0008382797241210938, 0.0016498565673828125, 0.0024614334106445312, 0.00327301025390625, 0.004084587097167969, 0.0048961639404296875, 0.005707740783691406, 0.006519317626953125, 0.007330894470214844, 0.008142471313476562, 0.008954048156738281, 0.009765625, 0.010577201843261719, 0.011388778686523438, 0.012200355529785156, 0.013011932373046875, 0.013823509216308594, 0.014635086059570312, 0.015446662902832031, 0.01625823974609375, 0.01706981658935547, 0.017881393432617188, 0.018692970275878906, 0.019504547119140625, 0.020316123962402344, 0.021127700805664062, 0.02193927764892578, 0.0227508544921875]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 11.0, 14.0, 92.0, 261.0, 352.0, 201.0, 63.0, 18.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008420677040703595, -0.0008044264977797866, -0.0007667853496968746, -0.0007291441434063017, -0.0006915029371157289, -0.0006538617890328169, -0.000616220582742244, -0.0005785793764516711, -0.0005409382283687592, -0.0005032970220781863, -0.0004656558739952743, -0.0004280146677047014, -0.000390373490517959, -0.0003527323133312166, -0.0003150911070406437, -0.00027744992985390127, -0.00023980875266715884, -0.00020216757548041642, -0.00016452638374175876, -0.0001268851920031011, -8.924401481635869e-05, -5.160283762961626e-05, -1.3961645890958607e-05, 2.3679545847699046e-05, 6.132072303444147e-05, 9.896190749714151e-05, 0.00013660309195984155, 0.0001742442836984992, 0.00021188546088524163, 0.00024952663807198405, 0.00028716784436255693, 0.00032480902154929936, 0.00036245014052838087, 0.0004000913177151233, 0.0004377324949018657, 0.0004753737011924386, 0.0005130148492753506, 0.0005506560555659235, 0.0005882972618564963, 0.0006259384099394083, 0.0006635796162299812, 0.0007012208225205541, 0.000738861970603466, 0.0007765031768940389, 0.0008141443831846118, 0.0008517855312675238, 0.0008894267375580966, 0.0009270679438486695, 0.0009647090919315815, 0.0010023502400144935, 0.0010399915045127273, 0.0010776326525956392, 0.0011152738006785512, 0.0011529149487614632, 0.001190556213259697, 0.001228197361342609, 0.001265838509425521, 0.0013034796575084329, 0.0013411209220066667, 0.0013787620700895786, 0.0014164032181724906, 0.0014540443662554026, 0.0014916856307536364, 0.0015293267788365483, 0.0015669680433347821]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 7.0, 3.0, 7.0, 4.0, 9.0, 13.0, 9.0, 11.0, 14.0, 15.0, 31.0, 33.0, 20.0, 19.0, 28.0, 33.0, 34.0, 35.0, 28.0, 39.0, 31.0, 42.0, 46.0, 24.0, 39.0, 40.0, 41.0, 29.0, 25.0, 31.0, 24.0, 30.0, 25.0, 28.0, 17.0, 21.0, 24.0, 24.0, 7.0, 13.0, 10.0, 10.0, 5.0, 8.0, 9.0, 3.0, 1.0, 6.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00035506486892700195, -0.00034347549080848694, -0.0003318861126899719, -0.0003202967345714569, -0.0003087073564529419, -0.0002971179783344269, -0.00028552860021591187, -0.00027393922209739685, -0.00026234984397888184, -0.0002507604658603668, -0.0002391710877418518, -0.0002275817096233368, -0.00021599233150482178, -0.00020440295338630676, -0.00019281357526779175, -0.00018122419714927673, -0.00016963481903076172, -0.0001580454409122467, -0.0001464560627937317, -0.00013486668467521667, -0.00012327730655670166, -0.00011168792843818665, -0.00010009855031967163, -8.850917220115662e-05, -7.69197940826416e-05, -6.533041596412659e-05, -5.374103784561157e-05, -4.215165972709656e-05, -3.056228160858154e-05, -1.897290349006653e-05, -7.383525371551514e-06, 4.205852746963501e-06, 1.5795230865478516e-05, 2.738460898399353e-05, 3.8973987102508545e-05, 5.056336522102356e-05, 6.215274333953857e-05, 7.374212145805359e-05, 8.53314995765686e-05, 9.692087769508362e-05, 0.00010851025581359863, 0.00012009963393211365, 0.00013168901205062866, 0.00014327839016914368, 0.0001548677682876587, 0.0001664571464061737, 0.00017804652452468872, 0.00018963590264320374, 0.00020122528076171875, 0.00021281465888023376, 0.00022440403699874878, 0.0002359934151172638, 0.0002475827932357788, 0.0002591721713542938, 0.00027076154947280884, 0.00028235092759132385, 0.00029394030570983887, 0.0003055296838283539, 0.0003171190619468689, 0.0003287084400653839, 0.0003402978181838989, 0.00035188719630241394, 0.00036347657442092896, 0.00037506595253944397, 0.000386655330657959]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 8.0, 3.0, 9.0, 8.0, 8.0, 11.0, 12.0, 15.0, 15.0, 27.0, 19.0, 21.0, 22.0, 28.0, 28.0, 37.0, 23.0, 31.0, 39.0, 38.0, 45.0, 50.0, 31.0, 36.0, 31.0, 37.0, 49.0, 36.0, 31.0, 37.0, 26.0, 25.0, 25.0, 27.0, 19.0, 7.0, 18.0, 11.0, 12.0, 8.0, 8.0, 6.0, 7.0, 3.0, 1.0, 1.0, 6.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0], "bins": [-8.234375, -7.9849853515625, -7.735595703125, -7.4862060546875, -7.23681640625, -6.9874267578125, -6.738037109375, -6.4886474609375, -6.2392578125, -5.9898681640625, -5.740478515625, -5.4910888671875, -5.24169921875, -4.9923095703125, -4.742919921875, -4.4935302734375, -4.244140625, -3.9947509765625, -3.745361328125, -3.4959716796875, -3.24658203125, -2.9971923828125, -2.747802734375, -2.4984130859375, -2.2490234375, -1.9996337890625, -1.750244140625, -1.5008544921875, -1.25146484375, -1.0020751953125, -0.752685546875, -0.5032958984375, -0.25390625, -0.0045166015625, 0.244873046875, 0.4942626953125, 0.74365234375, 0.9930419921875, 1.242431640625, 1.4918212890625, 1.7412109375, 1.9906005859375, 2.239990234375, 2.4893798828125, 2.73876953125, 2.9881591796875, 3.237548828125, 3.4869384765625, 3.736328125, 3.9857177734375, 4.235107421875, 4.4844970703125, 4.73388671875, 4.9832763671875, 5.232666015625, 5.4820556640625, 5.7314453125, 5.9808349609375, 6.230224609375, 6.4796142578125, 6.72900390625, 6.9783935546875, 7.227783203125, 7.4771728515625, 7.7265625]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 9.0, 11.0, 11.0, 20.0, 17.0, 21.0, 23.0, 36.0, 37.0, 63.0, 66.0, 81.0, 124.0, 162.0, 184.0, 278.0, 400.0, 554.0, 857.0, 1765.0, 4994.0, 24020.0, 455720.0, 523607.0, 25597.0, 5027.0, 1790.0, 892.0, 580.0, 396.0, 304.0, 213.0, 166.0, 126.0, 108.0, 59.0, 43.0, 40.0, 35.0, 29.0, 15.0, 17.0, 11.0, 9.0, 8.0, 5.0, 2.0, 10.0, 4.0, 2.0, 2.0, 5.0, 1.0, 1.0], "bins": [-20.828125, -20.197265625, -19.56640625, -18.935546875, -18.3046875, -17.673828125, -17.04296875, -16.412109375, -15.78125, -15.150390625, -14.51953125, -13.888671875, -13.2578125, -12.626953125, -11.99609375, -11.365234375, -10.734375, -10.103515625, -9.47265625, -8.841796875, -8.2109375, -7.580078125, -6.94921875, -6.318359375, -5.6875, -5.056640625, -4.42578125, -3.794921875, -3.1640625, -2.533203125, -1.90234375, -1.271484375, -0.640625, -0.009765625, 0.62109375, 1.251953125, 1.8828125, 2.513671875, 3.14453125, 3.775390625, 4.40625, 5.037109375, 5.66796875, 6.298828125, 6.9296875, 7.560546875, 8.19140625, 8.822265625, 9.453125, 10.083984375, 10.71484375, 11.345703125, 11.9765625, 12.607421875, 13.23828125, 13.869140625, 14.5, 15.130859375, 15.76171875, 16.392578125, 17.0234375, 17.654296875, 18.28515625, 18.916015625, 19.546875]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 5.0, 10.0, 5.0, 11.0, 11.0, 16.0, 17.0, 12.0, 21.0, 31.0, 30.0, 35.0, 36.0, 39.0, 45.0, 47.0, 56.0, 95.0, 1604.0, 385.0, 79.0, 59.0, 59.0, 30.0, 27.0, 38.0, 36.0, 33.0, 33.0, 21.0, 14.0, 16.0, 20.0, 15.0, 14.0, 19.0, 6.0, 8.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-27.78125, -27.0078125, -26.234375, -25.4609375, -24.6875, -23.9140625, -23.140625, -22.3671875, -21.59375, -20.8203125, -20.046875, -19.2734375, -18.5, -17.7265625, -16.953125, -16.1796875, -15.40625, -14.6328125, -13.859375, -13.0859375, -12.3125, -11.5390625, -10.765625, -9.9921875, -9.21875, -8.4453125, -7.671875, -6.8984375, -6.125, -5.3515625, -4.578125, -3.8046875, -3.03125, -2.2578125, -1.484375, -0.7109375, 0.0625, 0.8359375, 1.609375, 2.3828125, 3.15625, 3.9296875, 4.703125, 5.4765625, 6.25, 7.0234375, 7.796875, 8.5703125, 9.34375, 10.1171875, 10.890625, 11.6640625, 12.4375, 13.2109375, 13.984375, 14.7578125, 15.53125, 16.3046875, 17.078125, 17.8515625, 18.625, 19.3984375, 20.171875, 20.9453125, 21.71875]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 6.0, 9.0, 6.0, 17.0, 15.0, 16.0, 21.0, 20.0, 22.0, 30.0, 42.0, 46.0, 55.0, 82.0, 91.0, 153.0, 260.0, 740.0, 7340.0, 3109801.0, 24894.0, 1055.0, 314.0, 177.0, 116.0, 75.0, 64.0, 54.0, 37.0, 31.0, 19.0, 16.0, 18.0, 10.0, 14.0, 7.0, 9.0, 6.0, 5.0, 5.0, 4.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-66.8125, -64.5576171875, -62.302734375, -60.0478515625, -57.79296875, -55.5380859375, -53.283203125, -51.0283203125, -48.7734375, -46.5185546875, -44.263671875, -42.0087890625, -39.75390625, -37.4990234375, -35.244140625, -32.9892578125, -30.734375, -28.4794921875, -26.224609375, -23.9697265625, -21.71484375, -19.4599609375, -17.205078125, -14.9501953125, -12.6953125, -10.4404296875, -8.185546875, -5.9306640625, -3.67578125, -1.4208984375, 0.833984375, 3.0888671875, 5.34375, 7.5986328125, 9.853515625, 12.1083984375, 14.36328125, 16.6181640625, 18.873046875, 21.1279296875, 23.3828125, 25.6376953125, 27.892578125, 30.1474609375, 32.40234375, 34.6572265625, 36.912109375, 39.1669921875, 41.421875, 43.6767578125, 45.931640625, 48.1865234375, 50.44140625, 52.6962890625, 54.951171875, 57.2060546875, 59.4609375, 61.7158203125, 63.970703125, 66.2255859375, 68.48046875, 70.7353515625, 72.990234375, 75.2451171875, 77.5]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 76.0, 394.0, 420.0, 109.0, 11.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.291587829589844, -25.947967529296875, -23.604345321655273, -21.260723114013672, -18.917102813720703, -16.573482513427734, -14.229860305786133, -11.886238098144531, -9.542617797851562, -7.198996543884277, -4.855375289916992, -2.511754035949707, -0.16813278198242188, 2.1754884719848633, 4.519109725952148, 6.86273193359375, 9.206352233886719, 11.549973487854004, 13.893594741821289, 16.23721694946289, 18.58083724975586, 20.924457550048828, 23.26807975769043, 25.61170196533203, 27.955322265625, 30.29894256591797, 32.64256286621094, 34.98618698120117, 37.32980728149414, 39.67342758178711, 42.017051696777344, 44.36067199707031, 46.70428466796875, 49.04790496826172, 51.39152526855469, 53.73514938354492, 56.07876968383789, 58.42238998413086, 60.766014099121094, 63.10963439941406, 65.45325469970703, 67.796875, 70.14049530029297, 72.48411560058594, 74.82774353027344, 77.1713638305664, 79.51498413085938, 81.85860443115234, 84.20222473144531, 86.54584503173828, 88.88946533203125, 91.23308563232422, 93.57670593261719, 95.92033386230469, 98.26395416259766, 100.60757446289062, 102.9511947631836, 105.29481506347656, 107.63843536376953, 109.9820556640625, 112.32568359375, 114.66930389404297, 117.01292419433594, 119.3565444946289, 121.70016479492188]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 9.0, 6.0, 5.0, 5.0, 3.0, 13.0, 19.0, 7.0, 21.0, 18.0, 21.0, 21.0, 35.0, 24.0, 26.0, 41.0, 41.0, 35.0, 39.0, 44.0, 44.0, 37.0, 47.0, 55.0, 33.0, 38.0, 44.0, 37.0, 21.0, 32.0, 28.0, 24.0, 21.0, 15.0, 14.0, 11.0, 10.0, 8.0, 12.0, 8.0, 3.0, 9.0, 3.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-62.37874984741211, -60.472957611083984, -58.56716537475586, -56.661373138427734, -54.75558090209961, -52.849788665771484, -50.94399642944336, -49.038204193115234, -47.13241195678711, -45.226619720458984, -43.32082748413086, -41.415035247802734, -39.50924301147461, -37.603450775146484, -35.69765853881836, -33.791866302490234, -31.886072158813477, -29.98027992248535, -28.074487686157227, -26.1686954498291, -24.262903213500977, -22.35710906982422, -20.451316833496094, -18.54552459716797, -16.639732360839844, -14.733940124511719, -12.828147888183594, -10.922355651855469, -9.016563415527344, -7.110770225524902, -5.204977989196777, -3.2991857528686523, -1.3933944702148438, 0.5123978853225708, 2.4181902408599854, 4.3239827156066895, 6.2297749519348145, 8.135567665100098, 10.041359901428223, 11.947152137756348, 13.852944374084473, 15.758736610412598, 17.66452980041504, 19.570322036743164, 21.47611427307129, 23.381906509399414, 25.28769874572754, 27.193490982055664, 29.09928321838379, 31.005075454711914, 32.91086959838867, 34.8166618347168, 36.72245407104492, 38.62824630737305, 40.53403854370117, 42.4398307800293, 44.34562301635742, 46.25141525268555, 48.15720748901367, 50.0629997253418, 51.96879196166992, 53.87458419799805, 55.78037643432617, 57.6861686706543, 59.59196090698242]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 11.0, 2.0, 4.0, 6.0, 10.0, 7.0, 12.0, 13.0, 12.0, 13.0, 25.0, 22.0, 13.0, 23.0, 21.0, 28.0, 30.0, 39.0, 36.0, 38.0, 32.0, 37.0, 31.0, 45.0, 42.0, 31.0, 35.0, 34.0, 43.0, 40.0, 31.0, 32.0, 24.0, 32.0, 30.0, 26.0, 11.0, 7.0, 18.0, 13.0, 6.0, 9.0, 11.0, 3.0, 2.0, 8.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0], "bins": [-8.2109375, -7.95928955078125, -7.7076416015625, -7.45599365234375, -7.204345703125, -6.95269775390625, -6.7010498046875, -6.44940185546875, -6.19775390625, -5.94610595703125, -5.6944580078125, -5.44281005859375, -5.191162109375, -4.93951416015625, -4.6878662109375, -4.43621826171875, -4.1845703125, -3.93292236328125, -3.6812744140625, -3.42962646484375, -3.177978515625, -2.92633056640625, -2.6746826171875, -2.42303466796875, -2.17138671875, -1.91973876953125, -1.6680908203125, -1.41644287109375, -1.164794921875, -0.91314697265625, -0.6614990234375, -0.40985107421875, -0.158203125, 0.09344482421875, 0.3450927734375, 0.59674072265625, 0.848388671875, 1.10003662109375, 1.3516845703125, 1.60333251953125, 1.85498046875, 2.10662841796875, 2.3582763671875, 2.60992431640625, 2.861572265625, 3.11322021484375, 3.3648681640625, 3.61651611328125, 3.8681640625, 4.11981201171875, 4.3714599609375, 4.62310791015625, 4.874755859375, 5.12640380859375, 5.3780517578125, 5.62969970703125, 5.88134765625, 6.13299560546875, 6.3846435546875, 6.63629150390625, 6.887939453125, 7.13958740234375, 7.3912353515625, 7.64288330078125, 7.89453125]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 2.0, 4.0, 7.0, 10.0, 18.0, 16.0, 18.0, 28.0, 16.0, 43.0, 44.0, 69.0, 87.0, 129.0, 159.0, 219.0, 352.0, 627.0, 1592.0, 4650.0, 22668.0, 427736.0, 3118499.0, 580494.0, 27695.0, 5328.0, 1750.0, 820.0, 403.0, 203.0, 149.0, 105.0, 62.0, 71.0, 52.0, 32.0, 28.0, 23.0, 19.0, 17.0, 16.0, 9.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.875, -19.1787109375, -18.482421875, -17.7861328125, -17.08984375, -16.3935546875, -15.697265625, -15.0009765625, -14.3046875, -13.6083984375, -12.912109375, -12.2158203125, -11.51953125, -10.8232421875, -10.126953125, -9.4306640625, -8.734375, -8.0380859375, -7.341796875, -6.6455078125, -5.94921875, -5.2529296875, -4.556640625, -3.8603515625, -3.1640625, -2.4677734375, -1.771484375, -1.0751953125, -0.37890625, 0.3173828125, 1.013671875, 1.7099609375, 2.40625, 3.1025390625, 3.798828125, 4.4951171875, 5.19140625, 5.8876953125, 6.583984375, 7.2802734375, 7.9765625, 8.6728515625, 9.369140625, 10.0654296875, 10.76171875, 11.4580078125, 12.154296875, 12.8505859375, 13.546875, 14.2431640625, 14.939453125, 15.6357421875, 16.33203125, 17.0283203125, 17.724609375, 18.4208984375, 19.1171875, 19.8134765625, 20.509765625, 21.2060546875, 21.90234375, 22.5986328125, 23.294921875, 23.9912109375, 24.6875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 1.0, 12.0, 10.0, 18.0, 30.0, 50.0, 64.0, 118.0, 205.0, 321.0, 454.0, 680.0, 687.0, 523.0, 316.0, 222.0, 121.0, 78.0, 54.0, 41.0, 32.0, 4.0, 13.0, 9.0, 3.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.96875, -19.365478515625, -18.76220703125, -18.158935546875, -17.5556640625, -16.952392578125, -16.34912109375, -15.745849609375, -15.142578125, -14.539306640625, -13.93603515625, -13.332763671875, -12.7294921875, -12.126220703125, -11.52294921875, -10.919677734375, -10.31640625, -9.713134765625, -9.10986328125, -8.506591796875, -7.9033203125, -7.300048828125, -6.69677734375, -6.093505859375, -5.490234375, -4.886962890625, -4.28369140625, -3.680419921875, -3.0771484375, -2.473876953125, -1.87060546875, -1.267333984375, -0.6640625, -0.060791015625, 0.54248046875, 1.145751953125, 1.7490234375, 2.352294921875, 2.95556640625, 3.558837890625, 4.162109375, 4.765380859375, 5.36865234375, 5.971923828125, 6.5751953125, 7.178466796875, 7.78173828125, 8.385009765625, 8.98828125, 9.591552734375, 10.19482421875, 10.798095703125, 11.4013671875, 12.004638671875, 12.60791015625, 13.211181640625, 13.814453125, 14.417724609375, 15.02099609375, 15.624267578125, 16.2275390625, 16.830810546875, 17.43408203125, 18.037353515625, 18.640625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 4.0, 6.0, 7.0, 4.0, 4.0, 14.0, 13.0, 17.0, 24.0, 32.0, 25.0, 32.0, 41.0, 57.0, 61.0, 92.0, 92.0, 146.0, 192.0, 354.0, 694.0, 1757.0, 12037.0, 1104237.0, 3048923.0, 20963.0, 2381.0, 826.0, 353.0, 217.0, 152.0, 106.0, 87.0, 81.0, 54.0, 36.0, 32.0, 28.0, 25.0, 11.0, 16.0, 10.0, 15.0, 5.0, 5.0, 8.0, 1.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-49.46875, -47.92724609375, -46.3857421875, -44.84423828125, -43.302734375, -41.76123046875, -40.2197265625, -38.67822265625, -37.13671875, -35.59521484375, -34.0537109375, -32.51220703125, -30.970703125, -29.42919921875, -27.8876953125, -26.34619140625, -24.8046875, -23.26318359375, -21.7216796875, -20.18017578125, -18.638671875, -17.09716796875, -15.5556640625, -14.01416015625, -12.47265625, -10.93115234375, -9.3896484375, -7.84814453125, -6.306640625, -4.76513671875, -3.2236328125, -1.68212890625, -0.140625, 1.40087890625, 2.9423828125, 4.48388671875, 6.025390625, 7.56689453125, 9.1083984375, 10.64990234375, 12.19140625, 13.73291015625, 15.2744140625, 16.81591796875, 18.357421875, 19.89892578125, 21.4404296875, 22.98193359375, 24.5234375, 26.06494140625, 27.6064453125, 29.14794921875, 30.689453125, 32.23095703125, 33.7724609375, 35.31396484375, 36.85546875, 38.39697265625, 39.9384765625, 41.47998046875, 43.021484375, 44.56298828125, 46.1044921875, 47.64599609375, 49.1875]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 225.0, 768.0, 20.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.37764739990234, -77.55697631835938, -62.736297607421875, -47.91562271118164, -33.094947814941406, -18.274269104003906, -3.4535980224609375, 11.367073059082031, 26.18775177001953, 41.008426666259766, 55.8291015625, 70.6497802734375, 85.47045135498047, 100.29113006591797, 115.11180114746094, 129.93246459960938, 144.75314331054688, 159.57382202148438, 174.39450073242188, 189.2151641845703, 204.0358428955078, 218.8565216064453, 233.67718505859375, 248.49786376953125, 263.31854248046875, 278.13922119140625, 292.95989990234375, 307.78057861328125, 322.60125732421875, 337.42193603515625, 352.2425842285156, 367.0632629394531, 381.88397216796875, 396.70465087890625, 411.52532958984375, 426.34600830078125, 441.16668701171875, 455.98736572265625, 470.8080139160156, 485.6286926269531, 500.4493713378906, 515.27001953125, 530.0906982421875, 544.911376953125, 559.7320556640625, 574.552734375, 589.3734130859375, 604.194091796875, 619.0147705078125, 633.83544921875, 648.6561279296875, 663.476806640625, 678.2974853515625, 693.1181640625, 707.9388427734375, 722.759521484375, 737.5802001953125, 752.40087890625, 767.2215576171875, 782.042236328125, 796.8629150390625, 811.68359375, 826.5042724609375, 841.324951171875, 856.1455688476562]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 4.0, 6.0, 9.0, 2.0, 6.0, 6.0, 10.0, 15.0, 17.0, 15.0, 18.0, 26.0, 27.0, 26.0, 25.0, 26.0, 44.0, 36.0, 36.0, 47.0, 36.0, 42.0, 33.0, 51.0, 42.0, 37.0, 39.0, 41.0, 30.0, 37.0, 23.0, 26.0, 28.0, 24.0, 22.0, 14.0, 15.0, 16.0, 18.0, 6.0, 5.0, 5.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-44.5260009765625, -43.06352233886719, -41.601043701171875, -40.13856506347656, -38.67608642578125, -37.2136116027832, -35.75113296508789, -34.28865432739258, -32.826175689697266, -31.363697052001953, -29.90121841430664, -28.43874168395996, -26.97626304626465, -25.513784408569336, -24.051307678222656, -22.588829040527344, -21.12635040283203, -19.66387176513672, -18.201393127441406, -16.738916397094727, -15.276437759399414, -13.813959121704102, -12.351481437683105, -10.88900375366211, -9.426525115966797, -7.964046955108643, -6.501568794250488, -5.039090633392334, -3.5766124725341797, -2.1141343116760254, -0.6516561508178711, 0.810821533203125, 2.2733001708984375, 3.735778331756592, 5.198256492614746, 6.6607346534729, 8.123212814331055, 9.585691452026367, 11.048169136047363, 12.51064682006836, 13.973125457763672, 15.435604095458984, 16.898082733154297, 18.360559463500977, 19.82303810119629, 21.2855167388916, 22.74799346923828, 24.210472106933594, 25.672950744628906, 27.13542938232422, 28.59790802001953, 30.06038475036621, 31.522863388061523, 32.9853401184082, 34.447818756103516, 35.91029739379883, 37.37277603149414, 38.83525466918945, 40.297733306884766, 41.76021194458008, 43.222686767578125, 44.68516540527344, 46.14764404296875, 47.61012268066406, 49.072601318359375]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 3.0, 3.0, 5.0, 5.0, 10.0, 13.0, 11.0, 17.0, 13.0, 17.0, 15.0, 22.0, 27.0, 22.0, 31.0, 31.0, 29.0, 34.0, 43.0, 46.0, 35.0, 39.0, 43.0, 31.0, 46.0, 35.0, 43.0, 40.0, 35.0, 33.0, 26.0, 25.0, 31.0, 18.0, 18.0, 17.0, 13.0, 18.0, 10.0, 9.0, 8.0, 8.0, 8.0, 3.0, 7.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6953125, -8.43634033203125, -8.1773681640625, -7.91839599609375, -7.659423828125, -7.40045166015625, -7.1414794921875, -6.88250732421875, -6.62353515625, -6.36456298828125, -6.1055908203125, -5.84661865234375, -5.587646484375, -5.32867431640625, -5.0697021484375, -4.81072998046875, -4.5517578125, -4.29278564453125, -4.0338134765625, -3.77484130859375, -3.515869140625, -3.25689697265625, -2.9979248046875, -2.73895263671875, -2.47998046875, -2.22100830078125, -1.9620361328125, -1.70306396484375, -1.444091796875, -1.18511962890625, -0.9261474609375, -0.66717529296875, -0.408203125, -0.14923095703125, 0.1097412109375, 0.36871337890625, 0.627685546875, 0.88665771484375, 1.1456298828125, 1.40460205078125, 1.66357421875, 1.92254638671875, 2.1815185546875, 2.44049072265625, 2.699462890625, 2.95843505859375, 3.2174072265625, 3.47637939453125, 3.7353515625, 3.99432373046875, 4.2532958984375, 4.51226806640625, 4.771240234375, 5.03021240234375, 5.2891845703125, 5.54815673828125, 5.80712890625, 6.06610107421875, 6.3250732421875, 6.58404541015625, 6.843017578125, 7.10198974609375, 7.3609619140625, 7.61993408203125, 7.87890625]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 6.0, 9.0, 16.0, 23.0, 49.0, 62.0, 84.0, 108.0, 167.0, 221.0, 295.0, 382.0, 595.0, 826.0, 1199.0, 1580.0, 2293.0, 3255.0, 4727.0, 6705.0, 9895.0, 14560.0, 21248.0, 32486.0, 50981.0, 84485.0, 155435.0, 275613.0, 149932.0, 82759.0, 49638.0, 31854.0, 20924.0, 14144.0, 9707.0, 6673.0, 4605.0, 3245.0, 2195.0, 1570.0, 1128.0, 812.0, 599.0, 427.0, 310.0, 238.0, 142.0, 103.0, 73.0, 49.0, 35.0, 23.0, 28.0, 12.0, 10.0, 6.0, 6.0, 4.0, 6.0, 2.0, 3.0], "bins": [-1.38671875, -1.341217041015625, -1.29571533203125, -1.250213623046875, -1.2047119140625, -1.159210205078125, -1.11370849609375, -1.068206787109375, -1.022705078125, -0.977203369140625, -0.93170166015625, -0.886199951171875, -0.8406982421875, -0.795196533203125, -0.74969482421875, -0.704193115234375, -0.65869140625, -0.613189697265625, -0.56768798828125, -0.522186279296875, -0.4766845703125, -0.431182861328125, -0.38568115234375, -0.340179443359375, -0.294677734375, -0.249176025390625, -0.20367431640625, -0.158172607421875, -0.1126708984375, -0.067169189453125, -0.02166748046875, 0.023834228515625, 0.0693359375, 0.114837646484375, 0.16033935546875, 0.205841064453125, 0.2513427734375, 0.296844482421875, 0.34234619140625, 0.387847900390625, 0.433349609375, 0.478851318359375, 0.52435302734375, 0.569854736328125, 0.6153564453125, 0.660858154296875, 0.70635986328125, 0.751861572265625, 0.79736328125, 0.842864990234375, 0.88836669921875, 0.933868408203125, 0.9793701171875, 1.024871826171875, 1.07037353515625, 1.115875244140625, 1.161376953125, 1.206878662109375, 1.25238037109375, 1.297882080078125, 1.3433837890625, 1.388885498046875, 1.43438720703125, 1.479888916015625, 1.525390625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 1.0, 3.0, 4.0, 4.0, 10.0, 10.0, 11.0, 14.0, 11.0, 8.0, 21.0, 17.0, 14.0, 18.0, 27.0, 32.0, 25.0, 33.0, 37.0, 39.0, 44.0, 24.0, 45.0, 1065.0, 34.0, 50.0, 35.0, 30.0, 46.0, 35.0, 36.0, 39.0, 26.0, 16.0, 24.0, 25.0, 18.0, 17.0, 9.0, 13.0, 12.0, 17.0, 11.0, 3.0, 4.0, 4.0, 2.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-5.1171875, -4.95562744140625, -4.7940673828125, -4.63250732421875, -4.470947265625, -4.30938720703125, -4.1478271484375, -3.98626708984375, -3.82470703125, -3.66314697265625, -3.5015869140625, -3.34002685546875, -3.178466796875, -3.01690673828125, -2.8553466796875, -2.69378662109375, -2.5322265625, -2.37066650390625, -2.2091064453125, -2.04754638671875, -1.885986328125, -1.72442626953125, -1.5628662109375, -1.40130615234375, -1.23974609375, -1.07818603515625, -0.9166259765625, -0.75506591796875, -0.593505859375, -0.43194580078125, -0.2703857421875, -0.10882568359375, 0.052734375, 0.21429443359375, 0.3758544921875, 0.53741455078125, 0.698974609375, 0.86053466796875, 1.0220947265625, 1.18365478515625, 1.34521484375, 1.50677490234375, 1.6683349609375, 1.82989501953125, 1.991455078125, 2.15301513671875, 2.3145751953125, 2.47613525390625, 2.6376953125, 2.79925537109375, 2.9608154296875, 3.12237548828125, 3.283935546875, 3.44549560546875, 3.6070556640625, 3.76861572265625, 3.93017578125, 4.09173583984375, 4.2532958984375, 4.41485595703125, 4.576416015625, 4.73797607421875, 4.8995361328125, 5.06109619140625, 5.22265625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 2.0, 4.0, 8.0, 4.0, 7.0, 19.0, 23.0, 28.0, 30.0, 59.0, 85.0, 129.0, 173.0, 259.0, 325.0, 486.0, 637.0, 1030.0, 1457.0, 1952.0, 2910.0, 4259.0, 6057.0, 8852.0, 12904.0, 19820.0, 30712.0, 48331.0, 79537.0, 146410.0, 1345016.0, 156692.0, 83578.0, 50160.0, 31735.0, 20445.0, 13340.0, 9117.0, 6265.0, 4345.0, 2961.0, 2062.0, 1524.0, 996.0, 691.0, 505.0, 332.0, 254.0, 189.0, 130.0, 74.0, 77.0, 30.0, 29.0, 30.0, 24.0, 8.0, 9.0, 6.0, 4.0, 3.0, 4.0, 4.0], "bins": [-1.4248046875, -1.379638671875, -1.33447265625, -1.289306640625, -1.244140625, -1.198974609375, -1.15380859375, -1.108642578125, -1.0634765625, -1.018310546875, -0.97314453125, -0.927978515625, -0.8828125, -0.837646484375, -0.79248046875, -0.747314453125, -0.7021484375, -0.656982421875, -0.61181640625, -0.566650390625, -0.521484375, -0.476318359375, -0.43115234375, -0.385986328125, -0.3408203125, -0.295654296875, -0.25048828125, -0.205322265625, -0.16015625, -0.114990234375, -0.06982421875, -0.024658203125, 0.0205078125, 0.065673828125, 0.11083984375, 0.156005859375, 0.201171875, 0.246337890625, 0.29150390625, 0.336669921875, 0.3818359375, 0.427001953125, 0.47216796875, 0.517333984375, 0.5625, 0.607666015625, 0.65283203125, 0.697998046875, 0.7431640625, 0.788330078125, 0.83349609375, 0.878662109375, 0.923828125, 0.968994140625, 1.01416015625, 1.059326171875, 1.1044921875, 1.149658203125, 1.19482421875, 1.239990234375, 1.28515625, 1.330322265625, 1.37548828125, 1.420654296875, 1.4658203125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 1.0, 2.0, 1.0, 4.0, 10.0, 7.0, 9.0, 5.0, 25.0, 8.0, 24.0, 26.0, 27.0, 37.0, 51.0, 64.0, 63.0, 62.0, 71.0, 73.0, 68.0, 69.0, 58.0, 41.0, 40.0, 24.0, 20.0, 24.0, 14.0, 17.0, 15.0, 6.0, 15.0, 7.0, 4.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011377334594726562, -0.001103624701499939, -0.0010695159435272217, -0.0010354071855545044, -0.0010012984275817871, -0.0009671896696090698, -0.0009330809116363525, -0.0008989721536636353, -0.000864863395690918, -0.0008307546377182007, -0.0007966458797454834, -0.0007625371217727661, -0.0007284283638000488, -0.0006943196058273315, -0.0006602108478546143, -0.000626102089881897, -0.0005919933319091797, -0.0005578845739364624, -0.0005237758159637451, -0.0004896670579910278, -0.00045555830001831055, -0.00042144954204559326, -0.000387340784072876, -0.0003532320261001587, -0.0003191232681274414, -0.0002850145101547241, -0.00025090575218200684, -0.00021679699420928955, -0.00018268823623657227, -0.00014857947826385498, -0.0001144707202911377, -8.036196231842041e-05, -4.6253204345703125e-05, -1.214444637298584e-05, 2.1964311599731445e-05, 5.607306957244873e-05, 9.018182754516602e-05, 0.0001242905855178833, 0.00015839934349060059, 0.00019250810146331787, 0.00022661685943603516, 0.00026072561740875244, 0.0002948343753814697, 0.000328943133354187, 0.0003630518913269043, 0.0003971606492996216, 0.00043126940727233887, 0.00046537816524505615, 0.0004994869232177734, 0.0005335956811904907, 0.000567704439163208, 0.0006018131971359253, 0.0006359219551086426, 0.0006700307130813599, 0.0007041394710540771, 0.0007382482290267944, 0.0007723569869995117, 0.000806465744972229, 0.0008405745029449463, 0.0008746832609176636, 0.0009087920188903809, 0.0009429007768630981, 0.0009770095348358154, 0.0010111182928085327, 0.00104522705078125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 8.0, 10.0, 3.0, 21.0, 18.0, 13.0, 27.0, 33.0, 41.0, 57.0, 81.0, 85.0, 167.0, 307.0, 621.0, 2906.0, 1033888.0, 8387.0, 772.0, 373.0, 206.0, 137.0, 94.0, 50.0, 60.0, 37.0, 35.0, 19.0, 25.0, 13.0, 16.0, 6.0, 10.0, 6.0, 4.0, 0.0, 5.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0204925537109375, -0.019800186157226562, -0.019107818603515625, -0.018415451049804688, -0.01772308349609375, -0.017030715942382812, -0.016338348388671875, -0.015645980834960938, -0.01495361328125, -0.014261245727539062, -0.013568878173828125, -0.012876510620117188, -0.01218414306640625, -0.011491775512695312, -0.010799407958984375, -0.010107040405273438, -0.0094146728515625, -0.008722305297851562, -0.008029937744140625, -0.0073375701904296875, -0.00664520263671875, -0.0059528350830078125, -0.005260467529296875, -0.0045680999755859375, -0.003875732421875, -0.0031833648681640625, -0.002490997314453125, -0.0017986297607421875, -0.00110626220703125, -0.0004138946533203125, 0.000278472900390625, 0.0009708404541015625, 0.0016632080078125, 0.0023555755615234375, 0.003047943115234375, 0.0037403106689453125, 0.00443267822265625, 0.0051250457763671875, 0.005817413330078125, 0.0065097808837890625, 0.0072021484375, 0.007894515991210938, 0.008586883544921875, 0.009279251098632812, 0.00997161865234375, 0.010663986206054688, 0.011356353759765625, 0.012048721313476562, 0.0127410888671875, 0.013433456420898438, 0.014125823974609375, 0.014818191528320312, 0.01551055908203125, 0.016202926635742188, 0.016895294189453125, 0.017587661743164062, 0.018280029296875, 0.018972396850585938, 0.019664764404296875, 0.020357131958007812, 0.02104949951171875, 0.021741867065429688, 0.022434234619140625, 0.023126602172851562, 0.0238189697265625]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 118.0, 613.0, 266.0, 15.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002635367913171649, -0.0025401597376912832, -0.0024449515622109175, -0.0023497433867305517, -0.0022545354440808296, -0.002159327268600464, -0.002064119093120098, -0.0019689109176397324, -0.0018737027421593666, -0.0017784945666790009, -0.001683286391198635, -0.0015880783321335912, -0.0014928701566532254, -0.0013976619811728597, -0.0013024539221078157, -0.00120724574662745, -0.0011120375711470842, -0.0010168293956667185, -0.0009216212783940136, -0.0008264131611213088, -0.000731204985640943, -0.0006359968101605773, -0.0005407886928878725, -0.0004455805756151676, -0.00035037240013480186, -0.00025516425375826657, -0.00015995610738173127, -6.474796100519598e-05, 3.046018537133932e-05, 0.00012566833174787462, 0.00022087647812440991, 0.00031608459539711475, 0.00041129253804683685, 0.0005065007135272026, 0.0006017088307999074, 0.0006969169480726123, 0.000792125123552978, 0.0008873332990333438, 0.0009825413580983877, 0.0010777495335787535, 0.0011729577090591192, 0.001268165884539485, 0.0013633740600198507, 0.0014585821190848947, 0.0015537902945652604, 0.0016489984700456262, 0.00174420652911067, 0.0018394147045910358, 0.0019346228800714016, 0.0020298310555517673, 0.002125039231032133, 0.002220247406512499, 0.0023154555819928646, 0.0024106635246425867, 0.0025058717001229525, 0.002601079875603318, 0.002696288051083684, 0.0027914962265640497, 0.0028867044020444155, 0.0029819125775247812, 0.0030771205201745033, 0.003172328695654869, 0.003267536871135235, 0.0033627450466156006, 0.0034579532220959663]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 7.0, 10.0, 10.0, 7.0, 26.0, 22.0, 17.0, 21.0, 23.0, 31.0, 34.0, 39.0, 38.0, 41.0, 43.0, 38.0, 49.0, 52.0, 38.0, 48.0, 39.0, 41.0, 35.0, 40.0, 35.0, 33.0, 28.0, 30.0, 25.0, 25.0, 16.0, 21.0, 9.0, 6.0, 7.0, 10.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005216002464294434, -0.0005033900961279869, -0.00048517994582653046, -0.000466969795525074, -0.00044875964522361755, -0.0004305494949221611, -0.00041233934462070465, -0.0003941291943192482, -0.00037591904401779175, -0.0003577088937163353, -0.00033949874341487885, -0.0003212885931134224, -0.00030307844281196594, -0.0002848682925105095, -0.00026665814220905304, -0.0002484479919075966, -0.00023023784160614014, -0.00021202769130468369, -0.00019381754100322723, -0.00017560739070177078, -0.00015739724040031433, -0.00013918709009885788, -0.00012097693979740143, -0.00010276678949594498, -8.455663919448853e-05, -6.634648889303207e-05, -4.813633859157562e-05, -2.992618829011917e-05, -1.171603798866272e-05, 6.494112312793732e-06, 2.4704262614250183e-05, 4.2914412915706635e-05, 6.112456321716309e-05, 7.933471351861954e-05, 9.754486382007599e-05, 0.00011575501412153244, 0.0001339651644229889, 0.00015217531472444534, 0.0001703854650259018, 0.00018859561532735825, 0.0002068057656288147, 0.00022501591593027115, 0.0002432260662317276, 0.00026143621653318405, 0.0002796463668346405, 0.00029785651713609695, 0.0003160666674375534, 0.00033427681773900986, 0.0003524869680404663, 0.00037069711834192276, 0.0003889072686433792, 0.00040711741894483566, 0.0004253275692462921, 0.00044353771954774857, 0.000461747869849205, 0.00047995802015066147, 0.0004981681704521179, 0.0005163783207535744, 0.0005345884710550308, 0.0005527986213564873, 0.0005710087716579437, 0.0005892189219594002, 0.0006074290722608566, 0.0006256392225623131, 0.0006438493728637695]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 3.0, 3.0, 5.0, 5.0, 10.0, 13.0, 11.0, 17.0, 13.0, 17.0, 15.0, 22.0, 27.0, 22.0, 31.0, 31.0, 29.0, 34.0, 43.0, 46.0, 35.0, 39.0, 43.0, 31.0, 46.0, 35.0, 43.0, 40.0, 35.0, 33.0, 26.0, 25.0, 31.0, 18.0, 18.0, 17.0, 13.0, 18.0, 10.0, 9.0, 8.0, 8.0, 8.0, 3.0, 7.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6953125, -8.43634033203125, -8.1773681640625, -7.91839599609375, -7.659423828125, -7.40045166015625, -7.1414794921875, -6.88250732421875, -6.62353515625, -6.36456298828125, -6.1055908203125, -5.84661865234375, -5.587646484375, -5.32867431640625, -5.0697021484375, -4.81072998046875, -4.5517578125, -4.29278564453125, -4.0338134765625, -3.77484130859375, -3.515869140625, -3.25689697265625, -2.9979248046875, -2.73895263671875, -2.47998046875, -2.22100830078125, -1.9620361328125, -1.70306396484375, -1.444091796875, -1.18511962890625, -0.9261474609375, -0.66717529296875, -0.408203125, -0.14923095703125, 0.1097412109375, 0.36871337890625, 0.627685546875, 0.88665771484375, 1.1456298828125, 1.40460205078125, 1.66357421875, 1.92254638671875, 2.1815185546875, 2.44049072265625, 2.699462890625, 2.95843505859375, 3.2174072265625, 3.47637939453125, 3.7353515625, 3.99432373046875, 4.2532958984375, 4.51226806640625, 4.771240234375, 5.03021240234375, 5.2891845703125, 5.54815673828125, 5.80712890625, 6.06610107421875, 6.3250732421875, 6.58404541015625, 6.843017578125, 7.10198974609375, 7.3609619140625, 7.61993408203125, 7.87890625]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 2.0, 9.0, 7.0, 7.0, 12.0, 12.0, 25.0, 23.0, 31.0, 44.0, 39.0, 73.0, 77.0, 136.0, 147.0, 214.0, 364.0, 630.0, 1190.0, 2478.0, 5750.0, 14689.0, 44537.0, 152840.0, 477394.0, 243340.0, 67909.0, 21646.0, 7922.0, 3320.0, 1533.0, 771.0, 398.0, 270.0, 187.0, 127.0, 89.0, 80.0, 44.0, 46.0, 38.0, 23.0, 31.0, 18.0, 9.0, 6.0, 12.0, 1.0, 8.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.3671875, -11.0296630859375, -10.692138671875, -10.3546142578125, -10.01708984375, -9.6795654296875, -9.342041015625, -9.0045166015625, -8.6669921875, -8.3294677734375, -7.991943359375, -7.6544189453125, -7.31689453125, -6.9793701171875, -6.641845703125, -6.3043212890625, -5.966796875, -5.6292724609375, -5.291748046875, -4.9542236328125, -4.61669921875, -4.2791748046875, -3.941650390625, -3.6041259765625, -3.2666015625, -2.9290771484375, -2.591552734375, -2.2540283203125, -1.91650390625, -1.5789794921875, -1.241455078125, -0.9039306640625, -0.56640625, -0.2288818359375, 0.108642578125, 0.4461669921875, 0.78369140625, 1.1212158203125, 1.458740234375, 1.7962646484375, 2.1337890625, 2.4713134765625, 2.808837890625, 3.1463623046875, 3.48388671875, 3.8214111328125, 4.158935546875, 4.4964599609375, 4.833984375, 5.1715087890625, 5.509033203125, 5.8465576171875, 6.18408203125, 6.5216064453125, 6.859130859375, 7.1966552734375, 7.5341796875, 7.8717041015625, 8.209228515625, 8.5467529296875, 8.88427734375, 9.2218017578125, 9.559326171875, 9.8968505859375, 10.234375]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 6.0, 4.0, 3.0, 7.0, 5.0, 5.0, 10.0, 16.0, 20.0, 15.0, 25.0, 36.0, 34.0, 43.0, 44.0, 59.0, 57.0, 68.0, 118.0, 236.0, 1589.0, 174.0, 82.0, 81.0, 51.0, 44.0, 38.0, 37.0, 29.0, 25.0, 20.0, 12.0, 9.0, 18.0, 9.0, 6.0, 10.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.09375, -27.249755859375, -26.40576171875, -25.561767578125, -24.7177734375, -23.873779296875, -23.02978515625, -22.185791015625, -21.341796875, -20.497802734375, -19.65380859375, -18.809814453125, -17.9658203125, -17.121826171875, -16.27783203125, -15.433837890625, -14.58984375, -13.745849609375, -12.90185546875, -12.057861328125, -11.2138671875, -10.369873046875, -9.52587890625, -8.681884765625, -7.837890625, -6.993896484375, -6.14990234375, -5.305908203125, -4.4619140625, -3.617919921875, -2.77392578125, -1.929931640625, -1.0859375, -0.241943359375, 0.60205078125, 1.446044921875, 2.2900390625, 3.134033203125, 3.97802734375, 4.822021484375, 5.666015625, 6.510009765625, 7.35400390625, 8.197998046875, 9.0419921875, 9.885986328125, 10.72998046875, 11.573974609375, 12.41796875, 13.261962890625, 14.10595703125, 14.949951171875, 15.7939453125, 16.637939453125, 17.48193359375, 18.325927734375, 19.169921875, 20.013916015625, 20.85791015625, 21.701904296875, 22.5458984375, 23.389892578125, 24.23388671875, 25.077880859375, 25.921875]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [5.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 10.0, 6.0, 9.0, 17.0, 17.0, 19.0, 20.0, 22.0, 32.0, 39.0, 61.0, 73.0, 89.0, 151.0, 209.0, 322.0, 484.0, 1298.0, 7637.0, 144283.0, 2860037.0, 121187.0, 6878.0, 1209.0, 489.0, 266.0, 195.0, 141.0, 122.0, 90.0, 60.0, 50.0, 41.0, 34.0, 18.0, 15.0, 13.0, 10.0, 8.0, 11.0, 9.0, 5.0, 4.0, 1.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-27.78125, -26.8056640625, -25.830078125, -24.8544921875, -23.87890625, -22.9033203125, -21.927734375, -20.9521484375, -19.9765625, -19.0009765625, -18.025390625, -17.0498046875, -16.07421875, -15.0986328125, -14.123046875, -13.1474609375, -12.171875, -11.1962890625, -10.220703125, -9.2451171875, -8.26953125, -7.2939453125, -6.318359375, -5.3427734375, -4.3671875, -3.3916015625, -2.416015625, -1.4404296875, -0.46484375, 0.5107421875, 1.486328125, 2.4619140625, 3.4375, 4.4130859375, 5.388671875, 6.3642578125, 7.33984375, 8.3154296875, 9.291015625, 10.2666015625, 11.2421875, 12.2177734375, 13.193359375, 14.1689453125, 15.14453125, 16.1201171875, 17.095703125, 18.0712890625, 19.046875, 20.0224609375, 20.998046875, 21.9736328125, 22.94921875, 23.9248046875, 24.900390625, 25.8759765625, 26.8515625, 27.8271484375, 28.802734375, 29.7783203125, 30.75390625, 31.7294921875, 32.705078125, 33.6806640625, 34.65625]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 23.0, 629.0, 361.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-144.31056213378906, -137.38217163085938, -130.4537811279297, -123.52539825439453, -116.59700775146484, -109.66861724853516, -102.740234375, -95.81184387207031, -88.88345336914062, -81.95506286621094, -75.02667236328125, -68.0982894897461, -61.169898986816406, -54.24150848388672, -47.3131217956543, -40.384735107421875, -33.45634460449219, -26.527956008911133, -19.599567413330078, -12.671178817749023, -5.742790222167969, 1.1856002807617188, 8.11398696899414, 15.042373657226562, 21.97076416015625, 28.899152755737305, 35.82754135131836, 42.75592803955078, 49.68431854248047, 56.612709045410156, 63.54109573364258, 70.469482421875, 77.39785766601562, 84.32624816894531, 91.254638671875, 98.18302154541016, 105.11141204833984, 112.03980255126953, 118.96818542480469, 125.89657592773438, 132.82496643066406, 139.75335693359375, 146.68174743652344, 153.61013793945312, 160.53851318359375, 167.4669189453125, 174.39529418945312, 181.3236846923828, 188.2520751953125, 195.1804656982422, 202.10885620117188, 209.03724670410156, 215.96563720703125, 222.89401245117188, 229.82240295410156, 236.75079345703125, 243.67918395996094, 250.60757446289062, 257.53594970703125, 264.46435546875, 271.3927307128906, 278.3211364746094, 285.24951171875, 292.17791748046875, 299.1062927246094]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 5.0, 4.0, 10.0, 7.0, 11.0, 11.0, 7.0, 19.0, 19.0, 24.0, 15.0, 31.0, 22.0, 32.0, 29.0, 30.0, 36.0, 42.0, 35.0, 33.0, 43.0, 46.0, 52.0, 43.0, 56.0, 42.0, 37.0, 42.0, 30.0, 29.0, 14.0, 20.0, 20.0, 19.0, 14.0, 11.0, 18.0, 14.0, 6.0, 8.0, 8.0, 2.0, 3.0, 5.0, 0.0, 3.0, 1.0, 1.0, 3.0], "bins": [-62.021888732910156, -60.27645492553711, -58.5310173034668, -56.78558349609375, -55.0401496887207, -53.294715881347656, -51.549278259277344, -49.8038444519043, -48.05841064453125, -46.3129768371582, -44.56753921508789, -42.822105407714844, -41.0766716003418, -39.33123779296875, -37.58580017089844, -35.84036636352539, -34.09492874145508, -32.34949493408203, -30.60405921936035, -28.858623504638672, -27.113189697265625, -25.367753982543945, -23.622318267822266, -21.87688446044922, -20.13144874572754, -18.38601303100586, -16.640579223632812, -14.895143508911133, -13.14970874786377, -11.404273986816406, -9.658838272094727, -7.913403511047363, -6.16796875, -4.422533988952637, -2.6770987510681152, -0.9316635131835938, 0.8137712478637695, 2.559206008911133, 4.3046417236328125, 6.050076484680176, 7.795511245727539, 9.540946006774902, 11.286380767822266, 13.031816482543945, 14.777251243591309, 16.522686004638672, 18.26812171936035, 20.01355743408203, 21.758991241455078, 23.504426956176758, 25.249860763549805, 26.995296478271484, 28.74073028564453, 30.48616600036621, 32.23160171508789, 33.97703552246094, 35.72247314453125, 37.4679069519043, 39.21334457397461, 40.958778381347656, 42.7042121887207, 44.44964599609375, 46.19508361816406, 47.94051742553711, 49.685951232910156]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 3.0, 4.0, 6.0, 6.0, 8.0, 12.0, 10.0, 18.0, 21.0, 19.0, 16.0, 22.0, 30.0, 33.0, 25.0, 29.0, 42.0, 35.0, 34.0, 39.0, 40.0, 47.0, 38.0, 44.0, 40.0, 34.0, 36.0, 42.0, 39.0, 27.0, 34.0, 26.0, 18.0, 14.0, 19.0, 23.0, 13.0, 7.0, 13.0, 9.0, 9.0, 5.0, 4.0, 7.0, 4.0, 0.0, 3.0, 1.0, 3.0], "bins": [-10.046875, -9.775146484375, -9.50341796875, -9.231689453125, -8.9599609375, -8.688232421875, -8.41650390625, -8.144775390625, -7.873046875, -7.601318359375, -7.32958984375, -7.057861328125, -6.7861328125, -6.514404296875, -6.24267578125, -5.970947265625, -5.69921875, -5.427490234375, -5.15576171875, -4.884033203125, -4.6123046875, -4.340576171875, -4.06884765625, -3.797119140625, -3.525390625, -3.253662109375, -2.98193359375, -2.710205078125, -2.4384765625, -2.166748046875, -1.89501953125, -1.623291015625, -1.3515625, -1.079833984375, -0.80810546875, -0.536376953125, -0.2646484375, 0.007080078125, 0.27880859375, 0.550537109375, 0.822265625, 1.093994140625, 1.36572265625, 1.637451171875, 1.9091796875, 2.180908203125, 2.45263671875, 2.724365234375, 2.99609375, 3.267822265625, 3.53955078125, 3.811279296875, 4.0830078125, 4.354736328125, 4.62646484375, 4.898193359375, 5.169921875, 5.441650390625, 5.71337890625, 5.985107421875, 6.2568359375, 6.528564453125, 6.80029296875, 7.072021484375, 7.34375]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 6.0, 5.0, 5.0, 6.0, 10.0, 11.0, 9.0, 15.0, 16.0, 24.0, 26.0, 27.0, 31.0, 47.0, 49.0, 97.0, 233.0, 782.0, 4521.0, 237258.0, 3820295.0, 125731.0, 3790.0, 686.0, 221.0, 102.0, 65.0, 37.0, 27.0, 31.0, 22.0, 24.0, 12.0, 11.0, 12.0, 11.0, 10.0, 8.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.625, -32.44287109375, -31.2607421875, -30.07861328125, -28.896484375, -27.71435546875, -26.5322265625, -25.35009765625, -24.16796875, -22.98583984375, -21.8037109375, -20.62158203125, -19.439453125, -18.25732421875, -17.0751953125, -15.89306640625, -14.7109375, -13.52880859375, -12.3466796875, -11.16455078125, -9.982421875, -8.80029296875, -7.6181640625, -6.43603515625, -5.25390625, -4.07177734375, -2.8896484375, -1.70751953125, -0.525390625, 0.65673828125, 1.8388671875, 3.02099609375, 4.203125, 5.38525390625, 6.5673828125, 7.74951171875, 8.931640625, 10.11376953125, 11.2958984375, 12.47802734375, 13.66015625, 14.84228515625, 16.0244140625, 17.20654296875, 18.388671875, 19.57080078125, 20.7529296875, 21.93505859375, 23.1171875, 24.29931640625, 25.4814453125, 26.66357421875, 27.845703125, 29.02783203125, 30.2099609375, 31.39208984375, 32.57421875, 33.75634765625, 34.9384765625, 36.12060546875, 37.302734375, 38.48486328125, 39.6669921875, 40.84912109375, 42.03125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 8.0, 6.0, 12.0, 3.0, 9.0, 19.0, 22.0, 33.0, 44.0, 50.0, 84.0, 116.0, 181.0, 259.0, 349.0, 436.0, 520.0, 519.0, 421.0, 328.0, 210.0, 140.0, 105.0, 51.0, 40.0, 28.0, 21.0, 16.0, 15.0, 8.0, 4.0, 7.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8203125, -12.416259765625, -12.01220703125, -11.608154296875, -11.2041015625, -10.800048828125, -10.39599609375, -9.991943359375, -9.587890625, -9.183837890625, -8.77978515625, -8.375732421875, -7.9716796875, -7.567626953125, -7.16357421875, -6.759521484375, -6.35546875, -5.951416015625, -5.54736328125, -5.143310546875, -4.7392578125, -4.335205078125, -3.93115234375, -3.527099609375, -3.123046875, -2.718994140625, -2.31494140625, -1.910888671875, -1.5068359375, -1.102783203125, -0.69873046875, -0.294677734375, 0.109375, 0.513427734375, 0.91748046875, 1.321533203125, 1.7255859375, 2.129638671875, 2.53369140625, 2.937744140625, 3.341796875, 3.745849609375, 4.14990234375, 4.553955078125, 4.9580078125, 5.362060546875, 5.76611328125, 6.170166015625, 6.57421875, 6.978271484375, 7.38232421875, 7.786376953125, 8.1904296875, 8.594482421875, 8.99853515625, 9.402587890625, 9.806640625, 10.210693359375, 10.61474609375, 11.018798828125, 11.4228515625, 11.826904296875, 12.23095703125, 12.635009765625, 13.0390625]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 10.0, 9.0, 13.0, 12.0, 20.0, 19.0, 30.0, 61.0, 93.0, 186.0, 395.0, 1083.0, 6744.0, 188404.0, 3888790.0, 101926.0, 4746.0, 972.0, 340.0, 166.0, 82.0, 51.0, 45.0, 25.0, 19.0, 16.0, 8.0, 9.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.6875, -36.36181640625, -35.0361328125, -33.71044921875, -32.384765625, -31.05908203125, -29.7333984375, -28.40771484375, -27.08203125, -25.75634765625, -24.4306640625, -23.10498046875, -21.779296875, -20.45361328125, -19.1279296875, -17.80224609375, -16.4765625, -15.15087890625, -13.8251953125, -12.49951171875, -11.173828125, -9.84814453125, -8.5224609375, -7.19677734375, -5.87109375, -4.54541015625, -3.2197265625, -1.89404296875, -0.568359375, 0.75732421875, 2.0830078125, 3.40869140625, 4.734375, 6.06005859375, 7.3857421875, 8.71142578125, 10.037109375, 11.36279296875, 12.6884765625, 14.01416015625, 15.33984375, 16.66552734375, 17.9912109375, 19.31689453125, 20.642578125, 21.96826171875, 23.2939453125, 24.61962890625, 25.9453125, 27.27099609375, 28.5966796875, 29.92236328125, 31.248046875, 32.57373046875, 33.8994140625, 35.22509765625, 36.55078125, 37.87646484375, 39.2021484375, 40.52783203125, 41.853515625, 43.17919921875, 44.5048828125, 45.83056640625, 47.15625]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 31.0, 50.0, 140.0, 184.0, 220.0, 199.0, 100.0, 45.0, 32.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.75555419921875, -131.15850830078125, -128.5614471435547, -125.96440124511719, -123.36734771728516, -120.77029418945312, -118.1732406616211, -115.57618713378906, -112.97914123535156, -110.38208770751953, -107.7850341796875, -105.18798828125, -102.59093475341797, -99.99388122558594, -97.3968276977539, -94.79977416992188, -92.20272064208984, -89.60566711425781, -87.00861358642578, -84.41156768798828, -81.81451416015625, -79.21746063232422, -76.62040710449219, -74.02335357666016, -71.42630004882812, -68.8292465209961, -66.23219299316406, -63.6351432800293, -61.03809356689453, -58.4410400390625, -55.84398651123047, -53.24693298339844, -50.649879455566406, -48.052825927734375, -45.45577621459961, -42.85872268676758, -40.26167297363281, -37.66461944580078, -35.06756591796875, -32.47051239013672, -29.873462677001953, -27.276411056518555, -24.679359436035156, -22.082305908203125, -19.485254287719727, -16.888202667236328, -14.291150093078613, -11.694097518920898, -9.0970458984375, -6.499993801116943, -3.9029417037963867, -1.30588960647583, 1.2911624908447266, 3.888214111328125, 6.48526668548584, 9.082319259643555, 11.679370880126953, 14.276422500610352, 16.87347412109375, 19.47052764892578, 22.06757926940918, 24.664630889892578, 27.26168441772461, 29.858736038208008, 32.455787658691406]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0, 5.0, 6.0, 9.0, 6.0, 3.0, 10.0, 8.0, 11.0, 14.0, 18.0, 20.0, 26.0, 17.0, 22.0, 23.0, 27.0, 23.0, 32.0, 31.0, 26.0, 46.0, 39.0, 38.0, 27.0, 30.0, 29.0, 39.0, 31.0, 49.0, 38.0, 40.0, 35.0, 26.0, 26.0, 26.0, 17.0, 17.0, 21.0, 14.0, 15.0, 8.0, 5.0, 13.0, 7.0, 5.0, 3.0, 3.0, 4.0, 11.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-36.50335693359375, -35.334442138671875, -34.165523529052734, -32.99660873413086, -31.82769203186035, -30.658775329589844, -29.48986053466797, -28.32094383239746, -27.152027130126953, -25.983110427856445, -24.814193725585938, -23.645278930664062, -22.476362228393555, -21.307445526123047, -20.138530731201172, -18.969614028930664, -17.800697326660156, -16.63178062438965, -15.462864875793457, -14.293949127197266, -13.125032424926758, -11.95611572265625, -10.787199974060059, -9.618284225463867, -8.44936752319336, -7.28045129776001, -6.11153507232666, -4.9426188468933105, -3.773702621459961, -2.6047863960266113, -1.4358701705932617, -0.2669544219970703, 0.9019622802734375, 2.070878505706787, 3.2397947311401367, 4.408710956573486, 5.577627182006836, 6.7465434074401855, 7.915459632873535, 9.084375381469727, 10.253292083740234, 11.422208786010742, 12.591124534606934, 13.760040283203125, 14.928956985473633, 16.09787368774414, 17.266788482666016, 18.435705184936523, 19.60462188720703, 20.77353858947754, 21.942455291748047, 23.111370086669922, 24.28028678894043, 25.449203491210938, 26.618118286132812, 27.78703498840332, 28.955951690673828, 30.124868392944336, 31.293785095214844, 32.46269989013672, 33.631614685058594, 34.800533294677734, 35.96944808959961, 37.13836669921875, 38.307281494140625]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 2.0, 3.0, 5.0, 5.0, 4.0, 8.0, 8.0, 14.0, 8.0, 12.0, 7.0, 25.0, 21.0, 24.0, 24.0, 24.0, 32.0, 31.0, 27.0, 28.0, 28.0, 28.0, 33.0, 35.0, 44.0, 50.0, 43.0, 36.0, 32.0, 41.0, 32.0, 28.0, 41.0, 30.0, 23.0, 25.0, 20.0, 18.0, 17.0, 22.0, 14.0, 8.0, 14.0, 5.0, 4.0, 7.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 5.0, 3.0, 0.0, 2.0], "bins": [-8.7421875, -8.4786376953125, -8.215087890625, -7.9515380859375, -7.68798828125, -7.4244384765625, -7.160888671875, -6.8973388671875, -6.6337890625, -6.3702392578125, -6.106689453125, -5.8431396484375, -5.57958984375, -5.3160400390625, -5.052490234375, -4.7889404296875, -4.525390625, -4.2618408203125, -3.998291015625, -3.7347412109375, -3.47119140625, -3.2076416015625, -2.944091796875, -2.6805419921875, -2.4169921875, -2.1534423828125, -1.889892578125, -1.6263427734375, -1.36279296875, -1.0992431640625, -0.835693359375, -0.5721435546875, -0.30859375, -0.0450439453125, 0.218505859375, 0.4820556640625, 0.74560546875, 1.0091552734375, 1.272705078125, 1.5362548828125, 1.7998046875, 2.0633544921875, 2.326904296875, 2.5904541015625, 2.85400390625, 3.1175537109375, 3.381103515625, 3.6446533203125, 3.908203125, 4.1717529296875, 4.435302734375, 4.6988525390625, 4.96240234375, 5.2259521484375, 5.489501953125, 5.7530517578125, 6.0166015625, 6.2801513671875, 6.543701171875, 6.8072509765625, 7.07080078125, 7.3343505859375, 7.597900390625, 7.8614501953125, 8.125]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 6.0, 3.0, 7.0, 4.0, 10.0, 18.0, 17.0, 43.0, 50.0, 62.0, 125.0, 148.0, 279.0, 384.0, 592.0, 903.0, 1250.0, 1977.0, 2970.0, 4397.0, 6740.0, 10368.0, 16272.0, 25756.0, 41279.0, 68042.0, 117342.0, 277145.0, 212393.0, 100414.0, 59295.0, 36372.0, 22446.0, 14328.0, 9332.0, 6011.0, 3830.0, 2663.0, 1744.0, 1227.0, 739.0, 538.0, 364.0, 208.0, 149.0, 107.0, 83.0, 41.0, 24.0, 32.0, 12.0, 9.0, 8.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.7119140625, -1.6564483642578125, -1.600982666015625, -1.5455169677734375, -1.49005126953125, -1.4345855712890625, -1.379119873046875, -1.3236541748046875, -1.2681884765625, -1.2127227783203125, -1.157257080078125, -1.1017913818359375, -1.04632568359375, -0.9908599853515625, -0.935394287109375, -0.8799285888671875, -0.824462890625, -0.7689971923828125, -0.713531494140625, -0.6580657958984375, -0.60260009765625, -0.5471343994140625, -0.491668701171875, -0.4362030029296875, -0.3807373046875, -0.3252716064453125, -0.269805908203125, -0.2143402099609375, -0.15887451171875, -0.1034088134765625, -0.047943115234375, 0.0075225830078125, 0.06298828125, 0.1184539794921875, 0.173919677734375, 0.2293853759765625, 0.28485107421875, 0.3403167724609375, 0.395782470703125, 0.4512481689453125, 0.5067138671875, 0.5621795654296875, 0.617645263671875, 0.6731109619140625, 0.72857666015625, 0.7840423583984375, 0.839508056640625, 0.8949737548828125, 0.950439453125, 1.0059051513671875, 1.061370849609375, 1.1168365478515625, 1.17230224609375, 1.2277679443359375, 1.283233642578125, 1.3386993408203125, 1.3941650390625, 1.4496307373046875, 1.505096435546875, 1.5605621337890625, 1.61602783203125, 1.6714935302734375, 1.726959228515625, 1.7824249267578125, 1.837890625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 5.0, 3.0, 2.0, 4.0, 7.0, 4.0, 10.0, 7.0, 11.0, 6.0, 16.0, 8.0, 14.0, 13.0, 21.0, 25.0, 33.0, 27.0, 27.0, 39.0, 40.0, 37.0, 34.0, 17.0, 42.0, 27.0, 1073.0, 31.0, 41.0, 41.0, 31.0, 42.0, 30.0, 14.0, 27.0, 33.0, 25.0, 18.0, 23.0, 20.0, 20.0, 20.0, 12.0, 9.0, 5.0, 9.0, 6.0, 11.0, 3.0, 5.0, 3.0, 2.0, 0.0, 4.0, 1.0, 2.0], "bins": [-5.77734375, -5.60968017578125, -5.4420166015625, -5.27435302734375, -5.106689453125, -4.93902587890625, -4.7713623046875, -4.60369873046875, -4.43603515625, -4.26837158203125, -4.1007080078125, -3.93304443359375, -3.765380859375, -3.59771728515625, -3.4300537109375, -3.26239013671875, -3.0947265625, -2.92706298828125, -2.7593994140625, -2.59173583984375, -2.424072265625, -2.25640869140625, -2.0887451171875, -1.92108154296875, -1.75341796875, -1.58575439453125, -1.4180908203125, -1.25042724609375, -1.082763671875, -0.91510009765625, -0.7474365234375, -0.57977294921875, -0.412109375, -0.24444580078125, -0.0767822265625, 0.09088134765625, 0.258544921875, 0.42620849609375, 0.5938720703125, 0.76153564453125, 0.92919921875, 1.09686279296875, 1.2645263671875, 1.43218994140625, 1.599853515625, 1.76751708984375, 1.9351806640625, 2.10284423828125, 2.2705078125, 2.43817138671875, 2.6058349609375, 2.77349853515625, 2.941162109375, 3.10882568359375, 3.2764892578125, 3.44415283203125, 3.61181640625, 3.77947998046875, 3.9471435546875, 4.11480712890625, 4.282470703125, 4.45013427734375, 4.6177978515625, 4.78546142578125, 4.953125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 4.0, 4.0, 2.0, 1.0, 11.0, 12.0, 19.0, 24.0, 29.0, 27.0, 74.0, 85.0, 106.0, 169.0, 257.0, 339.0, 491.0, 720.0, 1005.0, 1459.0, 2078.0, 3098.0, 4503.0, 6582.0, 9679.0, 14848.0, 22581.0, 34826.0, 56064.0, 92735.0, 183243.0, 1333897.0, 125936.0, 73152.0, 44949.0, 28218.0, 18219.0, 11960.0, 7945.0, 5420.0, 3717.0, 2662.0, 1809.0, 1281.0, 905.0, 597.0, 411.0, 308.0, 222.0, 133.0, 110.0, 69.0, 56.0, 32.0, 22.0, 15.0, 15.0, 8.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.6201171875, -1.5699005126953125, -1.519683837890625, -1.4694671630859375, -1.41925048828125, -1.3690338134765625, -1.318817138671875, -1.2686004638671875, -1.2183837890625, -1.1681671142578125, -1.117950439453125, -1.0677337646484375, -1.01751708984375, -0.9673004150390625, -0.917083740234375, -0.8668670654296875, -0.816650390625, -0.7664337158203125, -0.716217041015625, -0.6660003662109375, -0.61578369140625, -0.5655670166015625, -0.515350341796875, -0.4651336669921875, -0.4149169921875, -0.3647003173828125, -0.314483642578125, -0.2642669677734375, -0.21405029296875, -0.1638336181640625, -0.113616943359375, -0.0634002685546875, -0.01318359375, 0.0370330810546875, 0.087249755859375, 0.1374664306640625, 0.18768310546875, 0.2378997802734375, 0.288116455078125, 0.3383331298828125, 0.3885498046875, 0.4387664794921875, 0.488983154296875, 0.5391998291015625, 0.58941650390625, 0.6396331787109375, 0.689849853515625, 0.7400665283203125, 0.790283203125, 0.8404998779296875, 0.890716552734375, 0.9409332275390625, 0.99114990234375, 1.0413665771484375, 1.091583251953125, 1.1417999267578125, 1.1920166015625, 1.2422332763671875, 1.292449951171875, 1.3426666259765625, 1.39288330078125, 1.4430999755859375, 1.493316650390625, 1.5435333251953125, 1.59375]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 5.0, 4.0, 3.0, 5.0, 7.0, 11.0, 15.0, 12.0, 11.0, 18.0, 24.0, 33.0, 34.0, 37.0, 55.0, 62.0, 68.0, 54.0, 61.0, 71.0, 57.0, 61.0, 45.0, 44.0, 23.0, 40.0, 20.0, 24.0, 19.0, 14.0, 13.0, 13.0, 6.0, 9.0, 5.0, 1.0, 4.0, 6.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0008502006530761719, -0.0008223056793212891, -0.0007944107055664062, -0.0007665157318115234, -0.0007386207580566406, -0.0007107257843017578, -0.000682830810546875, -0.0006549358367919922, -0.0006270408630371094, -0.0005991458892822266, -0.0005712509155273438, -0.0005433559417724609, -0.0005154609680175781, -0.0004875659942626953, -0.0004596710205078125, -0.0004317760467529297, -0.0004038810729980469, -0.00037598609924316406, -0.00034809112548828125, -0.00032019615173339844, -0.0002923011779785156, -0.0002644062042236328, -0.00023651123046875, -0.0002086162567138672, -0.00018072128295898438, -0.00015282630920410156, -0.00012493133544921875, -9.703636169433594e-05, -6.914138793945312e-05, -4.124641418457031e-05, -1.33514404296875e-05, 1.4543533325195312e-05, 4.2438507080078125e-05, 7.033348083496094e-05, 9.822845458984375e-05, 0.00012612342834472656, 0.00015401840209960938, 0.0001819133758544922, 0.000209808349609375, 0.0002377033233642578, 0.0002655982971191406, 0.00029349327087402344, 0.00032138824462890625, 0.00034928321838378906, 0.0003771781921386719, 0.0004050731658935547, 0.0004329681396484375, 0.0004608631134033203, 0.0004887580871582031, 0.0005166530609130859, 0.0005445480346679688, 0.0005724430084228516, 0.0006003379821777344, 0.0006282329559326172, 0.0006561279296875, 0.0006840229034423828, 0.0007119178771972656, 0.0007398128509521484, 0.0007677078247070312, 0.0007956027984619141, 0.0008234977722167969, 0.0008513927459716797, 0.0008792877197265625, 0.0009071826934814453, 0.0009350776672363281]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 8.0, 6.0, 7.0, 9.0, 11.0, 16.0, 22.0, 10.0, 18.0, 33.0, 35.0, 66.0, 68.0, 87.0, 131.0, 230.0, 459.0, 1039.0, 297016.0, 746871.0, 1171.0, 482.0, 246.0, 148.0, 82.0, 70.0, 42.0, 38.0, 32.0, 26.0, 20.0, 13.0, 7.0, 11.0, 7.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0206146240234375, -0.019990921020507812, -0.019367218017578125, -0.018743515014648438, -0.01811981201171875, -0.017496109008789062, -0.016872406005859375, -0.016248703002929688, -0.015625, -0.015001296997070312, -0.014377593994140625, -0.013753890991210938, -0.01313018798828125, -0.012506484985351562, -0.011882781982421875, -0.011259078979492188, -0.0106353759765625, -0.010011672973632812, -0.009387969970703125, -0.008764266967773438, -0.00814056396484375, -0.0075168609619140625, -0.006893157958984375, -0.0062694549560546875, -0.005645751953125, -0.0050220489501953125, -0.004398345947265625, -0.0037746429443359375, -0.00315093994140625, -0.0025272369384765625, -0.001903533935546875, -0.0012798309326171875, -0.0006561279296875, -3.24249267578125e-05, 0.000591278076171875, 0.0012149810791015625, 0.00183868408203125, 0.0024623870849609375, 0.003086090087890625, 0.0037097930908203125, 0.00433349609375, 0.0049571990966796875, 0.005580902099609375, 0.0062046051025390625, 0.00682830810546875, 0.0074520111083984375, 0.008075714111328125, 0.008699417114257812, 0.0093231201171875, 0.009946823120117188, 0.010570526123046875, 0.011194229125976562, 0.01181793212890625, 0.012441635131835938, 0.013065338134765625, 0.013689041137695312, 0.014312744140625, 0.014936447143554688, 0.015560150146484375, 0.016183853149414062, 0.01680755615234375, 0.017431259155273438, 0.018054962158203125, 0.018678665161132812, 0.0193023681640625]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 49.0, 875.0, 92.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008120983839035034, -0.00796652864664793, -0.007812072988599539, -0.0076576173305511475, -0.007503162138164043, -0.007348706480115652, -0.007194250822067261, -0.007039795629680157, -0.006885339971631765, -0.006730884313583374, -0.00657642912119627, -0.006421973463147879, -0.006267517805099487, -0.006113062612712383, -0.005958606954663992, -0.005804151296615601, -0.0056496961042284966, -0.005495240446180105, -0.005340785253793001, -0.00518632959574461, -0.005031874403357506, -0.0048774187453091145, -0.004722963087260723, -0.004568507894873619, -0.004414052236825228, -0.004259596578776836, -0.004105141386389732, -0.003950685728341341, -0.0037962303031235933, -0.0036417748779058456, -0.0034873192198574543, -0.0033328637946397066, -0.003178408369421959, -0.0030239529442042112, -0.0028694975189864635, -0.002715041860938072, -0.0025605864357203245, -0.002406131010502577, -0.0022516753524541855, -0.002097219927236438, -0.0019427645020186901, -0.0017883090768009424, -0.001633853535167873, -0.0014793979935348034, -0.0013249425683170557, -0.001170487143099308, -0.0010160316014662385, -0.000861576059833169, -0.0007071206346154213, -0.0005526651511900127, -0.0003982096677646041, -0.0002437541843391955, -8.929870091378689e-05, 6.515678251162171e-05, 0.00021961226593703032, 0.00037406780757009983, 0.0005285232327878475, 0.0006829787162132561, 0.0008374341996386647, 0.0009918897412717342, 0.001146345166489482, 0.0013008005917072296, 0.0014552561333402991, 0.0016097116749733686, 0.0017641671001911163]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 7.0, 5.0, 12.0, 12.0, 7.0, 16.0, 15.0, 21.0, 18.0, 26.0, 25.0, 25.0, 39.0, 27.0, 30.0, 24.0, 24.0, 35.0, 32.0, 44.0, 36.0, 30.0, 38.0, 41.0, 45.0, 37.0, 31.0, 31.0, 37.0, 24.0, 31.0, 25.0, 28.0, 14.0, 12.0, 18.0, 13.0, 12.0, 12.0, 11.0, 9.0, 4.0, 3.0, 5.0, 6.0, 5.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0], "bins": [-0.00045377016067504883, -0.0004400312900543213, -0.00042629241943359375, -0.0004125535488128662, -0.00039881467819213867, -0.00038507580757141113, -0.0003713369369506836, -0.00035759806632995605, -0.0003438591957092285, -0.000330120325088501, -0.00031638145446777344, -0.0003026425838470459, -0.00028890371322631836, -0.0002751648426055908, -0.0002614259719848633, -0.00024768710136413574, -0.0002339482307434082, -0.00022020936012268066, -0.00020647048950195312, -0.00019273161888122559, -0.00017899274826049805, -0.0001652538776397705, -0.00015151500701904297, -0.00013777613639831543, -0.0001240372657775879, -0.00011029839515686035, -9.655952453613281e-05, -8.282065391540527e-05, -6.908178329467773e-05, -5.5342912673950195e-05, -4.1604042053222656e-05, -2.7865171432495117e-05, -1.4126300811767578e-05, -3.8743019104003906e-07, 1.33514404296875e-05, 2.709031105041504e-05, 4.082918167114258e-05, 5.456805229187012e-05, 6.830692291259766e-05, 8.20457935333252e-05, 9.578466415405273e-05, 0.00010952353477478027, 0.0001232624053955078, 0.00013700127601623535, 0.0001507401466369629, 0.00016447901725769043, 0.00017821788787841797, 0.0001919567584991455, 0.00020569562911987305, 0.00021943449974060059, 0.00023317337036132812, 0.00024691224098205566, 0.0002606511116027832, 0.00027438998222351074, 0.0002881288528442383, 0.0003018677234649658, 0.00031560659408569336, 0.0003293454647064209, 0.00034308433532714844, 0.000356823205947876, 0.0003705620765686035, 0.00038430094718933105, 0.0003980398178100586, 0.00041177868843078613, 0.00042551755905151367]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 2.0, 3.0, 5.0, 5.0, 4.0, 8.0, 8.0, 14.0, 8.0, 12.0, 7.0, 25.0, 21.0, 24.0, 24.0, 24.0, 32.0, 31.0, 27.0, 28.0, 28.0, 28.0, 33.0, 35.0, 44.0, 50.0, 43.0, 36.0, 32.0, 41.0, 32.0, 28.0, 41.0, 30.0, 23.0, 25.0, 20.0, 18.0, 17.0, 22.0, 14.0, 8.0, 14.0, 5.0, 4.0, 7.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 5.0, 3.0, 0.0, 2.0], "bins": [-8.7421875, -8.4786376953125, -8.215087890625, -7.9515380859375, -7.68798828125, -7.4244384765625, -7.160888671875, -6.8973388671875, -6.6337890625, -6.3702392578125, -6.106689453125, -5.8431396484375, -5.57958984375, -5.3160400390625, -5.052490234375, -4.7889404296875, -4.525390625, -4.2618408203125, -3.998291015625, -3.7347412109375, -3.47119140625, -3.2076416015625, -2.944091796875, -2.6805419921875, -2.4169921875, -2.1534423828125, -1.889892578125, -1.6263427734375, -1.36279296875, -1.0992431640625, -0.835693359375, -0.5721435546875, -0.30859375, -0.0450439453125, 0.218505859375, 0.4820556640625, 0.74560546875, 1.0091552734375, 1.272705078125, 1.5362548828125, 1.7998046875, 2.0633544921875, 2.326904296875, 2.5904541015625, 2.85400390625, 3.1175537109375, 3.381103515625, 3.6446533203125, 3.908203125, 4.1717529296875, 4.435302734375, 4.6988525390625, 4.96240234375, 5.2259521484375, 5.489501953125, 5.7530517578125, 6.0166015625, 6.2801513671875, 6.543701171875, 6.8072509765625, 7.07080078125, 7.3343505859375, 7.597900390625, 7.8614501953125, 8.125]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 6.0, 6.0, 6.0, 11.0, 15.0, 26.0, 24.0, 31.0, 35.0, 65.0, 81.0, 113.0, 145.0, 177.0, 242.0, 382.0, 538.0, 810.0, 1275.0, 2186.0, 4305.0, 10216.0, 29338.0, 97425.0, 318645.0, 389500.0, 129529.0, 38385.0, 12805.0, 5125.0, 2598.0, 1483.0, 908.0, 615.0, 391.0, 300.0, 205.0, 157.0, 113.0, 88.0, 67.0, 50.0, 34.0, 22.0, 21.0, 19.0, 12.0, 10.0, 8.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4921875, -9.1871337890625, -8.882080078125, -8.5770263671875, -8.27197265625, -7.9669189453125, -7.661865234375, -7.3568115234375, -7.0517578125, -6.7467041015625, -6.441650390625, -6.1365966796875, -5.83154296875, -5.5264892578125, -5.221435546875, -4.9163818359375, -4.611328125, -4.3062744140625, -4.001220703125, -3.6961669921875, -3.39111328125, -3.0860595703125, -2.781005859375, -2.4759521484375, -2.1708984375, -1.8658447265625, -1.560791015625, -1.2557373046875, -0.95068359375, -0.6456298828125, -0.340576171875, -0.0355224609375, 0.26953125, 0.5745849609375, 0.879638671875, 1.1846923828125, 1.48974609375, 1.7947998046875, 2.099853515625, 2.4049072265625, 2.7099609375, 3.0150146484375, 3.320068359375, 3.6251220703125, 3.93017578125, 4.2352294921875, 4.540283203125, 4.8453369140625, 5.150390625, 5.4554443359375, 5.760498046875, 6.0655517578125, 6.37060546875, 6.6756591796875, 6.980712890625, 7.2857666015625, 7.5908203125, 7.8958740234375, 8.200927734375, 8.5059814453125, 8.81103515625, 9.1160888671875, 9.421142578125, 9.7261962890625, 10.03125]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 7.0, 7.0, 12.0, 9.0, 15.0, 12.0, 11.0, 20.0, 28.0, 30.0, 36.0, 40.0, 32.0, 43.0, 63.0, 66.0, 132.0, 267.0, 1594.0, 172.0, 81.0, 58.0, 56.0, 48.0, 35.0, 32.0, 32.0, 27.0, 18.0, 19.0, 12.0, 15.0, 11.0, 5.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.453125, -25.57958984375, -24.7060546875, -23.83251953125, -22.958984375, -22.08544921875, -21.2119140625, -20.33837890625, -19.46484375, -18.59130859375, -17.7177734375, -16.84423828125, -15.970703125, -15.09716796875, -14.2236328125, -13.35009765625, -12.4765625, -11.60302734375, -10.7294921875, -9.85595703125, -8.982421875, -8.10888671875, -7.2353515625, -6.36181640625, -5.48828125, -4.61474609375, -3.7412109375, -2.86767578125, -1.994140625, -1.12060546875, -0.2470703125, 0.62646484375, 1.5, 2.37353515625, 3.2470703125, 4.12060546875, 4.994140625, 5.86767578125, 6.7412109375, 7.61474609375, 8.48828125, 9.36181640625, 10.2353515625, 11.10888671875, 11.982421875, 12.85595703125, 13.7294921875, 14.60302734375, 15.4765625, 16.35009765625, 17.2236328125, 18.09716796875, 18.970703125, 19.84423828125, 20.7177734375, 21.59130859375, 22.46484375, 23.33837890625, 24.2119140625, 25.08544921875, 25.958984375, 26.83251953125, 27.7060546875, 28.57958984375, 29.453125]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 8.0, 6.0, 8.0, 21.0, 19.0, 40.0, 41.0, 60.0, 83.0, 116.0, 145.0, 286.0, 435.0, 941.0, 7085.0, 2482733.0, 647532.0, 4136.0, 768.0, 404.0, 239.0, 147.0, 122.0, 91.0, 59.0, 55.0, 27.0, 28.0, 21.0, 12.0, 9.0, 11.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.65625, -46.20849609375, -44.7607421875, -43.31298828125, -41.865234375, -40.41748046875, -38.9697265625, -37.52197265625, -36.07421875, -34.62646484375, -33.1787109375, -31.73095703125, -30.283203125, -28.83544921875, -27.3876953125, -25.93994140625, -24.4921875, -23.04443359375, -21.5966796875, -20.14892578125, -18.701171875, -17.25341796875, -15.8056640625, -14.35791015625, -12.91015625, -11.46240234375, -10.0146484375, -8.56689453125, -7.119140625, -5.67138671875, -4.2236328125, -2.77587890625, -1.328125, 0.11962890625, 1.5673828125, 3.01513671875, 4.462890625, 5.91064453125, 7.3583984375, 8.80615234375, 10.25390625, 11.70166015625, 13.1494140625, 14.59716796875, 16.044921875, 17.49267578125, 18.9404296875, 20.38818359375, 21.8359375, 23.28369140625, 24.7314453125, 26.17919921875, 27.626953125, 29.07470703125, 30.5224609375, 31.97021484375, 33.41796875, 34.86572265625, 36.3134765625, 37.76123046875, 39.208984375, 40.65673828125, 42.1044921875, 43.55224609375, 45.0]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 196.0, 796.0, 21.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-365.01605224609375, -357.7579345703125, -350.4997863769531, -343.2416687011719, -335.9835205078125, -328.72540283203125, -321.4672546386719, -314.2091369628906, -306.95098876953125, -299.69287109375, -292.4347229003906, -285.1766052246094, -277.91845703125, -270.66033935546875, -263.4021911621094, -256.1440734863281, -248.88595581054688, -241.62782287597656, -234.36968994140625, -227.11155700683594, -219.85342407226562, -212.59530639648438, -205.33717346191406, -198.07904052734375, -190.82090759277344, -183.56277465820312, -176.3046417236328, -169.0465087890625, -161.78839111328125, -154.53024291992188, -147.27212524414062, -140.0139923095703, -132.755859375, -125.49772644042969, -118.23959350585938, -110.9814682006836, -103.72333526611328, -96.46520233154297, -89.20707702636719, -81.94894409179688, -74.69081115722656, -67.43267822265625, -60.1745491027832, -52.916419982910156, -45.658287048339844, -38.40015411376953, -31.142024993896484, -23.883895874023438, -16.625762939453125, -9.367631912231445, -2.1095008850097656, 5.148630142211914, 12.406761169433594, 19.664894104003906, 26.923023223876953, 34.18115234375, 41.43928527832031, 48.697418212890625, 55.95554733276367, 63.21367645263672, 70.47180938720703, 77.72994232177734, 84.98806762695312, 92.24620056152344, 99.50433349609375]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 5.0, 7.0, 5.0, 9.0, 7.0, 10.0, 12.0, 20.0, 20.0, 18.0, 26.0, 28.0, 26.0, 26.0, 25.0, 38.0, 42.0, 38.0, 44.0, 51.0, 32.0, 45.0, 42.0, 36.0, 40.0, 39.0, 51.0, 22.0, 27.0, 26.0, 25.0, 26.0, 24.0, 22.0, 20.0, 11.0, 15.0, 12.0, 5.0, 8.0, 4.0, 6.0, 5.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-59.233245849609375, -57.536346435546875, -55.83945083618164, -54.14255142211914, -52.445655822753906, -50.748756408691406, -49.051856994628906, -47.35496139526367, -45.65806198120117, -43.96116256713867, -42.26426696777344, -40.56736755371094, -38.8704719543457, -37.1735725402832, -35.47667694091797, -33.77977752685547, -32.08287811279297, -30.3859806060791, -28.689083099365234, -26.992183685302734, -25.295286178588867, -23.598388671875, -21.901491165161133, -20.204593658447266, -18.50769805908203, -16.810800552368164, -15.11390209197998, -13.417004585266113, -11.72010612487793, -10.023208618164062, -8.326311111450195, -6.629412651062012, -4.932514190673828, -3.2356162071228027, -1.5387184619903564, 0.15817928314208984, 1.8550772666931152, 3.5519752502441406, 5.248872756958008, 6.945771217346191, 8.642668724060059, 10.339566230773926, 12.03646469116211, 13.733362197875977, 15.430259704589844, 17.127159118652344, 18.824054718017578, 20.520954132080078, 22.217851638793945, 23.914749145507812, 25.61164665222168, 27.308544158935547, 29.005443572998047, 30.702341079711914, 32.39923858642578, 34.09613800048828, 35.793033599853516, 37.489933013916016, 39.18682861328125, 40.88372802734375, 42.580623626708984, 44.277523040771484, 45.97441864013672, 47.67131805419922, 49.36821746826172]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 2.0, 8.0, 9.0, 7.0, 7.0, 7.0, 13.0, 15.0, 12.0, 16.0, 37.0, 23.0, 23.0, 27.0, 27.0, 30.0, 35.0, 30.0, 36.0, 41.0, 33.0, 42.0, 42.0, 36.0, 43.0, 40.0, 37.0, 43.0, 39.0, 34.0, 20.0, 28.0, 20.0, 19.0, 26.0, 20.0, 15.0, 13.0, 10.0, 7.0, 7.0, 8.0, 4.0, 3.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0], "bins": [-9.421875, -9.1455078125, -8.869140625, -8.5927734375, -8.31640625, -8.0400390625, -7.763671875, -7.4873046875, -7.2109375, -6.9345703125, -6.658203125, -6.3818359375, -6.10546875, -5.8291015625, -5.552734375, -5.2763671875, -5.0, -4.7236328125, -4.447265625, -4.1708984375, -3.89453125, -3.6181640625, -3.341796875, -3.0654296875, -2.7890625, -2.5126953125, -2.236328125, -1.9599609375, -1.68359375, -1.4072265625, -1.130859375, -0.8544921875, -0.578125, -0.3017578125, -0.025390625, 0.2509765625, 0.52734375, 0.8037109375, 1.080078125, 1.3564453125, 1.6328125, 1.9091796875, 2.185546875, 2.4619140625, 2.73828125, 3.0146484375, 3.291015625, 3.5673828125, 3.84375, 4.1201171875, 4.396484375, 4.6728515625, 4.94921875, 5.2255859375, 5.501953125, 5.7783203125, 6.0546875, 6.3310546875, 6.607421875, 6.8837890625, 7.16015625, 7.4365234375, 7.712890625, 7.9892578125, 8.265625]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 6.0, 5.0, 4.0, 6.0, 6.0, 9.0, 18.0, 10.0, 23.0, 24.0, 37.0, 45.0, 54.0, 73.0, 106.0, 137.0, 210.0, 288.0, 360.0, 576.0, 62473.0, 4127605.0, 688.0, 416.0, 311.0, 192.0, 183.0, 113.0, 64.0, 53.0, 45.0, 38.0, 31.0, 11.0, 13.0, 12.0, 14.0, 8.0, 11.0, 8.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-291.0, -280.99609375, -270.9921875, -260.98828125, -250.984375, -240.98046875, -230.9765625, -220.97265625, -210.96875, -200.96484375, -190.9609375, -180.95703125, -170.953125, -160.94921875, -150.9453125, -140.94140625, -130.9375, -120.93359375, -110.9296875, -100.92578125, -90.921875, -80.91796875, -70.9140625, -60.91015625, -50.90625, -40.90234375, -30.8984375, -20.89453125, -10.890625, -0.88671875, 9.1171875, 19.12109375, 29.125, 39.12890625, 49.1328125, 59.13671875, 69.140625, 79.14453125, 89.1484375, 99.15234375, 109.15625, 119.16015625, 129.1640625, 139.16796875, 149.171875, 159.17578125, 169.1796875, 179.18359375, 189.1875, 199.19140625, 209.1953125, 219.19921875, 229.203125, 239.20703125, 249.2109375, 259.21484375, 269.21875, 279.22265625, 289.2265625, 299.23046875, 309.234375, 319.23828125, 329.2421875, 339.24609375, 349.25]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 7.0, 7.0, 6.0, 12.0, 10.0, 9.0, 21.0, 19.0, 24.0, 38.0, 44.0, 63.0, 80.0, 132.0, 177.0, 268.0, 456.0, 573.0, 652.0, 471.0, 326.0, 196.0, 133.0, 92.0, 61.0, 59.0, 36.0, 32.0, 15.0, 13.0, 8.0, 5.0, 8.0, 3.0, 4.0, 4.0, 5.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.7265625, -13.2703857421875, -12.814208984375, -12.3580322265625, -11.90185546875, -11.4456787109375, -10.989501953125, -10.5333251953125, -10.0771484375, -9.6209716796875, -9.164794921875, -8.7086181640625, -8.25244140625, -7.7962646484375, -7.340087890625, -6.8839111328125, -6.427734375, -5.9715576171875, -5.515380859375, -5.0592041015625, -4.60302734375, -4.1468505859375, -3.690673828125, -3.2344970703125, -2.7783203125, -2.3221435546875, -1.865966796875, -1.4097900390625, -0.95361328125, -0.4974365234375, -0.041259765625, 0.4149169921875, 0.87109375, 1.3272705078125, 1.783447265625, 2.2396240234375, 2.69580078125, 3.1519775390625, 3.608154296875, 4.0643310546875, 4.5205078125, 4.9766845703125, 5.432861328125, 5.8890380859375, 6.34521484375, 6.8013916015625, 7.257568359375, 7.7137451171875, 8.169921875, 8.6260986328125, 9.082275390625, 9.5384521484375, 9.99462890625, 10.4508056640625, 10.906982421875, 11.3631591796875, 11.8193359375, 12.2755126953125, 12.731689453125, 13.1878662109375, 13.64404296875, 14.1002197265625, 14.556396484375, 15.0125732421875, 15.46875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 3.0, 5.0, 5.0, 8.0, 6.0, 8.0, 10.0, 9.0, 10.0, 12.0, 14.0, 25.0, 28.0, 20.0, 27.0, 33.0, 48.0, 45.0, 89.0, 124.0, 352.0, 4052.0, 4172331.0, 16019.0, 441.0, 123.0, 78.0, 56.0, 39.0, 37.0, 38.0, 25.0, 25.0, 22.0, 24.0, 18.0, 16.0, 13.0, 7.0, 11.0, 7.0, 8.0, 3.0, 3.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 3.0], "bins": [-140.5, -136.5546875, -132.609375, -128.6640625, -124.71875, -120.7734375, -116.828125, -112.8828125, -108.9375, -104.9921875, -101.046875, -97.1015625, -93.15625, -89.2109375, -85.265625, -81.3203125, -77.375, -73.4296875, -69.484375, -65.5390625, -61.59375, -57.6484375, -53.703125, -49.7578125, -45.8125, -41.8671875, -37.921875, -33.9765625, -30.03125, -26.0859375, -22.140625, -18.1953125, -14.25, -10.3046875, -6.359375, -2.4140625, 1.53125, 5.4765625, 9.421875, 13.3671875, 17.3125, 21.2578125, 25.203125, 29.1484375, 33.09375, 37.0390625, 40.984375, 44.9296875, 48.875, 52.8203125, 56.765625, 60.7109375, 64.65625, 68.6015625, 72.546875, 76.4921875, 80.4375, 84.3828125, 88.328125, 92.2734375, 96.21875, 100.1640625, 104.109375, 108.0546875, 112.0]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 15.0, 30.0, 55.0, 99.0, 157.0, 208.0, 186.0, 120.0, 92.0, 33.0, 10.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.89528274536133, -37.64990234375, -35.40452575683594, -33.159149169921875, -30.913768768310547, -28.66839027404785, -26.423011779785156, -24.17763328552246, -21.932254791259766, -19.68687629699707, -17.441497802734375, -15.19611930847168, -12.950740814208984, -10.705362319946289, -8.459983825683594, -6.214605331420898, -3.969226837158203, -1.7238483428955078, 0.5215301513671875, 2.766908645629883, 5.012287139892578, 7.257665634155273, 9.503044128417969, 11.748422622680664, 13.99380111694336, 16.239179611206055, 18.48455810546875, 20.729936599731445, 22.97531509399414, 25.220693588256836, 27.46607208251953, 29.711450576782227, 31.956825256347656, 34.20220184326172, 36.44758224487305, 38.692962646484375, 40.93833923339844, 43.1837158203125, 45.42909622192383, 47.674476623535156, 49.91985321044922, 52.16522979736328, 54.41061019897461, 56.65599060058594, 58.9013671875, 61.14674377441406, 63.39212417602539, 65.63750457763672, 67.88288116455078, 70.12825775146484, 72.37364196777344, 74.6190185546875, 76.86439514160156, 79.10977172851562, 81.35514831542969, 83.60053253173828, 85.84590911865234, 88.0912857055664, 90.336669921875, 92.58204650878906, 94.82742309570312, 97.07279968261719, 99.31817626953125, 101.56356048583984, 103.8089370727539]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 5.0, 10.0, 7.0, 7.0, 19.0, 12.0, 20.0, 14.0, 15.0, 23.0, 27.0, 24.0, 23.0, 24.0, 29.0, 36.0, 41.0, 29.0, 43.0, 30.0, 53.0, 35.0, 42.0, 35.0, 40.0, 45.0, 32.0, 31.0, 28.0, 23.0, 37.0, 19.0, 18.0, 17.0, 13.0, 17.0, 11.0, 8.0, 11.0, 14.0, 7.0, 6.0, 5.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-42.0394287109375, -40.67521667480469, -39.31100845336914, -37.946800231933594, -36.58258819580078, -35.21837615966797, -33.85416793823242, -32.489959716796875, -31.125747680664062, -29.761537551879883, -28.397327423095703, -27.033117294311523, -25.668907165527344, -24.304697036743164, -22.940486907958984, -21.576276779174805, -20.212066650390625, -18.847856521606445, -17.483646392822266, -16.119436264038086, -14.755226135253906, -13.391016006469727, -12.026805877685547, -10.662595748901367, -9.298385620117188, -7.934175491333008, -6.569965362548828, -5.205755233764648, -3.8415451049804688, -2.477334976196289, -1.1131248474121094, 0.2510852813720703, 1.61529541015625, 2.9795055389404297, 4.343715667724609, 5.707925796508789, 7.072135925292969, 8.436346054077148, 9.800556182861328, 11.164766311645508, 12.528976440429688, 13.893186569213867, 15.257396697998047, 16.621606826782227, 17.985816955566406, 19.350027084350586, 20.714237213134766, 22.078447341918945, 23.442657470703125, 24.806867599487305, 26.171077728271484, 27.535287857055664, 28.899497985839844, 30.263708114624023, 31.627918243408203, 32.99212646484375, 34.35633850097656, 35.720550537109375, 37.08475875854492, 38.44896697998047, 39.81317901611328, 41.177391052246094, 42.54159927368164, 43.90580749511719, 45.27001953125]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 0.0, 5.0, 3.0, 7.0, 5.0, 11.0, 13.0, 5.0, 18.0, 15.0, 19.0, 22.0, 22.0, 17.0, 41.0, 27.0, 33.0, 35.0, 42.0, 41.0, 49.0, 30.0, 52.0, 39.0, 41.0, 33.0, 32.0, 32.0, 33.0, 27.0, 29.0, 28.0, 28.0, 24.0, 24.0, 22.0, 15.0, 15.0, 17.0, 9.0, 13.0, 11.0, 4.0, 7.0, 3.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-9.25, -8.977783203125, -8.70556640625, -8.433349609375, -8.1611328125, -7.888916015625, -7.61669921875, -7.344482421875, -7.072265625, -6.800048828125, -6.52783203125, -6.255615234375, -5.9833984375, -5.711181640625, -5.43896484375, -5.166748046875, -4.89453125, -4.622314453125, -4.35009765625, -4.077880859375, -3.8056640625, -3.533447265625, -3.26123046875, -2.989013671875, -2.716796875, -2.444580078125, -2.17236328125, -1.900146484375, -1.6279296875, -1.355712890625, -1.08349609375, -0.811279296875, -0.5390625, -0.266845703125, 0.00537109375, 0.277587890625, 0.5498046875, 0.822021484375, 1.09423828125, 1.366455078125, 1.638671875, 1.910888671875, 2.18310546875, 2.455322265625, 2.7275390625, 2.999755859375, 3.27197265625, 3.544189453125, 3.81640625, 4.088623046875, 4.36083984375, 4.633056640625, 4.9052734375, 5.177490234375, 5.44970703125, 5.721923828125, 5.994140625, 6.266357421875, 6.53857421875, 6.810791015625, 7.0830078125, 7.355224609375, 7.62744140625, 7.899658203125, 8.171875]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 2.0, 5.0, 8.0, 6.0, 22.0, 28.0, 32.0, 49.0, 71.0, 127.0, 136.0, 282.0, 338.0, 521.0, 728.0, 987.0, 1518.0, 2063.0, 3061.0, 4370.0, 6371.0, 9218.0, 13797.0, 20289.0, 31156.0, 48451.0, 78556.0, 140871.0, 283941.0, 161213.0, 86254.0, 52098.0, 33011.0, 22100.0, 14468.0, 10080.0, 6934.0, 4830.0, 3296.0, 2272.0, 1531.0, 1078.0, 723.0, 509.0, 333.0, 261.0, 174.0, 127.0, 78.0, 70.0, 41.0, 30.0, 14.0, 14.0, 8.0, 6.0, 9.0, 2.0, 0.0, 2.0], "bins": [-1.5966796875, -1.5476837158203125, -1.498687744140625, -1.4496917724609375, -1.40069580078125, -1.3516998291015625, -1.302703857421875, -1.2537078857421875, -1.2047119140625, -1.1557159423828125, -1.106719970703125, -1.0577239990234375, -1.00872802734375, -0.9597320556640625, -0.910736083984375, -0.8617401123046875, -0.812744140625, -0.7637481689453125, -0.714752197265625, -0.6657562255859375, -0.61676025390625, -0.5677642822265625, -0.518768310546875, -0.4697723388671875, -0.4207763671875, -0.3717803955078125, -0.322784423828125, -0.2737884521484375, -0.22479248046875, -0.1757965087890625, -0.126800537109375, -0.0778045654296875, -0.02880859375, 0.0201873779296875, 0.069183349609375, 0.1181793212890625, 0.16717529296875, 0.2161712646484375, 0.265167236328125, 0.3141632080078125, 0.3631591796875, 0.4121551513671875, 0.461151123046875, 0.5101470947265625, 0.55914306640625, 0.6081390380859375, 0.657135009765625, 0.7061309814453125, 0.755126953125, 0.8041229248046875, 0.853118896484375, 0.9021148681640625, 0.95111083984375, 1.0001068115234375, 1.049102783203125, 1.0980987548828125, 1.1470947265625, 1.1960906982421875, 1.245086669921875, 1.2940826416015625, 1.34307861328125, 1.3920745849609375, 1.441070556640625, 1.4900665283203125, 1.5390625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 8.0, 8.0, 12.0, 11.0, 14.0, 14.0, 13.0, 27.0, 17.0, 21.0, 21.0, 23.0, 27.0, 31.0, 25.0, 26.0, 48.0, 36.0, 27.0, 41.0, 1072.0, 48.0, 41.0, 48.0, 38.0, 34.0, 24.0, 33.0, 35.0, 26.0, 20.0, 23.0, 31.0, 20.0, 12.0, 13.0, 19.0, 17.0, 4.0, 10.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-6.3046875, -6.12396240234375, -5.9432373046875, -5.76251220703125, -5.581787109375, -5.40106201171875, -5.2203369140625, -5.03961181640625, -4.85888671875, -4.67816162109375, -4.4974365234375, -4.31671142578125, -4.135986328125, -3.95526123046875, -3.7745361328125, -3.59381103515625, -3.4130859375, -3.23236083984375, -3.0516357421875, -2.87091064453125, -2.690185546875, -2.50946044921875, -2.3287353515625, -2.14801025390625, -1.96728515625, -1.78656005859375, -1.6058349609375, -1.42510986328125, -1.244384765625, -1.06365966796875, -0.8829345703125, -0.70220947265625, -0.521484375, -0.34075927734375, -0.1600341796875, 0.02069091796875, 0.201416015625, 0.38214111328125, 0.5628662109375, 0.74359130859375, 0.92431640625, 1.10504150390625, 1.2857666015625, 1.46649169921875, 1.647216796875, 1.82794189453125, 2.0086669921875, 2.18939208984375, 2.3701171875, 2.55084228515625, 2.7315673828125, 2.91229248046875, 3.093017578125, 3.27374267578125, 3.4544677734375, 3.63519287109375, 3.81591796875, 3.99664306640625, 4.1773681640625, 4.35809326171875, 4.538818359375, 4.71954345703125, 4.9002685546875, 5.08099365234375, 5.26171875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 4.0, 2.0, 8.0, 4.0, 7.0, 9.0, 21.0, 25.0, 28.0, 64.0, 98.0, 134.0, 198.0, 336.0, 456.0, 640.0, 981.0, 1531.0, 2294.0, 3517.0, 5473.0, 8377.0, 12775.0, 19911.0, 31840.0, 51771.0, 86502.0, 174466.0, 1368454.0, 133039.0, 73051.0, 43996.0, 27223.0, 17442.0, 11194.0, 7421.0, 4715.0, 3143.0, 2011.0, 1334.0, 917.0, 567.0, 407.0, 234.0, 158.0, 117.0, 79.0, 43.0, 43.0, 31.0, 17.0, 14.0, 9.0, 8.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.76171875, -1.707244873046875, -1.65277099609375, -1.598297119140625, -1.5438232421875, -1.489349365234375, -1.43487548828125, -1.380401611328125, -1.325927734375, -1.271453857421875, -1.21697998046875, -1.162506103515625, -1.1080322265625, -1.053558349609375, -0.99908447265625, -0.944610595703125, -0.89013671875, -0.835662841796875, -0.78118896484375, -0.726715087890625, -0.6722412109375, -0.617767333984375, -0.56329345703125, -0.508819580078125, -0.454345703125, -0.399871826171875, -0.34539794921875, -0.290924072265625, -0.2364501953125, -0.181976318359375, -0.12750244140625, -0.073028564453125, -0.0185546875, 0.035919189453125, 0.09039306640625, 0.144866943359375, 0.1993408203125, 0.253814697265625, 0.30828857421875, 0.362762451171875, 0.417236328125, 0.471710205078125, 0.52618408203125, 0.580657958984375, 0.6351318359375, 0.689605712890625, 0.74407958984375, 0.798553466796875, 0.85302734375, 0.907501220703125, 0.96197509765625, 1.016448974609375, 1.0709228515625, 1.125396728515625, 1.17987060546875, 1.234344482421875, 1.288818359375, 1.343292236328125, 1.39776611328125, 1.452239990234375, 1.5067138671875, 1.561187744140625, 1.61566162109375, 1.670135498046875, 1.724609375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 5.0, 7.0, 3.0, 8.0, 7.0, 7.0, 10.0, 11.0, 20.0, 25.0, 16.0, 22.0, 24.0, 20.0, 49.0, 45.0, 44.0, 63.0, 71.0, 64.0, 54.0, 43.0, 51.0, 43.0, 48.0, 36.0, 34.0, 23.0, 20.0, 21.0, 20.0, 23.0, 11.0, 11.0, 9.0, 11.0, 8.0, 5.0, 3.0, 4.0, 1.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0008864402770996094, -0.0008592978119850159, -0.0008321553468704224, -0.0008050128817558289, -0.0007778704166412354, -0.0007507279515266418, -0.0007235854864120483, -0.0006964430212974548, -0.0006693005561828613, -0.0006421580910682678, -0.0006150156259536743, -0.0005878731608390808, -0.0005607306957244873, -0.0005335882306098938, -0.0005064457654953003, -0.0004793033003807068, -0.0004521608352661133, -0.0004250183701515198, -0.00039787590503692627, -0.00037073343992233276, -0.00034359097480773926, -0.00031644850969314575, -0.00028930604457855225, -0.00026216357946395874, -0.00023502111434936523, -0.00020787864923477173, -0.00018073618412017822, -0.00015359371900558472, -0.0001264512538909912, -9.93087887763977e-05, -7.21663236618042e-05, -4.502385854721069e-05, -1.7881393432617188e-05, 9.261071681976318e-06, 3.6403536796569824e-05, 6.354600191116333e-05, 9.068846702575684e-05, 0.00011783093214035034, 0.00014497339725494385, 0.00017211586236953735, 0.00019925832748413086, 0.00022640079259872437, 0.00025354325771331787, 0.0002806857228279114, 0.0003078281879425049, 0.0003349706530570984, 0.0003621131181716919, 0.0003892555832862854, 0.0004163980484008789, 0.0004435405135154724, 0.0004706829786300659, 0.0004978254437446594, 0.0005249679088592529, 0.0005521103739738464, 0.0005792528390884399, 0.0006063953042030334, 0.000633537769317627, 0.0006606802344322205, 0.000687822699546814, 0.0007149651646614075, 0.000742107629776001, 0.0007692500948905945, 0.000796392560005188, 0.0008235350251197815, 0.000850677490234375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 11.0, 12.0, 8.0, 18.0, 22.0, 25.0, 22.0, 32.0, 37.0, 41.0, 57.0, 57.0, 71.0, 123.0, 174.0, 229.0, 323.0, 487.0, 831.0, 8660.0, 1016236.0, 18395.0, 975.0, 490.0, 334.0, 212.0, 167.0, 112.0, 69.0, 58.0, 51.0, 51.0, 32.0, 27.0, 16.0, 19.0, 17.0, 10.0, 14.0, 8.0, 4.0, 6.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.01526641845703125, -0.014797568321228027, -0.014328718185424805, -0.013859868049621582, -0.01339101791381836, -0.012922167778015137, -0.012453317642211914, -0.011984467506408691, -0.011515617370605469, -0.011046767234802246, -0.010577917098999023, -0.0101090669631958, -0.009640216827392578, -0.009171366691589355, -0.008702516555786133, -0.00823366641998291, -0.0077648162841796875, -0.007295966148376465, -0.006827116012573242, -0.0063582658767700195, -0.005889415740966797, -0.005420565605163574, -0.0049517154693603516, -0.004482865333557129, -0.004014015197753906, -0.0035451650619506836, -0.003076314926147461, -0.0026074647903442383, -0.0021386146545410156, -0.001669764518737793, -0.0012009143829345703, -0.0007320642471313477, -0.000263214111328125, 0.00020563602447509766, 0.0006744861602783203, 0.001143336296081543, 0.0016121864318847656, 0.0020810365676879883, 0.002549886703491211, 0.0030187368392944336, 0.0034875869750976562, 0.003956437110900879, 0.0044252872467041016, 0.004894137382507324, 0.005362987518310547, 0.0058318376541137695, 0.006300687789916992, 0.006769537925720215, 0.0072383880615234375, 0.00770723819732666, 0.008176088333129883, 0.008644938468933105, 0.009113788604736328, 0.00958263874053955, 0.010051488876342773, 0.010520339012145996, 0.010989189147949219, 0.011458039283752441, 0.011926889419555664, 0.012395739555358887, 0.01286458969116211, 0.013333439826965332, 0.013802289962768555, 0.014271140098571777, 0.014739990234375]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 24.0, 99.0, 336.0, 347.0, 138.0, 49.0, 12.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007120106020011008, -0.0006650126888416708, -0.0006180147174745798, -0.0005710168043151498, -0.0005240188911557198, -0.00047702097799628973, -0.00043002303573302925, -0.00038302509346976876, -0.00033602718031033874, -0.0002890292671509087, -0.00024203132488764822, -0.00019503339717630297, -0.00014803546946495771, -0.00010103754175361246, -5.40396140422672e-05, -7.04167177900672e-06, 3.995624138042331e-05, 8.695416909176856e-05, 0.00013395209680311382, 0.00018095002451445907, 0.00022794795222580433, 0.00027494586538523436, 0.00032194380764849484, 0.0003689417499117553, 0.00041593966307118535, 0.0004629375762306154, 0.0005099355475977063, 0.0005569334607571363, 0.0006039313739165664, 0.0006509292870759964, 0.0006979272002354264, 0.0007449251716025174, 0.0007919231429696083, 0.0008389210561290383, 0.0008859189692884684, 0.0009329169406555593, 0.0009799147956073284, 0.0010269128251820803, 0.0010739107383415103, 0.0011209086515009403, 0.0011679065646603703, 0.0012149044778198004, 0.0012619023909792304, 0.0013089003041386604, 0.0013558983337134123, 0.0014028962468728423, 0.0014498941600322723, 0.0014968920731917024, 0.0015438899863511324, 0.0015908878995105624, 0.0016378858126699924, 0.0016848837258294225, 0.0017318816389888525, 0.0017788796685636044, 0.0018258775817230344, 0.0018728754948824644, 0.0019198734080418944, 0.0019668713212013245, 0.0020138693507760763, 0.0020608671475201845, 0.0021078651770949364, 0.0021548629738390446, 0.0022018610034137964, 0.0022488590329885483, 0.0022958568297326565]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 5.0, 5.0, 4.0, 1.0, 6.0, 11.0, 12.0, 6.0, 5.0, 9.0, 5.0, 23.0, 19.0, 26.0, 21.0, 27.0, 30.0, 31.0, 23.0, 30.0, 27.0, 42.0, 30.0, 24.0, 45.0, 46.0, 40.0, 38.0, 31.0, 31.0, 43.0, 30.0, 26.0, 28.0, 28.0, 22.0, 22.0, 23.0, 16.0, 25.0, 20.0, 19.0, 16.0, 9.0, 10.0, 5.0, 5.0, 3.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.00038677453994750977, -0.00037334952503442764, -0.0003599245101213455, -0.0003464994952082634, -0.0003330744802951813, -0.00031964946538209915, -0.00030622445046901703, -0.0002927994355559349, -0.0002793744206428528, -0.00026594940572977066, -0.00025252439081668854, -0.00023909937590360641, -0.0002256743609905243, -0.00021224934607744217, -0.00019882433116436005, -0.00018539931625127792, -0.0001719743013381958, -0.00015854928642511368, -0.00014512427151203156, -0.00013169925659894943, -0.00011827424168586731, -0.00010484922677278519, -9.142421185970306e-05, -7.799919694662094e-05, -6.457418203353882e-05, -5.1149167120456696e-05, -3.772415220737457e-05, -2.429913729429245e-05, -1.0874122381210327e-05, 2.5508925318717957e-06, 1.597590744495392e-05, 2.940092235803604e-05, 4.2825937271118164e-05, 5.625095218420029e-05, 6.967596709728241e-05, 8.310098201036453e-05, 9.652599692344666e-05, 0.00010995101183652878, 0.0001233760267496109, 0.00013680104166269302, 0.00015022605657577515, 0.00016365107148885727, 0.0001770760864019394, 0.00019050110131502151, 0.00020392611622810364, 0.00021735113114118576, 0.00023077614605426788, 0.00024420116096735, 0.00025762617588043213, 0.00027105119079351425, 0.0002844762057065964, 0.0002979012206196785, 0.0003113262355327606, 0.00032475125044584274, 0.00033817626535892487, 0.000351601280272007, 0.0003650262951850891, 0.00037845131009817123, 0.00039187632501125336, 0.0004053013399243355, 0.0004187263548374176, 0.0004321513697504997, 0.00044557638466358185, 0.00045900139957666397, 0.0004724264144897461]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 0.0, 5.0, 3.0, 7.0, 5.0, 11.0, 13.0, 5.0, 18.0, 15.0, 19.0, 22.0, 22.0, 17.0, 41.0, 27.0, 33.0, 35.0, 42.0, 41.0, 49.0, 30.0, 52.0, 39.0, 41.0, 33.0, 32.0, 32.0, 33.0, 27.0, 29.0, 28.0, 28.0, 24.0, 24.0, 22.0, 15.0, 15.0, 17.0, 9.0, 13.0, 11.0, 4.0, 7.0, 3.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-9.25, -8.977783203125, -8.70556640625, -8.433349609375, -8.1611328125, -7.888916015625, -7.61669921875, -7.344482421875, -7.072265625, -6.800048828125, -6.52783203125, -6.255615234375, -5.9833984375, -5.711181640625, -5.43896484375, -5.166748046875, -4.89453125, -4.622314453125, -4.35009765625, -4.077880859375, -3.8056640625, -3.533447265625, -3.26123046875, -2.989013671875, -2.716796875, -2.444580078125, -2.17236328125, -1.900146484375, -1.6279296875, -1.355712890625, -1.08349609375, -0.811279296875, -0.5390625, -0.266845703125, 0.00537109375, 0.277587890625, 0.5498046875, 0.822021484375, 1.09423828125, 1.366455078125, 1.638671875, 1.910888671875, 2.18310546875, 2.455322265625, 2.7275390625, 2.999755859375, 3.27197265625, 3.544189453125, 3.81640625, 4.088623046875, 4.36083984375, 4.633056640625, 4.9052734375, 5.177490234375, 5.44970703125, 5.721923828125, 5.994140625, 6.266357421875, 6.53857421875, 6.810791015625, 7.0830078125, 7.355224609375, 7.62744140625, 7.899658203125, 8.171875]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 4.0, 14.0, 12.0, 19.0, 19.0, 28.0, 40.0, 48.0, 68.0, 97.0, 123.0, 162.0, 192.0, 268.0, 323.0, 433.0, 536.0, 691.0, 887.0, 1154.0, 1748.0, 3754.0, 12569.0, 66446.0, 356971.0, 472733.0, 99342.0, 17777.0, 4653.0, 2044.0, 1208.0, 909.0, 697.0, 560.0, 486.0, 348.0, 274.0, 222.0, 178.0, 149.0, 95.0, 74.0, 58.0, 36.0, 29.0, 20.0, 10.0, 15.0, 10.0, 14.0, 0.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-13.2578125, -12.844970703125, -12.43212890625, -12.019287109375, -11.6064453125, -11.193603515625, -10.78076171875, -10.367919921875, -9.955078125, -9.542236328125, -9.12939453125, -8.716552734375, -8.3037109375, -7.890869140625, -7.47802734375, -7.065185546875, -6.65234375, -6.239501953125, -5.82666015625, -5.413818359375, -5.0009765625, -4.588134765625, -4.17529296875, -3.762451171875, -3.349609375, -2.936767578125, -2.52392578125, -2.111083984375, -1.6982421875, -1.285400390625, -0.87255859375, -0.459716796875, -0.046875, 0.365966796875, 0.77880859375, 1.191650390625, 1.6044921875, 2.017333984375, 2.43017578125, 2.843017578125, 3.255859375, 3.668701171875, 4.08154296875, 4.494384765625, 4.9072265625, 5.320068359375, 5.73291015625, 6.145751953125, 6.55859375, 6.971435546875, 7.38427734375, 7.797119140625, 8.2099609375, 8.622802734375, 9.03564453125, 9.448486328125, 9.861328125, 10.274169921875, 10.68701171875, 11.099853515625, 11.5126953125, 11.925537109375, 12.33837890625, 12.751220703125, 13.1640625]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 1.0, 4.0, 2.0, 4.0, 5.0, 6.0, 15.0, 9.0, 14.0, 17.0, 23.0, 23.0, 30.0, 27.0, 37.0, 34.0, 49.0, 61.0, 111.0, 209.0, 1610.0, 246.0, 105.0, 71.0, 64.0, 46.0, 28.0, 36.0, 26.0, 20.0, 19.0, 23.0, 19.0, 11.0, 8.0, 8.0, 6.0, 6.0, 4.0, 7.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-26.21875, -25.3603515625, -24.501953125, -23.6435546875, -22.78515625, -21.9267578125, -21.068359375, -20.2099609375, -19.3515625, -18.4931640625, -17.634765625, -16.7763671875, -15.91796875, -15.0595703125, -14.201171875, -13.3427734375, -12.484375, -11.6259765625, -10.767578125, -9.9091796875, -9.05078125, -8.1923828125, -7.333984375, -6.4755859375, -5.6171875, -4.7587890625, -3.900390625, -3.0419921875, -2.18359375, -1.3251953125, -0.466796875, 0.3916015625, 1.25, 2.1083984375, 2.966796875, 3.8251953125, 4.68359375, 5.5419921875, 6.400390625, 7.2587890625, 8.1171875, 8.9755859375, 9.833984375, 10.6923828125, 11.55078125, 12.4091796875, 13.267578125, 14.1259765625, 14.984375, 15.8427734375, 16.701171875, 17.5595703125, 18.41796875, 19.2763671875, 20.134765625, 20.9931640625, 21.8515625, 22.7099609375, 23.568359375, 24.4267578125, 25.28515625, 26.1435546875, 27.001953125, 27.8603515625, 28.71875]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 0.0, 8.0, 7.0, 5.0, 9.0, 12.0, 3.0, 9.0, 16.0, 15.0, 22.0, 25.0, 44.0, 37.0, 51.0, 79.0, 107.0, 139.0, 212.0, 407.0, 720.0, 2133.0, 2222156.0, 915704.0, 1968.0, 745.0, 342.0, 200.0, 139.0, 95.0, 75.0, 47.0, 28.0, 32.0, 28.0, 22.0, 13.0, 14.0, 8.0, 6.0, 8.0, 4.0, 7.0, 4.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.375, -65.2001953125, -63.025390625, -60.8505859375, -58.67578125, -56.5009765625, -54.326171875, -52.1513671875, -49.9765625, -47.8017578125, -45.626953125, -43.4521484375, -41.27734375, -39.1025390625, -36.927734375, -34.7529296875, -32.578125, -30.4033203125, -28.228515625, -26.0537109375, -23.87890625, -21.7041015625, -19.529296875, -17.3544921875, -15.1796875, -13.0048828125, -10.830078125, -8.6552734375, -6.48046875, -4.3056640625, -2.130859375, 0.0439453125, 2.21875, 4.3935546875, 6.568359375, 8.7431640625, 10.91796875, 13.0927734375, 15.267578125, 17.4423828125, 19.6171875, 21.7919921875, 23.966796875, 26.1416015625, 28.31640625, 30.4912109375, 32.666015625, 34.8408203125, 37.015625, 39.1904296875, 41.365234375, 43.5400390625, 45.71484375, 47.8896484375, 50.064453125, 52.2392578125, 54.4140625, 56.5888671875, 58.763671875, 60.9384765625, 63.11328125, 65.2880859375, 67.462890625, 69.6376953125, 71.8125]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 375.0, 630.0, 9.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-173.5770721435547, -164.49459838867188, -155.41213989257812, -146.3296661376953, -137.2471923828125, -128.16473388671875, -119.08226013183594, -109.99979400634766, -100.91732788085938, -91.8348617553711, -82.75239562988281, -73.669921875, -64.58745574951172, -55.50498962402344, -46.42251968383789, -37.340049743652344, -28.257583618164062, -19.17511558532715, -10.092647552490234, -1.0101795196533203, 8.072288513183594, 17.154754638671875, 26.237224578857422, 35.31969451904297, 44.40216064453125, 53.48462677001953, 62.56709671020508, 71.64956665039062, 80.7320327758789, 89.81449890136719, 98.89697265625, 107.97943878173828, 117.06192016601562, 126.1443862915039, 135.2268524169922, 144.309326171875, 153.39178466796875, 162.47425842285156, 171.55673217773438, 180.63919067382812, 189.72166442871094, 198.80413818359375, 207.8865966796875, 216.9690704345703, 226.05154418945312, 235.13400268554688, 244.2164764404297, 253.2989501953125, 262.38140869140625, 271.4638671875, 280.5463562011719, 289.6288146972656, 298.7112731933594, 307.79376220703125, 316.876220703125, 325.95867919921875, 335.0411376953125, 344.12359619140625, 353.2060852050781, 362.2885437011719, 371.3710021972656, 380.4534912109375, 389.53594970703125, 398.618408203125, 407.7008972167969]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 7.0, 4.0, 6.0, 8.0, 11.0, 9.0, 16.0, 14.0, 21.0, 17.0, 32.0, 25.0, 36.0, 25.0, 36.0, 37.0, 33.0, 32.0, 29.0, 39.0, 38.0, 41.0, 45.0, 40.0, 34.0, 37.0, 36.0, 35.0, 40.0, 30.0, 21.0, 17.0, 24.0, 23.0, 14.0, 9.0, 12.0, 15.0, 15.0, 5.0, 11.0, 5.0, 7.0, 3.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-69.07666015625, -67.05974578857422, -65.04283905029297, -63.02592849731445, -61.00901794433594, -58.992103576660156, -56.97519302368164, -54.958282470703125, -52.94137191772461, -50.924461364746094, -48.90755081176758, -46.89064025878906, -44.87372589111328, -42.85681915283203, -40.83990478515625, -38.822994232177734, -36.80608367919922, -34.7891731262207, -32.77226257324219, -30.75535011291504, -28.738439559936523, -26.721529006958008, -24.70461654663086, -22.687705993652344, -20.670795440673828, -18.653884887695312, -16.636974334716797, -14.620061874389648, -12.603151321411133, -10.586240768432617, -8.569329261779785, -6.552417755126953, -4.5355072021484375, -2.5185961723327637, -0.5016851425170898, 1.515225887298584, 3.532136917114258, 5.549047470092773, 7.5659589767456055, 9.582870483398438, 11.599781036376953, 13.616691589355469, 15.6336030960083, 17.650514602661133, 19.66742515563965, 21.684335708618164, 23.701248168945312, 25.718158721923828, 27.735069274902344, 29.75197982788086, 31.768890380859375, 33.78580093383789, 35.802711486816406, 37.81962585449219, 39.8365364074707, 41.85344696044922, 43.870357513427734, 45.88726806640625, 47.904178619384766, 49.92108917236328, 51.93800354003906, 53.95491027832031, 55.971824645996094, 57.98873519897461, 60.005645751953125]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 8.0, 16.0, 16.0, 11.0, 17.0, 11.0, 10.0, 18.0, 20.0, 24.0, 21.0, 32.0, 36.0, 46.0, 26.0, 45.0, 47.0, 44.0, 35.0, 43.0, 45.0, 49.0, 24.0, 27.0, 25.0, 39.0, 32.0, 32.0, 33.0, 21.0, 19.0, 17.0, 21.0, 20.0, 10.0, 15.0, 7.0, 8.0, 8.0, 8.0, 5.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-9.4765625, -9.2078857421875, -8.939208984375, -8.6705322265625, -8.40185546875, -8.1331787109375, -7.864501953125, -7.5958251953125, -7.3271484375, -7.0584716796875, -6.789794921875, -6.5211181640625, -6.25244140625, -5.9837646484375, -5.715087890625, -5.4464111328125, -5.177734375, -4.9090576171875, -4.640380859375, -4.3717041015625, -4.10302734375, -3.8343505859375, -3.565673828125, -3.2969970703125, -3.0283203125, -2.7596435546875, -2.490966796875, -2.2222900390625, -1.95361328125, -1.6849365234375, -1.416259765625, -1.1475830078125, -0.87890625, -0.6102294921875, -0.341552734375, -0.0728759765625, 0.19580078125, 0.4644775390625, 0.733154296875, 1.0018310546875, 1.2705078125, 1.5391845703125, 1.807861328125, 2.0765380859375, 2.34521484375, 2.6138916015625, 2.882568359375, 3.1512451171875, 3.419921875, 3.6885986328125, 3.957275390625, 4.2259521484375, 4.49462890625, 4.7633056640625, 5.031982421875, 5.3006591796875, 5.5693359375, 5.8380126953125, 6.106689453125, 6.3753662109375, 6.64404296875, 6.9127197265625, 7.181396484375, 7.4500732421875, 7.71875]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 5.0, 4.0, 5.0, 12.0, 6.0, 21.0, 17.0, 23.0, 29.0, 42.0, 43.0, 69.0, 66.0, 88.0, 98.0, 122.0, 155.0, 237.0, 510.0, 1595.0, 8479.0, 213908.0, 3471323.0, 480621.0, 13093.0, 2010.0, 571.0, 282.0, 181.0, 124.0, 128.0, 93.0, 62.0, 62.0, 47.0, 36.0, 22.0, 30.0, 14.0, 10.0, 16.0, 7.0, 2.0, 6.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.265625, -27.277099609375, -26.28857421875, -25.300048828125, -24.3115234375, -23.322998046875, -22.33447265625, -21.345947265625, -20.357421875, -19.368896484375, -18.38037109375, -17.391845703125, -16.4033203125, -15.414794921875, -14.42626953125, -13.437744140625, -12.44921875, -11.460693359375, -10.47216796875, -9.483642578125, -8.4951171875, -7.506591796875, -6.51806640625, -5.529541015625, -4.541015625, -3.552490234375, -2.56396484375, -1.575439453125, -0.5869140625, 0.401611328125, 1.39013671875, 2.378662109375, 3.3671875, 4.355712890625, 5.34423828125, 6.332763671875, 7.3212890625, 8.309814453125, 9.29833984375, 10.286865234375, 11.275390625, 12.263916015625, 13.25244140625, 14.240966796875, 15.2294921875, 16.218017578125, 17.20654296875, 18.195068359375, 19.18359375, 20.172119140625, 21.16064453125, 22.149169921875, 23.1376953125, 24.126220703125, 25.11474609375, 26.103271484375, 27.091796875, 28.080322265625, 29.06884765625, 30.057373046875, 31.0458984375, 32.034423828125, 33.02294921875, 34.011474609375, 35.0]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 1.0, 2.0, 2.0, 7.0, 8.0, 10.0, 17.0, 14.0, 18.0, 32.0, 33.0, 47.0, 42.0, 78.0, 91.0, 107.0, 131.0, 157.0, 217.0, 292.0, 391.0, 488.0, 424.0, 340.0, 254.0, 183.0, 132.0, 107.0, 77.0, 83.0, 75.0, 46.0, 34.0, 34.0, 22.0, 22.0, 16.0, 10.0, 7.0, 7.0, 7.0, 2.0, 5.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0703125, -11.664306640625, -11.25830078125, -10.852294921875, -10.4462890625, -10.040283203125, -9.63427734375, -9.228271484375, -8.822265625, -8.416259765625, -8.01025390625, -7.604248046875, -7.1982421875, -6.792236328125, -6.38623046875, -5.980224609375, -5.57421875, -5.168212890625, -4.76220703125, -4.356201171875, -3.9501953125, -3.544189453125, -3.13818359375, -2.732177734375, -2.326171875, -1.920166015625, -1.51416015625, -1.108154296875, -0.7021484375, -0.296142578125, 0.10986328125, 0.515869140625, 0.921875, 1.327880859375, 1.73388671875, 2.139892578125, 2.5458984375, 2.951904296875, 3.35791015625, 3.763916015625, 4.169921875, 4.575927734375, 4.98193359375, 5.387939453125, 5.7939453125, 6.199951171875, 6.60595703125, 7.011962890625, 7.41796875, 7.823974609375, 8.22998046875, 8.635986328125, 9.0419921875, 9.447998046875, 9.85400390625, 10.260009765625, 10.666015625, 11.072021484375, 11.47802734375, 11.884033203125, 12.2900390625, 12.696044921875, 13.10205078125, 13.508056640625, 13.9140625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 9.0, 20.0, 17.0, 28.0, 48.0, 94.0, 136.0, 307.0, 955.0, 5541.0, 3182463.0, 999367.0, 3878.0, 784.0, 261.0, 147.0, 81.0, 52.0, 31.0, 21.0, 11.0, 11.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-80.0625, -77.7705078125, -75.478515625, -73.1865234375, -70.89453125, -68.6025390625, -66.310546875, -64.0185546875, -61.7265625, -59.4345703125, -57.142578125, -54.8505859375, -52.55859375, -50.2666015625, -47.974609375, -45.6826171875, -43.390625, -41.0986328125, -38.806640625, -36.5146484375, -34.22265625, -31.9306640625, -29.638671875, -27.3466796875, -25.0546875, -22.7626953125, -20.470703125, -18.1787109375, -15.88671875, -13.5947265625, -11.302734375, -9.0107421875, -6.71875, -4.4267578125, -2.134765625, 0.1572265625, 2.44921875, 4.7412109375, 7.033203125, 9.3251953125, 11.6171875, 13.9091796875, 16.201171875, 18.4931640625, 20.78515625, 23.0771484375, 25.369140625, 27.6611328125, 29.953125, 32.2451171875, 34.537109375, 36.8291015625, 39.12109375, 41.4130859375, 43.705078125, 45.9970703125, 48.2890625, 50.5810546875, 52.873046875, 55.1650390625, 57.45703125, 59.7490234375, 62.041015625, 64.3330078125, 66.625]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 11.0, 79.0, 331.0, 438.0, 132.0, 16.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-335.55377197265625, -329.1195983886719, -322.6854248046875, -316.2512512207031, -309.81707763671875, -303.3829040527344, -296.94873046875, -290.5145568847656, -284.08038330078125, -277.6462097167969, -271.2120361328125, -264.7778625488281, -258.34368896484375, -251.90951538085938, -245.475341796875, -239.04115295410156, -232.60696411132812, -226.17279052734375, -219.73861694335938, -213.304443359375, -206.87026977539062, -200.43609619140625, -194.00192260742188, -187.56773376464844, -181.13357543945312, -174.69940185546875, -168.26522827148438, -161.8310546875, -155.39688110351562, -148.96270751953125, -142.52853393554688, -136.09434509277344, -129.66015625, -123.22598266601562, -116.79180908203125, -110.35763549804688, -103.92345428466797, -97.4892807006836, -91.05510711669922, -84.62092590332031, -78.186767578125, -71.75259399414062, -65.31842041015625, -58.88424301147461, -52.45006561279297, -46.015892028808594, -39.58171844482422, -33.14754104614258, -26.713363647460938, -20.27918815612793, -13.845013618469238, -7.410839080810547, -0.9766635894775391, 5.457511901855469, 11.891685485839844, 18.325862884521484, 24.76003646850586, 31.194211959838867, 37.628387451171875, 44.06256103515625, 50.496734619140625, 56.930912017822266, 63.36508560180664, 69.79926300048828, 76.23343658447266]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 4.0, 4.0, 4.0, 12.0, 11.0, 13.0, 13.0, 12.0, 20.0, 17.0, 24.0, 26.0, 18.0, 35.0, 31.0, 37.0, 33.0, 35.0, 44.0, 41.0, 46.0, 34.0, 50.0, 41.0, 44.0, 34.0, 39.0, 25.0, 27.0, 34.0, 28.0, 31.0, 20.0, 20.0, 19.0, 15.0, 9.0, 12.0, 11.0, 5.0, 6.0, 7.0, 7.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-56.26118469238281, -54.52075958251953, -52.780338287353516, -51.039913177490234, -49.29949188232422, -47.55906677246094, -45.818641662597656, -44.07822036743164, -42.337799072265625, -40.597373962402344, -38.85695266723633, -37.11652755737305, -35.37610626220703, -33.63568115234375, -31.8952579498291, -30.154834747314453, -28.414409637451172, -26.673986434936523, -24.933563232421875, -23.193138122558594, -21.452716827392578, -19.712291717529297, -17.97186851501465, -16.2314453125, -14.491022109985352, -12.750598907470703, -11.010175704956055, -9.26975154876709, -7.529328346252441, -5.788905143737793, -4.048480987548828, -2.3080577850341797, -0.5676345825195312, 1.1727888584136963, 2.913212299346924, 4.6536359786987305, 6.394059181213379, 8.134482383728027, 9.874906539916992, 11.61532974243164, 13.355752944946289, 15.096176147460938, 16.836599349975586, 18.577022552490234, 20.317447662353516, 22.05786895751953, 23.798294067382812, 25.53871726989746, 27.27914047241211, 29.019563674926758, 30.759986877441406, 32.50041198730469, 34.2408332824707, 35.981258392333984, 37.7216796875, 39.46210479736328, 41.20252990722656, 42.942955017089844, 44.68337631225586, 46.42380142211914, 48.164222717285156, 49.90464782714844, 51.64507293701172, 53.385494232177734, 55.12591552734375]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 2.0, 2.0, 9.0, 4.0, 7.0, 6.0, 11.0, 17.0, 18.0, 23.0, 28.0, 27.0, 21.0, 27.0, 36.0, 39.0, 24.0, 37.0, 32.0, 39.0, 47.0, 36.0, 31.0, 43.0, 42.0, 38.0, 43.0, 34.0, 33.0, 36.0, 27.0, 26.0, 22.0, 19.0, 20.0, 19.0, 14.0, 12.0, 6.0, 5.0, 7.0, 7.0, 8.0, 2.0, 6.0, 5.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0], "bins": [-7.17578125, -6.96533203125, -6.7548828125, -6.54443359375, -6.333984375, -6.12353515625, -5.9130859375, -5.70263671875, -5.4921875, -5.28173828125, -5.0712890625, -4.86083984375, -4.650390625, -4.43994140625, -4.2294921875, -4.01904296875, -3.80859375, -3.59814453125, -3.3876953125, -3.17724609375, -2.966796875, -2.75634765625, -2.5458984375, -2.33544921875, -2.125, -1.91455078125, -1.7041015625, -1.49365234375, -1.283203125, -1.07275390625, -0.8623046875, -0.65185546875, -0.44140625, -0.23095703125, -0.0205078125, 0.18994140625, 0.400390625, 0.61083984375, 0.8212890625, 1.03173828125, 1.2421875, 1.45263671875, 1.6630859375, 1.87353515625, 2.083984375, 2.29443359375, 2.5048828125, 2.71533203125, 2.92578125, 3.13623046875, 3.3466796875, 3.55712890625, 3.767578125, 3.97802734375, 4.1884765625, 4.39892578125, 4.609375, 4.81982421875, 5.0302734375, 5.24072265625, 5.451171875, 5.66162109375, 5.8720703125, 6.08251953125, 6.29296875]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 7.0, 4.0, 4.0, 11.0, 9.0, 25.0, 24.0, 22.0, 42.0, 74.0, 118.0, 183.0, 263.0, 464.0, 801.0, 1389.0, 2286.0, 4019.0, 7313.0, 13382.0, 25265.0, 49154.0, 103708.0, 295246.0, 324492.0, 110292.0, 51795.0, 26520.0, 13883.0, 7573.0, 4152.0, 2417.0, 1378.0, 870.0, 520.0, 318.0, 185.0, 109.0, 88.0, 56.0, 29.0, 21.0, 8.0, 14.0, 7.0, 6.0, 7.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7998046875, -1.7398834228515625, -1.679962158203125, -1.6200408935546875, -1.56011962890625, -1.5001983642578125, -1.440277099609375, -1.3803558349609375, -1.3204345703125, -1.2605133056640625, -1.200592041015625, -1.1406707763671875, -1.08074951171875, -1.0208282470703125, -0.960906982421875, -0.9009857177734375, -0.841064453125, -0.7811431884765625, -0.721221923828125, -0.6613006591796875, -0.60137939453125, -0.5414581298828125, -0.481536865234375, -0.4216156005859375, -0.3616943359375, -0.3017730712890625, -0.241851806640625, -0.1819305419921875, -0.12200927734375, -0.0620880126953125, -0.002166748046875, 0.0577545166015625, 0.11767578125, 0.1775970458984375, 0.237518310546875, 0.2974395751953125, 0.35736083984375, 0.4172821044921875, 0.477203369140625, 0.5371246337890625, 0.5970458984375, 0.6569671630859375, 0.716888427734375, 0.7768096923828125, 0.83673095703125, 0.8966522216796875, 0.956573486328125, 1.0164947509765625, 1.076416015625, 1.1363372802734375, 1.196258544921875, 1.2561798095703125, 1.31610107421875, 1.3760223388671875, 1.435943603515625, 1.4958648681640625, 1.5557861328125, 1.6157073974609375, 1.675628662109375, 1.7355499267578125, 1.79547119140625, 1.8553924560546875, 1.915313720703125, 1.9752349853515625, 2.03515625]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 7.0, 7.0, 5.0, 8.0, 5.0, 15.0, 13.0, 12.0, 19.0, 20.0, 17.0, 24.0, 34.0, 34.0, 26.0, 34.0, 32.0, 36.0, 30.0, 31.0, 50.0, 1065.0, 40.0, 31.0, 40.0, 43.0, 27.0, 37.0, 32.0, 31.0, 24.0, 35.0, 23.0, 17.0, 25.0, 17.0, 20.0, 9.0, 8.0, 8.0, 10.0, 7.0, 3.0, 5.0, 2.0, 3.0, 2.0, 5.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.390625, -4.260162353515625, -4.12969970703125, -3.999237060546875, -3.8687744140625, -3.738311767578125, -3.60784912109375, -3.477386474609375, -3.346923828125, -3.216461181640625, -3.08599853515625, -2.955535888671875, -2.8250732421875, -2.694610595703125, -2.56414794921875, -2.433685302734375, -2.30322265625, -2.172760009765625, -2.04229736328125, -1.911834716796875, -1.7813720703125, -1.650909423828125, -1.52044677734375, -1.389984130859375, -1.259521484375, -1.129058837890625, -0.99859619140625, -0.868133544921875, -0.7376708984375, -0.607208251953125, -0.47674560546875, -0.346282958984375, -0.2158203125, -0.085357666015625, 0.04510498046875, 0.175567626953125, 0.3060302734375, 0.436492919921875, 0.56695556640625, 0.697418212890625, 0.827880859375, 0.958343505859375, 1.08880615234375, 1.219268798828125, 1.3497314453125, 1.480194091796875, 1.61065673828125, 1.741119384765625, 1.87158203125, 2.002044677734375, 2.13250732421875, 2.262969970703125, 2.3934326171875, 2.523895263671875, 2.65435791015625, 2.784820556640625, 2.915283203125, 3.045745849609375, 3.17620849609375, 3.306671142578125, 3.4371337890625, 3.567596435546875, 3.69805908203125, 3.828521728515625, 3.958984375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [6.0, 3.0, 2.0, 2.0, 9.0, 8.0, 12.0, 12.0, 21.0, 19.0, 38.0, 47.0, 86.0, 100.0, 141.0, 218.0, 324.0, 424.0, 591.0, 902.0, 1285.0, 1812.0, 2767.0, 3993.0, 5944.0, 8867.0, 13554.0, 20647.0, 32436.0, 51575.0, 85038.0, 157726.0, 1353447.0, 140204.0, 78778.0, 48206.0, 30004.0, 19355.0, 12618.0, 8160.0, 5536.0, 3775.0, 2626.0, 1712.0, 1254.0, 855.0, 605.0, 400.0, 294.0, 203.0, 148.0, 117.0, 76.0, 50.0, 35.0, 32.0, 20.0, 12.0, 4.0, 7.0, 4.0, 3.0, 1.0, 2.0], "bins": [-1.228515625, -1.1906280517578125, -1.152740478515625, -1.1148529052734375, -1.07696533203125, -1.0390777587890625, -1.001190185546875, -0.9633026123046875, -0.9254150390625, -0.8875274658203125, -0.849639892578125, -0.8117523193359375, -0.77386474609375, -0.7359771728515625, -0.698089599609375, -0.6602020263671875, -0.622314453125, -0.5844268798828125, -0.546539306640625, -0.5086517333984375, -0.47076416015625, -0.4328765869140625, -0.394989013671875, -0.3571014404296875, -0.3192138671875, -0.2813262939453125, -0.243438720703125, -0.2055511474609375, -0.16766357421875, -0.1297760009765625, -0.091888427734375, -0.0540008544921875, -0.01611328125, 0.0217742919921875, 0.059661865234375, 0.0975494384765625, 0.13543701171875, 0.1733245849609375, 0.211212158203125, 0.2490997314453125, 0.2869873046875, 0.3248748779296875, 0.362762451171875, 0.4006500244140625, 0.43853759765625, 0.4764251708984375, 0.514312744140625, 0.5522003173828125, 0.590087890625, 0.6279754638671875, 0.665863037109375, 0.7037506103515625, 0.74163818359375, 0.7795257568359375, 0.817413330078125, 0.8553009033203125, 0.8931884765625, 0.9310760498046875, 0.968963623046875, 1.0068511962890625, 1.04473876953125, 1.0826263427734375, 1.120513916015625, 1.1584014892578125, 1.1962890625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 9.0, 8.0, 5.0, 8.0, 10.0, 15.0, 18.0, 16.0, 24.0, 33.0, 24.0, 28.0, 33.0, 45.0, 61.0, 46.0, 39.0, 43.0, 41.0, 53.0, 62.0, 44.0, 35.0, 41.0, 44.0, 40.0, 29.0, 27.0, 20.0, 11.0, 23.0, 11.0, 8.0, 6.0, 9.0, 1.0, 2.0, 7.0, 6.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0004706382751464844, -0.0004552379250526428, -0.00043983757495880127, -0.0004244372248649597, -0.00040903687477111816, -0.0003936365246772766, -0.00037823617458343506, -0.0003628358244895935, -0.00034743547439575195, -0.0003320351243019104, -0.00031663477420806885, -0.0003012344241142273, -0.00028583407402038574, -0.0002704337239265442, -0.00025503337383270264, -0.00023963302373886108, -0.00022423267364501953, -0.00020883232355117798, -0.00019343197345733643, -0.00017803162336349487, -0.00016263127326965332, -0.00014723092317581177, -0.00013183057308197021, -0.00011643022298812866, -0.00010102987289428711, -8.562952280044556e-05, -7.0229172706604e-05, -5.482882261276245e-05, -3.94284725189209e-05, -2.4028122425079346e-05, -8.627772331237793e-06, 6.77257776260376e-06, 2.2172927856445312e-05, 3.7573277950286865e-05, 5.297362804412842e-05, 6.837397813796997e-05, 8.377432823181152e-05, 9.917467832565308e-05, 0.00011457502841949463, 0.00012997537851333618, 0.00014537572860717773, 0.0001607760787010193, 0.00017617642879486084, 0.0001915767788887024, 0.00020697712898254395, 0.0002223774790763855, 0.00023777782917022705, 0.0002531781792640686, 0.00026857852935791016, 0.0002839788794517517, 0.00029937922954559326, 0.0003147795796394348, 0.00033017992973327637, 0.0003455802798271179, 0.00036098062992095947, 0.000376380980014801, 0.0003917813301086426, 0.00040718168020248413, 0.0004225820302963257, 0.00043798238039016724, 0.0004533827304840088, 0.00046878308057785034, 0.0004841834306716919, 0.0004995837807655334, 0.000514984130859375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 8.0, 3.0, 8.0, 8.0, 9.0, 12.0, 12.0, 19.0, 25.0, 25.0, 38.0, 41.0, 86.0, 131.0, 187.0, 245.0, 451.0, 826.0, 6211.0, 1030014.0, 8061.0, 809.0, 456.0, 251.0, 174.0, 125.0, 78.0, 73.0, 48.0, 27.0, 28.0, 19.0, 16.0, 13.0, 7.0, 4.0, 3.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01544189453125, -0.0150071382522583, -0.014572381973266602, -0.014137625694274902, -0.013702869415283203, -0.013268113136291504, -0.012833356857299805, -0.012398600578308105, -0.011963844299316406, -0.011529088020324707, -0.011094331741333008, -0.010659575462341309, -0.01022481918334961, -0.00979006290435791, -0.009355306625366211, -0.008920550346374512, -0.008485794067382812, -0.008051037788391113, -0.007616281509399414, -0.007181525230407715, -0.006746768951416016, -0.006312012672424316, -0.005877256393432617, -0.005442500114440918, -0.005007743835449219, -0.0045729875564575195, -0.00413823127746582, -0.003703474998474121, -0.003268718719482422, -0.0028339624404907227, -0.0023992061614990234, -0.0019644498825073242, -0.001529693603515625, -0.0010949373245239258, -0.0006601810455322266, -0.00022542476654052734, 0.00020933151245117188, 0.0006440877914428711, 0.0010788440704345703, 0.0015136003494262695, 0.0019483566284179688, 0.002383112907409668, 0.002817869186401367, 0.0032526254653930664, 0.0036873817443847656, 0.004122138023376465, 0.004556894302368164, 0.004991650581359863, 0.0054264068603515625, 0.005861163139343262, 0.006295919418334961, 0.00673067569732666, 0.007165431976318359, 0.007600188255310059, 0.008034944534301758, 0.008469700813293457, 0.008904457092285156, 0.009339213371276855, 0.009773969650268555, 0.010208725929260254, 0.010643482208251953, 0.011078238487243652, 0.011512994766235352, 0.01194775104522705, 0.01238250732421875]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 9.0, 183.0, 592.0, 211.0, 14.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001891540247015655, -0.0018316279165446758, -0.0017717157024890184, -0.001711803488433361, -0.0016518911579623818, -0.0015919788274914026, -0.0015320666134357452, -0.0014721543993800879, -0.0014122420689091086, -0.0013523297384381294, -0.001292417524382472, -0.0012325053103268147, -0.0011725929798558354, -0.0011126806493848562, -0.0010527684353291988, -0.0009928562212735415, -0.0009329438908025622, -0.0008730316185392439, -0.0008131193462759256, -0.0007532070740126073, -0.000693294801749289, -0.0006333825294859707, -0.0005734702572226524, -0.0005135579849593341, -0.00045364571269601583, -0.00039373344043269753, -0.00033382116816937923, -0.00027390889590606093, -0.00021399662364274263, -0.00015408435137942433, -9.417207911610603e-05, -3.425980685278773e-05, 2.5652465410530567e-05, 8.556473767384887e-05, 0.00014547700993716717, 0.00020538928220048547, 0.00026530155446380377, 0.00032521382672712207, 0.00038512609899044037, 0.00044503837125375867, 0.000504950643517077, 0.0005648629157803953, 0.0006247751880437136, 0.0006846874603070319, 0.0007445997325703502, 0.0008045120048336685, 0.0008644242770969868, 0.0009243365493603051, 0.0009842488216236234, 0.0010441611520946026, 0.00110407336615026, 0.0011639855802059174, 0.0012238979106768966, 0.0012838102411478758, 0.0013437224552035332, 0.0014036346692591906, 0.0014635469997301698, 0.001523459330201149, 0.0015833715442568064, 0.0016432837583124638, 0.001703196088783443, 0.0017631084192544222, 0.0018230206333100796, 0.001882932847365737, 0.0019428451778367162]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 2.0, 4.0, 5.0, 4.0, 9.0, 14.0, 15.0, 19.0, 26.0, 28.0, 33.0, 21.0, 33.0, 35.0, 38.0, 35.0, 44.0, 34.0, 47.0, 42.0, 38.0, 47.0, 42.0, 34.0, 56.0, 30.0, 36.0, 26.0, 28.0, 23.0, 27.0, 19.0, 23.0, 16.0, 15.0, 11.0, 13.0, 7.0, 2.0, 6.0, 8.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0003077983856201172, -0.000298377126455307, -0.0002889558672904968, -0.00027953460812568665, -0.00027011334896087646, -0.0002606920897960663, -0.0002512708306312561, -0.00024184957146644592, -0.00023242831230163574, -0.00022300705313682556, -0.00021358579397201538, -0.0002041645348072052, -0.00019474327564239502, -0.00018532201647758484, -0.00017590075731277466, -0.00016647949814796448, -0.0001570582389831543, -0.00014763697981834412, -0.00013821572065353394, -0.00012879446148872375, -0.00011937320232391357, -0.0001099519431591034, -0.00010053068399429321, -9.110942482948303e-05, -8.168816566467285e-05, -7.226690649986267e-05, -6.284564733505249e-05, -5.342438817024231e-05, -4.400312900543213e-05, -3.458186984062195e-05, -2.5160610675811768e-05, -1.5739351511001587e-05, -6.318092346191406e-06, 3.1031668186187744e-06, 1.2524425983428955e-05, 2.1945685148239136e-05, 3.1366944313049316e-05, 4.07882034778595e-05, 5.020946264266968e-05, 5.963072180747986e-05, 6.905198097229004e-05, 7.847324013710022e-05, 8.78944993019104e-05, 9.731575846672058e-05, 0.00010673701763153076, 0.00011615827679634094, 0.00012557953596115112, 0.0001350007951259613, 0.00014442205429077148, 0.00015384331345558167, 0.00016326457262039185, 0.00017268583178520203, 0.0001821070909500122, 0.0001915283501148224, 0.00020094960927963257, 0.00021037086844444275, 0.00021979212760925293, 0.0002292133867740631, 0.0002386346459388733, 0.00024805590510368347, 0.00025747716426849365, 0.00026689842343330383, 0.000276319682598114, 0.0002857409417629242, 0.0002951622009277344]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 2.0, 2.0, 9.0, 4.0, 7.0, 6.0, 11.0, 17.0, 17.0, 24.0, 28.0, 27.0, 21.0, 27.0, 36.0, 39.0, 24.0, 37.0, 32.0, 39.0, 47.0, 36.0, 31.0, 43.0, 42.0, 38.0, 43.0, 34.0, 33.0, 36.0, 27.0, 26.0, 22.0, 19.0, 20.0, 19.0, 14.0, 12.0, 6.0, 5.0, 7.0, 7.0, 8.0, 2.0, 6.0, 5.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0], "bins": [-7.17578125, -6.96533203125, -6.7548828125, -6.54443359375, -6.333984375, -6.12353515625, -5.9130859375, -5.70263671875, -5.4921875, -5.28173828125, -5.0712890625, -4.86083984375, -4.650390625, -4.43994140625, -4.2294921875, -4.01904296875, -3.80859375, -3.59814453125, -3.3876953125, -3.17724609375, -2.966796875, -2.75634765625, -2.5458984375, -2.33544921875, -2.125, -1.91455078125, -1.7041015625, -1.49365234375, -1.283203125, -1.07275390625, -0.8623046875, -0.65185546875, -0.44140625, -0.23095703125, -0.0205078125, 0.18994140625, 0.400390625, 0.61083984375, 0.8212890625, 1.03173828125, 1.2421875, 1.45263671875, 1.6630859375, 1.87353515625, 2.083984375, 2.29443359375, 2.5048828125, 2.71533203125, 2.92578125, 3.13623046875, 3.3466796875, 3.55712890625, 3.767578125, 3.97802734375, 4.1884765625, 4.39892578125, 4.609375, 4.81982421875, 5.0302734375, 5.24072265625, 5.451171875, 5.66162109375, 5.8720703125, 6.08251953125, 6.29296875]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [5.0, 2.0, 1.0, 3.0, 3.0, 3.0, 8.0, 8.0, 5.0, 11.0, 13.0, 19.0, 27.0, 42.0, 53.0, 81.0, 116.0, 162.0, 204.0, 282.0, 380.0, 580.0, 832.0, 1259.0, 1902.0, 3293.0, 7708.0, 33308.0, 323651.0, 591854.0, 60979.0, 10977.0, 4011.0, 2160.0, 1403.0, 1009.0, 651.0, 447.0, 297.0, 229.0, 154.0, 137.0, 85.0, 55.0, 45.0, 27.0, 21.0, 14.0, 19.0, 12.0, 7.0, 6.0, 4.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.6171875, -15.0814208984375, -14.545654296875, -14.0098876953125, -13.47412109375, -12.9383544921875, -12.402587890625, -11.8668212890625, -11.3310546875, -10.7952880859375, -10.259521484375, -9.7237548828125, -9.18798828125, -8.6522216796875, -8.116455078125, -7.5806884765625, -7.044921875, -6.5091552734375, -5.973388671875, -5.4376220703125, -4.90185546875, -4.3660888671875, -3.830322265625, -3.2945556640625, -2.7587890625, -2.2230224609375, -1.687255859375, -1.1514892578125, -0.61572265625, -0.0799560546875, 0.455810546875, 0.9915771484375, 1.52734375, 2.0631103515625, 2.598876953125, 3.1346435546875, 3.67041015625, 4.2061767578125, 4.741943359375, 5.2777099609375, 5.8134765625, 6.3492431640625, 6.885009765625, 7.4207763671875, 7.95654296875, 8.4923095703125, 9.028076171875, 9.5638427734375, 10.099609375, 10.6353759765625, 11.171142578125, 11.7069091796875, 12.24267578125, 12.7784423828125, 13.314208984375, 13.8499755859375, 14.3857421875, 14.9215087890625, 15.457275390625, 15.9930419921875, 16.52880859375, 17.0645751953125, 17.600341796875, 18.1361083984375, 18.671875]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 8.0, 3.0, 8.0, 7.0, 15.0, 17.0, 17.0, 19.0, 16.0, 30.0, 32.0, 39.0, 41.0, 51.0, 52.0, 79.0, 121.0, 408.0, 1510.0, 156.0, 65.0, 51.0, 31.0, 33.0, 33.0, 38.0, 32.0, 22.0, 21.0, 22.0, 14.0, 11.0, 7.0, 7.0, 5.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-22.359375, -21.68310546875, -21.0068359375, -20.33056640625, -19.654296875, -18.97802734375, -18.3017578125, -17.62548828125, -16.94921875, -16.27294921875, -15.5966796875, -14.92041015625, -14.244140625, -13.56787109375, -12.8916015625, -12.21533203125, -11.5390625, -10.86279296875, -10.1865234375, -9.51025390625, -8.833984375, -8.15771484375, -7.4814453125, -6.80517578125, -6.12890625, -5.45263671875, -4.7763671875, -4.10009765625, -3.423828125, -2.74755859375, -2.0712890625, -1.39501953125, -0.71875, -0.04248046875, 0.6337890625, 1.31005859375, 1.986328125, 2.66259765625, 3.3388671875, 4.01513671875, 4.69140625, 5.36767578125, 6.0439453125, 6.72021484375, 7.396484375, 8.07275390625, 8.7490234375, 9.42529296875, 10.1015625, 10.77783203125, 11.4541015625, 12.13037109375, 12.806640625, 13.48291015625, 14.1591796875, 14.83544921875, 15.51171875, 16.18798828125, 16.8642578125, 17.54052734375, 18.216796875, 18.89306640625, 19.5693359375, 20.24560546875, 20.921875]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 7.0, 13.0, 18.0, 15.0, 20.0, 30.0, 20.0, 38.0, 45.0, 59.0, 65.0, 113.0, 150.0, 218.0, 378.0, 814.0, 2510.0, 2889545.0, 247874.0, 1876.0, 705.0, 371.0, 200.0, 140.0, 110.0, 82.0, 59.0, 44.0, 32.0, 27.0, 25.0, 24.0, 19.0, 10.0, 9.0, 10.0, 6.0, 5.0, 5.0, 4.0, 4.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-59.625, -57.75634765625, -55.8876953125, -54.01904296875, -52.150390625, -50.28173828125, -48.4130859375, -46.54443359375, -44.67578125, -42.80712890625, -40.9384765625, -39.06982421875, -37.201171875, -35.33251953125, -33.4638671875, -31.59521484375, -29.7265625, -27.85791015625, -25.9892578125, -24.12060546875, -22.251953125, -20.38330078125, -18.5146484375, -16.64599609375, -14.77734375, -12.90869140625, -11.0400390625, -9.17138671875, -7.302734375, -5.43408203125, -3.5654296875, -1.69677734375, 0.171875, 2.04052734375, 3.9091796875, 5.77783203125, 7.646484375, 9.51513671875, 11.3837890625, 13.25244140625, 15.12109375, 16.98974609375, 18.8583984375, 20.72705078125, 22.595703125, 24.46435546875, 26.3330078125, 28.20166015625, 30.0703125, 31.93896484375, 33.8076171875, 35.67626953125, 37.544921875, 39.41357421875, 41.2822265625, 43.15087890625, 45.01953125, 46.88818359375, 48.7568359375, 50.62548828125, 52.494140625, 54.36279296875, 56.2314453125, 58.10009765625, 59.96875]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 14.0, 132.0, 419.0, 348.0, 75.0, 18.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-117.1467514038086, -113.35729217529297, -109.56783294677734, -105.77836608886719, -101.98890686035156, -98.19944763183594, -94.40998840332031, -90.62052917480469, -86.83106994628906, -83.04161071777344, -79.25215148925781, -75.46269226074219, -71.67322540283203, -67.8837661743164, -64.09430694580078, -60.304847717285156, -56.515384674072266, -52.72592544555664, -48.93646240234375, -45.147003173828125, -41.3575439453125, -37.568084716796875, -33.778621673583984, -29.98916244506836, -26.1997013092041, -22.410240173339844, -18.62078094482422, -14.831319808959961, -11.04185962677002, -7.252399444580078, -3.4629383087158203, 0.3265209197998047, 4.1159820556640625, 7.905442237854004, 11.694902420043945, 15.484363555908203, 19.273822784423828, 23.063283920288086, 26.852745056152344, 30.64220428466797, 34.431663513183594, 38.22112274169922, 42.01058578491211, 45.800045013427734, 49.58950424194336, 53.37896728515625, 57.168426513671875, 60.9578857421875, 64.74734497070312, 68.53680419921875, 72.32626342773438, 76.11572265625, 79.90518951416016, 83.69464874267578, 87.4841079711914, 91.27356719970703, 95.06303405761719, 98.85249328613281, 102.64195251464844, 106.43141174316406, 110.22087860107422, 114.01033782958984, 117.79979705810547, 121.5892562866211, 125.37871551513672]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 6.0, 8.0, 6.0, 6.0, 15.0, 11.0, 20.0, 23.0, 18.0, 21.0, 22.0, 40.0, 29.0, 41.0, 29.0, 38.0, 44.0, 45.0, 42.0, 44.0, 51.0, 39.0, 50.0, 48.0, 42.0, 35.0, 26.0, 34.0, 27.0, 26.0, 21.0, 19.0, 14.0, 12.0, 7.0, 13.0, 4.0, 10.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-70.54090118408203, -68.44624328613281, -66.35159301757812, -64.2569351196289, -62.16228485107422, -60.067630767822266, -57.97297668457031, -55.878318786621094, -53.783668518066406, -51.68901443481445, -49.5943603515625, -47.49970626831055, -45.405052185058594, -43.31039810180664, -41.21574401855469, -39.12108612060547, -37.026432037353516, -34.93177795410156, -32.83712387084961, -30.742469787597656, -28.647815704345703, -26.55316162109375, -24.458505630493164, -22.36385154724121, -20.269197463989258, -18.174543380737305, -16.07988929748535, -13.985234260559082, -11.890580177307129, -9.795926094055176, -7.701271057128906, -5.606616973876953, -3.5119590759277344, -1.4173047542572021, 0.6773495674133301, 2.7720041275024414, 4.8666582107543945, 6.961312294006348, 9.055967330932617, 11.15062141418457, 13.245275497436523, 15.339929580688477, 17.43458366394043, 19.529239654541016, 21.62389373779297, 23.718547821044922, 25.813201904296875, 27.907855987548828, 30.00251007080078, 32.097164154052734, 34.19181823730469, 36.28647232055664, 38.381126403808594, 40.47578048706055, 42.5704345703125, 44.66509246826172, 46.759742736816406, 48.85439682006836, 50.94905090332031, 53.043704986572266, 55.13835906982422, 57.23301315307617, 59.327667236328125, 61.422325134277344, 63.5169792175293]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 5.0, 4.0, 5.0, 6.0, 6.0, 9.0, 8.0, 8.0, 7.0, 16.0, 12.0, 17.0, 23.0, 21.0, 27.0, 26.0, 25.0, 38.0, 35.0, 32.0, 49.0, 40.0, 38.0, 36.0, 33.0, 47.0, 49.0, 32.0, 37.0, 25.0, 35.0, 35.0, 25.0, 21.0, 23.0, 33.0, 22.0, 14.0, 14.0, 21.0, 9.0, 9.0, 7.0, 6.0, 8.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.15234375, -5.93609619140625, -5.7198486328125, -5.50360107421875, -5.287353515625, -5.07110595703125, -4.8548583984375, -4.63861083984375, -4.42236328125, -4.20611572265625, -3.9898681640625, -3.77362060546875, -3.557373046875, -3.34112548828125, -3.1248779296875, -2.90863037109375, -2.6923828125, -2.47613525390625, -2.2598876953125, -2.04364013671875, -1.827392578125, -1.61114501953125, -1.3948974609375, -1.17864990234375, -0.96240234375, -0.74615478515625, -0.5299072265625, -0.31365966796875, -0.097412109375, 0.11883544921875, 0.3350830078125, 0.55133056640625, 0.767578125, 0.98382568359375, 1.2000732421875, 1.41632080078125, 1.632568359375, 1.84881591796875, 2.0650634765625, 2.28131103515625, 2.49755859375, 2.71380615234375, 2.9300537109375, 3.14630126953125, 3.362548828125, 3.57879638671875, 3.7950439453125, 4.01129150390625, 4.2275390625, 4.44378662109375, 4.6600341796875, 4.87628173828125, 5.092529296875, 5.30877685546875, 5.5250244140625, 5.74127197265625, 5.95751953125, 6.17376708984375, 6.3900146484375, 6.60626220703125, 6.822509765625, 7.03875732421875, 7.2550048828125, 7.47125244140625, 7.6875]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 6.0, 5.0, 7.0, 12.0, 7.0, 19.0, 27.0, 30.0, 47.0, 70.0, 93.0, 117.0, 202.0, 298.0, 441.0, 638.0, 953.0, 1575.0, 2639.0, 4545.0, 8834.0, 19687.0, 56573.0, 225349.0, 900209.0, 1755552.0, 893334.0, 229851.0, 54272.0, 18942.0, 8563.0, 4487.0, 2511.0, 1508.0, 936.0, 652.0, 403.0, 275.0, 195.0, 133.0, 88.0, 54.0, 59.0, 40.0, 17.0, 18.0, 7.0, 4.0, 7.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.875, -8.583984375, -8.29296875, -8.001953125, -7.7109375, -7.419921875, -7.12890625, -6.837890625, -6.546875, -6.255859375, -5.96484375, -5.673828125, -5.3828125, -5.091796875, -4.80078125, -4.509765625, -4.21875, -3.927734375, -3.63671875, -3.345703125, -3.0546875, -2.763671875, -2.47265625, -2.181640625, -1.890625, -1.599609375, -1.30859375, -1.017578125, -0.7265625, -0.435546875, -0.14453125, 0.146484375, 0.4375, 0.728515625, 1.01953125, 1.310546875, 1.6015625, 1.892578125, 2.18359375, 2.474609375, 2.765625, 3.056640625, 3.34765625, 3.638671875, 3.9296875, 4.220703125, 4.51171875, 4.802734375, 5.09375, 5.384765625, 5.67578125, 5.966796875, 6.2578125, 6.548828125, 6.83984375, 7.130859375, 7.421875, 7.712890625, 8.00390625, 8.294921875, 8.5859375, 8.876953125, 9.16796875, 9.458984375, 9.75]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 6.0, 21.0, 21.0, 33.0, 29.0, 44.0, 75.0, 112.0, 165.0, 235.0, 324.0, 435.0, 544.0, 572.0, 393.0, 285.0, 209.0, 155.0, 128.0, 79.0, 50.0, 47.0, 42.0, 15.0, 12.0, 10.0, 6.0, 5.0, 4.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.828125, -12.370361328125, -11.91259765625, -11.454833984375, -10.9970703125, -10.539306640625, -10.08154296875, -9.623779296875, -9.166015625, -8.708251953125, -8.25048828125, -7.792724609375, -7.3349609375, -6.877197265625, -6.41943359375, -5.961669921875, -5.50390625, -5.046142578125, -4.58837890625, -4.130615234375, -3.6728515625, -3.215087890625, -2.75732421875, -2.299560546875, -1.841796875, -1.384033203125, -0.92626953125, -0.468505859375, -0.0107421875, 0.447021484375, 0.90478515625, 1.362548828125, 1.8203125, 2.278076171875, 2.73583984375, 3.193603515625, 3.6513671875, 4.109130859375, 4.56689453125, 5.024658203125, 5.482421875, 5.940185546875, 6.39794921875, 6.855712890625, 7.3134765625, 7.771240234375, 8.22900390625, 8.686767578125, 9.14453125, 9.602294921875, 10.06005859375, 10.517822265625, 10.9755859375, 11.433349609375, 11.89111328125, 12.348876953125, 12.806640625, 13.264404296875, 13.72216796875, 14.179931640625, 14.6376953125, 15.095458984375, 15.55322265625, 16.010986328125, 16.46875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 5.0, 4.0, 11.0, 9.0, 18.0, 24.0, 35.0, 56.0, 99.0, 201.0, 443.0, 1079.0, 3929.0, 2676108.0, 1506696.0, 3678.0, 1000.0, 424.0, 206.0, 98.0, 58.0, 28.0, 32.0, 11.0, 11.0, 8.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-68.6875, -66.7236328125, -64.759765625, -62.7958984375, -60.83203125, -58.8681640625, -56.904296875, -54.9404296875, -52.9765625, -51.0126953125, -49.048828125, -47.0849609375, -45.12109375, -43.1572265625, -41.193359375, -39.2294921875, -37.265625, -35.3017578125, -33.337890625, -31.3740234375, -29.41015625, -27.4462890625, -25.482421875, -23.5185546875, -21.5546875, -19.5908203125, -17.626953125, -15.6630859375, -13.69921875, -11.7353515625, -9.771484375, -7.8076171875, -5.84375, -3.8798828125, -1.916015625, 0.0478515625, 2.01171875, 3.9755859375, 5.939453125, 7.9033203125, 9.8671875, 11.8310546875, 13.794921875, 15.7587890625, 17.72265625, 19.6865234375, 21.650390625, 23.6142578125, 25.578125, 27.5419921875, 29.505859375, 31.4697265625, 33.43359375, 35.3974609375, 37.361328125, 39.3251953125, 41.2890625, 43.2529296875, 45.216796875, 47.1806640625, 49.14453125, 51.1083984375, 53.072265625, 55.0361328125, 57.0]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 38.0, 311.0, 510.0, 142.0, 10.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-331.8716125488281, -325.74896240234375, -319.6263427734375, -313.5036926269531, -307.3810729980469, -301.2584228515625, -295.13580322265625, -289.0131530761719, -282.8905029296875, -276.7678527832031, -270.6452331542969, -264.5225830078125, -258.39996337890625, -252.27731323242188, -246.15467834472656, -240.03204345703125, -233.90940856933594, -227.78677368164062, -221.6641387939453, -215.54150390625, -209.41885375976562, -203.2962188720703, -197.173583984375, -191.0509490966797, -184.92831420898438, -178.80567932128906, -172.68304443359375, -166.56039428710938, -160.43775939941406, -154.31512451171875, -148.19248962402344, -142.06985473632812, -135.94720458984375, -129.82456970214844, -123.7019271850586, -117.57929229736328, -111.45664978027344, -105.33401489257812, -99.21138000488281, -93.0887451171875, -86.96610260009766, -80.84346771240234, -74.7208251953125, -68.59819030761719, -62.47555160522461, -56.35291290283203, -50.23027801513672, -44.10763931274414, -37.98500061035156, -31.862361907958984, -25.73972511291504, -19.617088317871094, -13.494449615478516, -7.3718109130859375, -1.249176025390625, 4.873462677001953, 10.996101379394531, 17.11874008178711, 23.241376876831055, 29.364013671875, 35.48665237426758, 41.609291076660156, 47.73192596435547, 53.85456466674805, 59.977203369140625]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 0.0, 2.0, 4.0, 5.0, 9.0, 5.0, 10.0, 18.0, 8.0, 12.0, 20.0, 12.0, 15.0, 18.0, 20.0, 28.0, 36.0, 44.0, 33.0, 36.0, 34.0, 31.0, 35.0, 37.0, 44.0, 43.0, 49.0, 39.0, 36.0, 35.0, 32.0, 38.0, 33.0, 26.0, 25.0, 22.0, 18.0, 13.0, 15.0, 14.0, 7.0, 12.0, 9.0, 8.0, 9.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-41.966888427734375, -40.498680114746094, -39.03047561645508, -37.5622673034668, -36.09406280517578, -34.6258544921875, -33.15764617919922, -31.68943977355957, -30.221233367919922, -28.753026962280273, -27.284820556640625, -25.816612243652344, -24.348405838012695, -22.880199432373047, -21.411991119384766, -19.943784713745117, -18.47557830810547, -17.00737190246582, -15.539164543151855, -14.07095718383789, -12.602750778198242, -11.134544372558594, -9.666337013244629, -8.198129653930664, -6.729923248291016, -5.261716365814209, -3.7935094833374023, -2.3253026008605957, -0.8570957183837891, 0.6111111640930176, 2.079318046569824, 3.547525405883789, 5.0157318115234375, 6.483938694000244, 7.952145576477051, 9.420352935791016, 10.888559341430664, 12.356765747070312, 13.824973106384277, 15.293180465698242, 16.76138687133789, 18.22959327697754, 19.697799682617188, 21.16600799560547, 22.634214401245117, 24.102420806884766, 25.570629119873047, 27.038835525512695, 28.507041931152344, 29.975248336791992, 31.44345474243164, 32.91166305541992, 34.37986755371094, 35.84807586669922, 37.3162841796875, 38.78449249267578, 40.2526969909668, 41.72090530395508, 43.189109802246094, 44.657318115234375, 46.125526428222656, 47.59373092651367, 49.06193923950195, 50.53014373779297, 51.99835205078125]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 11.0, 4.0, 8.0, 10.0, 13.0, 13.0, 13.0, 15.0, 19.0, 25.0, 18.0, 26.0, 32.0, 26.0, 25.0, 27.0, 36.0, 35.0, 39.0, 41.0, 49.0, 36.0, 32.0, 46.0, 32.0, 33.0, 36.0, 33.0, 27.0, 21.0, 30.0, 32.0, 20.0, 20.0, 14.0, 25.0, 14.0, 10.0, 5.0, 11.0, 7.0, 5.0, 6.0, 8.0, 3.0, 2.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-4.984375, -4.81640625, -4.6484375, -4.48046875, -4.3125, -4.14453125, -3.9765625, -3.80859375, -3.640625, -3.47265625, -3.3046875, -3.13671875, -2.96875, -2.80078125, -2.6328125, -2.46484375, -2.296875, -2.12890625, -1.9609375, -1.79296875, -1.625, -1.45703125, -1.2890625, -1.12109375, -0.953125, -0.78515625, -0.6171875, -0.44921875, -0.28125, -0.11328125, 0.0546875, 0.22265625, 0.390625, 0.55859375, 0.7265625, 0.89453125, 1.0625, 1.23046875, 1.3984375, 1.56640625, 1.734375, 1.90234375, 2.0703125, 2.23828125, 2.40625, 2.57421875, 2.7421875, 2.91015625, 3.078125, 3.24609375, 3.4140625, 3.58203125, 3.75, 3.91796875, 4.0859375, 4.25390625, 4.421875, 4.58984375, 4.7578125, 4.92578125, 5.09375, 5.26171875, 5.4296875, 5.59765625, 5.765625]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 5.0, 9.0, 4.0, 16.0, 26.0, 42.0, 64.0, 96.0, 158.0, 221.0, 309.0, 468.0, 682.0, 1052.0, 1530.0, 2224.0, 3347.0, 5047.0, 7588.0, 11359.0, 17288.0, 26248.0, 40751.0, 65952.0, 120017.0, 307133.0, 196295.0, 89918.0, 52738.0, 33222.0, 21906.0, 14365.0, 9521.0, 6235.0, 4125.0, 2819.0, 1908.0, 1241.0, 831.0, 576.0, 400.0, 264.0, 172.0, 126.0, 87.0, 52.0, 38.0, 29.0, 21.0, 11.0, 10.0, 5.0, 5.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.033203125, -0.998504638671875, -0.96380615234375, -0.929107666015625, -0.8944091796875, -0.859710693359375, -0.82501220703125, -0.790313720703125, -0.755615234375, -0.720916748046875, -0.68621826171875, -0.651519775390625, -0.6168212890625, -0.582122802734375, -0.54742431640625, -0.512725830078125, -0.47802734375, -0.443328857421875, -0.40863037109375, -0.373931884765625, -0.3392333984375, -0.304534912109375, -0.26983642578125, -0.235137939453125, -0.200439453125, -0.165740966796875, -0.13104248046875, -0.096343994140625, -0.0616455078125, -0.026947021484375, 0.00775146484375, 0.042449951171875, 0.0771484375, 0.111846923828125, 0.14654541015625, 0.181243896484375, 0.2159423828125, 0.250640869140625, 0.28533935546875, 0.320037841796875, 0.354736328125, 0.389434814453125, 0.42413330078125, 0.458831787109375, 0.4935302734375, 0.528228759765625, 0.56292724609375, 0.597625732421875, 0.63232421875, 0.667022705078125, 0.70172119140625, 0.736419677734375, 0.7711181640625, 0.805816650390625, 0.84051513671875, 0.875213623046875, 0.909912109375, 0.944610595703125, 0.97930908203125, 1.014007568359375, 1.0487060546875, 1.083404541015625, 1.11810302734375, 1.152801513671875, 1.1875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 8.0, 4.0, 6.0, 8.0, 10.0, 12.0, 16.0, 10.0, 25.0, 19.0, 23.0, 30.0, 31.0, 33.0, 30.0, 32.0, 47.0, 54.0, 44.0, 41.0, 1059.0, 43.0, 39.0, 35.0, 41.0, 33.0, 44.0, 49.0, 27.0, 25.0, 25.0, 20.0, 25.0, 16.0, 18.0, 11.0, 9.0, 8.0, 7.0, 4.0, 4.0, 3.0, 5.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-4.625, -4.49871826171875, -4.3724365234375, -4.24615478515625, -4.119873046875, -3.99359130859375, -3.8673095703125, -3.74102783203125, -3.61474609375, -3.48846435546875, -3.3621826171875, -3.23590087890625, -3.109619140625, -2.98333740234375, -2.8570556640625, -2.73077392578125, -2.6044921875, -2.47821044921875, -2.3519287109375, -2.22564697265625, -2.099365234375, -1.97308349609375, -1.8468017578125, -1.72052001953125, -1.59423828125, -1.46795654296875, -1.3416748046875, -1.21539306640625, -1.089111328125, -0.96282958984375, -0.8365478515625, -0.71026611328125, -0.583984375, -0.45770263671875, -0.3314208984375, -0.20513916015625, -0.078857421875, 0.04742431640625, 0.1737060546875, 0.29998779296875, 0.42626953125, 0.55255126953125, 0.6788330078125, 0.80511474609375, 0.931396484375, 1.05767822265625, 1.1839599609375, 1.31024169921875, 1.4365234375, 1.56280517578125, 1.6890869140625, 1.81536865234375, 1.941650390625, 2.06793212890625, 2.1942138671875, 2.32049560546875, 2.44677734375, 2.57305908203125, 2.6993408203125, 2.82562255859375, 2.951904296875, 3.07818603515625, 3.2044677734375, 3.33074951171875, 3.45703125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 6.0, 6.0, 8.0, 9.0, 24.0, 26.0, 44.0, 67.0, 95.0, 150.0, 239.0, 324.0, 526.0, 844.0, 1320.0, 2038.0, 3306.0, 5316.0, 8435.0, 14028.0, 23440.0, 40362.0, 72381.0, 137324.0, 1374330.0, 195404.0, 92202.0, 50737.0, 28964.0, 17322.0, 10438.0, 6455.0, 3975.0, 2511.0, 1597.0, 1058.0, 638.0, 424.0, 256.0, 179.0, 107.0, 79.0, 50.0, 31.0, 26.0, 12.0, 6.0, 14.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.29296875, -1.2534332275390625, -1.213897705078125, -1.1743621826171875, -1.13482666015625, -1.0952911376953125, -1.055755615234375, -1.0162200927734375, -0.9766845703125, -0.9371490478515625, -0.897613525390625, -0.8580780029296875, -0.81854248046875, -0.7790069580078125, -0.739471435546875, -0.6999359130859375, -0.660400390625, -0.6208648681640625, -0.581329345703125, -0.5417938232421875, -0.50225830078125, -0.4627227783203125, -0.423187255859375, -0.3836517333984375, -0.3441162109375, -0.3045806884765625, -0.265045166015625, -0.2255096435546875, -0.18597412109375, -0.1464385986328125, -0.106903076171875, -0.0673675537109375, -0.02783203125, 0.0117034912109375, 0.051239013671875, 0.0907745361328125, 0.13031005859375, 0.1698455810546875, 0.209381103515625, 0.2489166259765625, 0.2884521484375, 0.3279876708984375, 0.367523193359375, 0.4070587158203125, 0.44659423828125, 0.4861297607421875, 0.525665283203125, 0.5652008056640625, 0.604736328125, 0.6442718505859375, 0.683807373046875, 0.7233428955078125, 0.76287841796875, 0.8024139404296875, 0.841949462890625, 0.8814849853515625, 0.9210205078125, 0.9605560302734375, 1.000091552734375, 1.0396270751953125, 1.07916259765625, 1.1186981201171875, 1.158233642578125, 1.1977691650390625, 1.2373046875]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 12.0, 4.0, 12.0, 10.0, 10.0, 18.0, 17.0, 26.0, 23.0, 40.0, 36.0, 39.0, 41.0, 62.0, 65.0, 54.0, 71.0, 69.0, 74.0, 45.0, 56.0, 44.0, 33.0, 32.0, 23.0, 19.0, 17.0, 9.0, 8.0, 7.0, 9.0, 5.0, 2.0, 5.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004925727844238281, -0.0004733428359031677, -0.0004541128873825073, -0.0004348829388618469, -0.0004156529903411865, -0.0003964230418205261, -0.0003771930932998657, -0.0003579631447792053, -0.0003387331962585449, -0.0003195032477378845, -0.0003002732992172241, -0.0002810433506965637, -0.0002618134021759033, -0.00024258345365524292, -0.00022335350513458252, -0.00020412355661392212, -0.00018489360809326172, -0.00016566365957260132, -0.00014643371105194092, -0.00012720376253128052, -0.00010797381401062012, -8.874386548995972e-05, -6.951391696929932e-05, -5.0283968448638916e-05, -3.1054019927978516e-05, -1.1824071407318115e-05, 7.405877113342285e-06, 2.6635825634002686e-05, 4.5865774154663086e-05, 6.509572267532349e-05, 8.432567119598389e-05, 0.00010355561971664429, 0.0001227855682373047, 0.0001420155167579651, 0.0001612454652786255, 0.0001804754137992859, 0.0001997053623199463, 0.0002189353108406067, 0.0002381652593612671, 0.0002573952078819275, 0.0002766251564025879, 0.0002958551049232483, 0.0003150850534439087, 0.0003343150019645691, 0.0003535449504852295, 0.0003727748990058899, 0.0003920048475265503, 0.0004112347960472107, 0.0004304647445678711, 0.0004496946930885315, 0.0004689246416091919, 0.0004881545901298523, 0.0005073845386505127, 0.0005266144871711731, 0.0005458444356918335, 0.0005650743842124939, 0.0005843043327331543, 0.0006035342812538147, 0.0006227642297744751, 0.0006419941782951355, 0.0006612241268157959, 0.0006804540753364563, 0.0006996840238571167, 0.0007189139723777771, 0.0007381439208984375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 6.0, 5.0, 10.0, 16.0, 16.0, 11.0, 29.0, 33.0, 58.0, 67.0, 81.0, 111.0, 177.0, 309.0, 528.0, 1020.0, 51417.0, 991307.0, 1420.0, 663.0, 391.0, 259.0, 176.0, 122.0, 91.0, 69.0, 43.0, 36.0, 21.0, 17.0, 16.0, 12.0, 2.0, 3.0, 3.0, 7.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0133514404296875, -0.01293647289276123, -0.012521505355834961, -0.012106537818908691, -0.011691570281982422, -0.011276602745056152, -0.010861635208129883, -0.010446667671203613, -0.010031700134277344, -0.009616732597351074, -0.009201765060424805, -0.008786797523498535, -0.008371829986572266, -0.007956862449645996, -0.0075418949127197266, -0.007126927375793457, -0.0067119598388671875, -0.006296992301940918, -0.0058820247650146484, -0.005467057228088379, -0.005052089691162109, -0.00463712215423584, -0.00422215461730957, -0.0038071870803833008, -0.0033922195434570312, -0.0029772520065307617, -0.002562284469604492, -0.0021473169326782227, -0.0017323493957519531, -0.0013173818588256836, -0.0009024143218994141, -0.00048744678497314453, -7.2479248046875e-05, 0.00034248828887939453, 0.0007574558258056641, 0.0011724233627319336, 0.0015873908996582031, 0.0020023584365844727, 0.002417325973510742, 0.0028322935104370117, 0.0032472610473632812, 0.0036622285842895508, 0.00407719612121582, 0.00449216365814209, 0.004907131195068359, 0.005322098731994629, 0.0057370662689208984, 0.006152033805847168, 0.0065670013427734375, 0.006981968879699707, 0.0073969364166259766, 0.007811903953552246, 0.008226871490478516, 0.008641839027404785, 0.009056806564331055, 0.009471774101257324, 0.009886741638183594, 0.010301709175109863, 0.010716676712036133, 0.011131644248962402, 0.011546611785888672, 0.011961579322814941, 0.012376546859741211, 0.01279151439666748, 0.01320648193359375]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 23.0, 301.0, 604.0, 79.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0017445945413783193, -0.0016965147806331515, -0.0016484350198879838, -0.001600355375558138, -0.0015522756148129702, -0.0015041958540678024, -0.0014561160933226347, -0.001408036332577467, -0.0013599565718322992, -0.0013118768110871315, -0.0012637970503419638, -0.001215717289596796, -0.0011676376452669501, -0.0011195578845217824, -0.0010714781237766147, -0.001023398363031447, -0.000975318718701601, -0.0009272389579564333, -0.0008791592554189265, -0.0008310794946737587, -0.0007829997921362519, -0.0007349200313910842, -0.0006868402706459165, -0.0006387605099007487, -0.0005906808073632419, -0.0005426010466180742, -0.0004945213440805674, -0.00044644158333539963, -0.00039836185169406235, -0.0003502821200527251, -0.00030220235930755734, -0.00025412262766622007, -0.0002060428960248828, -0.00015796316438354552, -0.00010988341819029301, -6.180367199704051e-05, -1.3723940355703235e-05, 3.435579128563404e-05, 8.243555203080177e-05, 0.00013051528367213905, 0.00017859501531347632, 0.0002266747469548136, 0.0002747544785961509, 0.0003228342393413186, 0.0003709139709826559, 0.00041899370262399316, 0.0004670734633691609, 0.0005151531659066677, 0.0005632329266518354, 0.0006113126873970032, 0.00065939238993451, 0.0007074721506796777, 0.0007555518532171845, 0.0008036316139623523, 0.00085171137470752, 0.0008997911354526877, 0.0009478708379901946, 0.0009959505405277014, 0.0010440303012728691, 0.0010921100620180368, 0.0011401898227632046, 0.0011882695835083723, 0.00123634934425354, 0.001284428988583386, 0.0013325087493285537]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 6.0, 4.0, 1.0, 3.0, 8.0, 7.0, 8.0, 16.0, 13.0, 23.0, 20.0, 26.0, 22.0, 28.0, 21.0, 43.0, 31.0, 37.0, 40.0, 52.0, 40.0, 38.0, 38.0, 40.0, 41.0, 37.0, 29.0, 33.0, 40.0, 34.0, 41.0, 25.0, 27.0, 26.0, 19.0, 13.0, 20.0, 17.0, 10.0, 7.0, 4.0, 6.0, 5.0, 3.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00029289722442626953, -0.00028328970074653625, -0.000273682177066803, -0.0002640746533870697, -0.0002544671297073364, -0.00024485960602760315, -0.00023525208234786987, -0.0002256445586681366, -0.00021603703498840332, -0.00020642951130867004, -0.00019682198762893677, -0.0001872144639492035, -0.00017760694026947021, -0.00016799941658973694, -0.00015839189291000366, -0.00014878436923027039, -0.0001391768455505371, -0.00012956932187080383, -0.00011996179819107056, -0.00011035427451133728, -0.000100746750831604, -9.113922715187073e-05, -8.153170347213745e-05, -7.192417979240417e-05, -6.23166561126709e-05, -5.270913243293762e-05, -4.3101608753204346e-05, -3.349408507347107e-05, -2.3886561393737793e-05, -1.4279037714004517e-05, -4.67151403427124e-06, 4.936009645462036e-06, 1.4543533325195312e-05, 2.415105700492859e-05, 3.3758580684661865e-05, 4.336610436439514e-05, 5.297362804412842e-05, 6.25811517238617e-05, 7.218867540359497e-05, 8.179619908332825e-05, 9.140372276306152e-05, 0.0001010112464427948, 0.00011061877012252808, 0.00012022629380226135, 0.00012983381748199463, 0.0001394413411617279, 0.00014904886484146118, 0.00015865638852119446, 0.00016826391220092773, 0.000177871435880661, 0.0001874789595603943, 0.00019708648324012756, 0.00020669400691986084, 0.00021630153059959412, 0.0002259090542793274, 0.00023551657795906067, 0.00024512410163879395, 0.0002547316253185272, 0.0002643391489982605, 0.0002739466726779938, 0.00028355419635772705, 0.00029316172003746033, 0.0003027692437171936, 0.0003123767673969269, 0.00032198429107666016]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 11.0, 4.0, 8.0, 10.0, 13.0, 13.0, 13.0, 15.0, 19.0, 25.0, 18.0, 26.0, 32.0, 26.0, 25.0, 27.0, 36.0, 35.0, 39.0, 41.0, 49.0, 35.0, 33.0, 46.0, 32.0, 33.0, 36.0, 33.0, 27.0, 21.0, 30.0, 32.0, 20.0, 20.0, 14.0, 25.0, 14.0, 10.0, 5.0, 11.0, 7.0, 5.0, 6.0, 8.0, 3.0, 2.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-4.984375, -4.81640625, -4.6484375, -4.48046875, -4.3125, -4.14453125, -3.9765625, -3.80859375, -3.640625, -3.47265625, -3.3046875, -3.13671875, -2.96875, -2.80078125, -2.6328125, -2.46484375, -2.296875, -2.12890625, -1.9609375, -1.79296875, -1.625, -1.45703125, -1.2890625, -1.12109375, -0.953125, -0.78515625, -0.6171875, -0.44921875, -0.28125, -0.11328125, 0.0546875, 0.22265625, 0.390625, 0.55859375, 0.7265625, 0.89453125, 1.0625, 1.23046875, 1.3984375, 1.56640625, 1.734375, 1.90234375, 2.0703125, 2.23828125, 2.40625, 2.57421875, 2.7421875, 2.91015625, 3.078125, 3.24609375, 3.4140625, 3.58203125, 3.75, 3.91796875, 4.0859375, 4.25390625, 4.421875, 4.58984375, 4.7578125, 4.92578125, 5.09375, 5.26171875, 5.4296875, 5.59765625, 5.765625]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 7.0, 9.0, 14.0, 17.0, 27.0, 25.0, 40.0, 50.0, 61.0, 90.0, 116.0, 168.0, 234.0, 343.0, 474.0, 855.0, 1314.0, 2460.0, 5238.0, 13392.0, 42532.0, 205911.0, 603065.0, 122936.0, 29587.0, 10058.0, 4064.0, 2052.0, 1169.0, 721.0, 439.0, 329.0, 187.0, 141.0, 103.0, 82.0, 61.0, 41.0, 32.0, 24.0, 14.0, 17.0, 15.0, 7.0, 6.0, 5.0, 5.0, 7.0, 0.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-9.5859375, -9.2593994140625, -8.932861328125, -8.6063232421875, -8.27978515625, -7.9532470703125, -7.626708984375, -7.3001708984375, -6.9736328125, -6.6470947265625, -6.320556640625, -5.9940185546875, -5.66748046875, -5.3409423828125, -5.014404296875, -4.6878662109375, -4.361328125, -4.0347900390625, -3.708251953125, -3.3817138671875, -3.05517578125, -2.7286376953125, -2.402099609375, -2.0755615234375, -1.7490234375, -1.4224853515625, -1.095947265625, -0.7694091796875, -0.44287109375, -0.1163330078125, 0.210205078125, 0.5367431640625, 0.86328125, 1.1898193359375, 1.516357421875, 1.8428955078125, 2.16943359375, 2.4959716796875, 2.822509765625, 3.1490478515625, 3.4755859375, 3.8021240234375, 4.128662109375, 4.4552001953125, 4.78173828125, 5.1082763671875, 5.434814453125, 5.7613525390625, 6.087890625, 6.4144287109375, 6.740966796875, 7.0675048828125, 7.39404296875, 7.7205810546875, 8.047119140625, 8.3736572265625, 8.7001953125, 9.0267333984375, 9.353271484375, 9.6798095703125, 10.00634765625, 10.3328857421875, 10.659423828125, 10.9859619140625, 11.3125]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 0.0, 3.0, 7.0, 6.0, 8.0, 8.0, 4.0, 8.0, 18.0, 11.0, 13.0, 22.0, 24.0, 19.0, 24.0, 36.0, 34.0, 41.0, 51.0, 47.0, 113.0, 470.0, 1563.0, 127.0, 59.0, 41.0, 41.0, 33.0, 39.0, 34.0, 25.0, 20.0, 13.0, 13.0, 9.0, 15.0, 14.0, 13.0, 8.0, 4.0, 3.0, 3.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.0703125, -13.5858154296875, -13.101318359375, -12.6168212890625, -12.13232421875, -11.6478271484375, -11.163330078125, -10.6788330078125, -10.1943359375, -9.7098388671875, -9.225341796875, -8.7408447265625, -8.25634765625, -7.7718505859375, -7.287353515625, -6.8028564453125, -6.318359375, -5.8338623046875, -5.349365234375, -4.8648681640625, -4.38037109375, -3.8958740234375, -3.411376953125, -2.9268798828125, -2.4423828125, -1.9578857421875, -1.473388671875, -0.9888916015625, -0.50439453125, -0.0198974609375, 0.464599609375, 0.9490966796875, 1.43359375, 1.9180908203125, 2.402587890625, 2.8870849609375, 3.37158203125, 3.8560791015625, 4.340576171875, 4.8250732421875, 5.3095703125, 5.7940673828125, 6.278564453125, 6.7630615234375, 7.24755859375, 7.7320556640625, 8.216552734375, 8.7010498046875, 9.185546875, 9.6700439453125, 10.154541015625, 10.6390380859375, 11.12353515625, 11.6080322265625, 12.092529296875, 12.5770263671875, 13.0615234375, 13.5460205078125, 14.030517578125, 14.5150146484375, 14.99951171875, 15.4840087890625, 15.968505859375, 16.4530029296875, 16.9375]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 3.0, 1.0, 7.0, 4.0, 4.0, 5.0, 12.0, 16.0, 15.0, 16.0, 15.0, 17.0, 32.0, 41.0, 68.0, 84.0, 148.0, 273.0, 456.0, 1044.0, 21118.0, 3117402.0, 3233.0, 689.0, 363.0, 203.0, 116.0, 84.0, 45.0, 41.0, 31.0, 16.0, 19.0, 17.0, 12.0, 11.0, 7.0, 3.0, 9.0, 7.0, 6.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-51.3125, -49.8994140625, -48.486328125, -47.0732421875, -45.66015625, -44.2470703125, -42.833984375, -41.4208984375, -40.0078125, -38.5947265625, -37.181640625, -35.7685546875, -34.35546875, -32.9423828125, -31.529296875, -30.1162109375, -28.703125, -27.2900390625, -25.876953125, -24.4638671875, -23.05078125, -21.6376953125, -20.224609375, -18.8115234375, -17.3984375, -15.9853515625, -14.572265625, -13.1591796875, -11.74609375, -10.3330078125, -8.919921875, -7.5068359375, -6.09375, -4.6806640625, -3.267578125, -1.8544921875, -0.44140625, 0.9716796875, 2.384765625, 3.7978515625, 5.2109375, 6.6240234375, 8.037109375, 9.4501953125, 10.86328125, 12.2763671875, 13.689453125, 15.1025390625, 16.515625, 17.9287109375, 19.341796875, 20.7548828125, 22.16796875, 23.5810546875, 24.994140625, 26.4072265625, 27.8203125, 29.2333984375, 30.646484375, 32.0595703125, 33.47265625, 34.8857421875, 36.298828125, 37.7119140625, 39.125]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 50.0, 408.0, 494.0, 54.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.610820770263672, -29.36249542236328, -27.114171981811523, -24.865846633911133, -22.617523193359375, -20.369197845458984, -18.120872497558594, -15.87254810333252, -13.624223709106445, -11.375899314880371, -9.127574920654297, -6.879249572753906, -4.630925178527832, -2.382600784301758, -0.1342754364013672, 2.114048957824707, 4.362373352050781, 6.6106977462768555, 8.85902214050293, 11.10734748840332, 13.355671882629395, 15.603996276855469, 17.85232162475586, 20.10064697265625, 22.348970413208008, 24.5972957611084, 26.845619201660156, 29.093944549560547, 31.342269897460938, 33.59059143066406, 35.83892059326172, 38.087242126464844, 40.33556365966797, 42.58388900756836, 44.83221435546875, 47.080535888671875, 49.328861236572266, 51.577186584472656, 53.82551193237305, 56.07383728027344, 58.32215881347656, 60.57048416137695, 62.818809509277344, 65.06713104248047, 67.31546020507812, 69.56378173828125, 71.81210327148438, 74.06043243408203, 76.30876159667969, 78.55708312988281, 80.80541229248047, 83.0537338256836, 85.30206298828125, 87.55038452148438, 89.7987060546875, 92.04703521728516, 94.29535675048828, 96.5436782836914, 98.79200744628906, 101.04032897949219, 103.28865814208984, 105.53697967529297, 107.78530883789062, 110.03363037109375, 112.28195190429688]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 8.0, 8.0, 14.0, 16.0, 17.0, 23.0, 20.0, 34.0, 23.0, 26.0, 42.0, 43.0, 40.0, 54.0, 44.0, 49.0, 53.0, 47.0, 56.0, 45.0, 48.0, 30.0, 36.0, 36.0, 32.0, 32.0, 21.0, 22.0, 18.0, 18.0, 9.0, 7.0, 13.0, 3.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.665122985839844, -40.412986755371094, -39.160850524902344, -37.908714294433594, -36.65657424926758, -35.40443801879883, -34.15230178833008, -32.90016555786133, -31.648029327392578, -30.395893096923828, -29.143754959106445, -27.891618728637695, -26.639482498168945, -25.387344360351562, -24.135208129882812, -22.883071899414062, -21.63093376159668, -20.37879753112793, -19.126659393310547, -17.874523162841797, -16.622386932373047, -15.37024974822998, -14.118112564086914, -12.865976333618164, -11.613839149475098, -10.361701965332031, -9.109565734863281, -7.857428550720215, -6.605291843414307, -5.353155136108398, -4.101017951965332, -2.848881721496582, -1.5967445373535156, -0.34460771083831787, 0.9075291156768799, 2.159666061401367, 3.4118027687072754, 4.663939476013184, 5.91607666015625, 7.168212890625, 8.420350074768066, 9.672487258911133, 10.924623489379883, 12.17676067352295, 13.428897857666016, 14.681034088134766, 15.933171272277832, 17.185306549072266, 18.43744468688965, 19.6895809173584, 20.94171905517578, 22.19385528564453, 23.44599151611328, 24.69812774658203, 25.950265884399414, 27.202402114868164, 28.454540252685547, 29.706676483154297, 30.95881462097168, 32.21095275878906, 33.46308898925781, 34.71522521972656, 35.96736145019531, 37.21949768066406, 38.47163391113281]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 6.0, 5.0, 12.0, 16.0, 20.0, 16.0, 16.0, 24.0, 28.0, 29.0, 37.0, 49.0, 36.0, 38.0, 41.0, 34.0, 59.0, 61.0, 42.0, 53.0, 51.0, 43.0, 36.0, 31.0, 24.0, 25.0, 29.0, 28.0, 23.0, 19.0, 18.0, 11.0, 12.0, 8.0, 6.0, 1.0, 7.0, 4.0, 3.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.8046875, -6.5584716796875, -6.312255859375, -6.0660400390625, -5.81982421875, -5.5736083984375, -5.327392578125, -5.0811767578125, -4.8349609375, -4.5887451171875, -4.342529296875, -4.0963134765625, -3.85009765625, -3.6038818359375, -3.357666015625, -3.1114501953125, -2.865234375, -2.6190185546875, -2.372802734375, -2.1265869140625, -1.88037109375, -1.6341552734375, -1.387939453125, -1.1417236328125, -0.8955078125, -0.6492919921875, -0.403076171875, -0.1568603515625, 0.08935546875, 0.3355712890625, 0.581787109375, 0.8280029296875, 1.07421875, 1.3204345703125, 1.566650390625, 1.8128662109375, 2.05908203125, 2.3052978515625, 2.551513671875, 2.7977294921875, 3.0439453125, 3.2901611328125, 3.536376953125, 3.7825927734375, 4.02880859375, 4.2750244140625, 4.521240234375, 4.7674560546875, 5.013671875, 5.2598876953125, 5.506103515625, 5.7523193359375, 5.99853515625, 6.2447509765625, 6.490966796875, 6.7371826171875, 6.9833984375, 7.2296142578125, 7.475830078125, 7.7220458984375, 7.96826171875, 8.2144775390625, 8.460693359375, 8.7069091796875, 8.953125]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 7.0, 6.0, 11.0, 15.0, 16.0, 36.0, 32.0, 59.0, 58.0, 75.0, 101.0, 117.0, 148.0, 251.0, 357.0, 608.0, 1093.0, 3601.0, 392390.0, 3778504.0, 12692.0, 1786.0, 758.0, 435.0, 285.0, 225.0, 154.0, 101.0, 71.0, 60.0, 45.0, 35.0, 34.0, 24.0, 20.0, 23.0, 14.0, 9.0, 10.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.3125, -53.59716796875, -51.8818359375, -50.16650390625, -48.451171875, -46.73583984375, -45.0205078125, -43.30517578125, -41.58984375, -39.87451171875, -38.1591796875, -36.44384765625, -34.728515625, -33.01318359375, -31.2978515625, -29.58251953125, -27.8671875, -26.15185546875, -24.4365234375, -22.72119140625, -21.005859375, -19.29052734375, -17.5751953125, -15.85986328125, -14.14453125, -12.42919921875, -10.7138671875, -8.99853515625, -7.283203125, -5.56787109375, -3.8525390625, -2.13720703125, -0.421875, 1.29345703125, 3.0087890625, 4.72412109375, 6.439453125, 8.15478515625, 9.8701171875, 11.58544921875, 13.30078125, 15.01611328125, 16.7314453125, 18.44677734375, 20.162109375, 21.87744140625, 23.5927734375, 25.30810546875, 27.0234375, 28.73876953125, 30.4541015625, 32.16943359375, 33.884765625, 35.60009765625, 37.3154296875, 39.03076171875, 40.74609375, 42.46142578125, 44.1767578125, 45.89208984375, 47.607421875, 49.32275390625, 51.0380859375, 52.75341796875, 54.46875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 5.0, 6.0, 8.0, 22.0, 21.0, 35.0, 58.0, 116.0, 167.0, 301.0, 467.0, 660.0, 691.0, 538.0, 379.0, 232.0, 131.0, 80.0, 44.0, 33.0, 18.0, 19.0, 11.0, 6.0, 4.0, 2.0, 5.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4921875, -9.0648193359375, -8.637451171875, -8.2100830078125, -7.78271484375, -7.3553466796875, -6.927978515625, -6.5006103515625, -6.0732421875, -5.6458740234375, -5.218505859375, -4.7911376953125, -4.36376953125, -3.9364013671875, -3.509033203125, -3.0816650390625, -2.654296875, -2.2269287109375, -1.799560546875, -1.3721923828125, -0.94482421875, -0.5174560546875, -0.090087890625, 0.3372802734375, 0.7646484375, 1.1920166015625, 1.619384765625, 2.0467529296875, 2.47412109375, 2.9014892578125, 3.328857421875, 3.7562255859375, 4.18359375, 4.6109619140625, 5.038330078125, 5.4656982421875, 5.89306640625, 6.3204345703125, 6.747802734375, 7.1751708984375, 7.6025390625, 8.0299072265625, 8.457275390625, 8.8846435546875, 9.31201171875, 9.7393798828125, 10.166748046875, 10.5941162109375, 11.021484375, 11.4488525390625, 11.876220703125, 12.3035888671875, 12.73095703125, 13.1583251953125, 13.585693359375, 14.0130615234375, 14.4404296875, 14.8677978515625, 15.295166015625, 15.7225341796875, 16.14990234375, 16.5772705078125, 17.004638671875, 17.4320068359375, 17.859375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 5.0, 2.0, 4.0, 5.0, 5.0, 9.0, 7.0, 20.0, 23.0, 32.0, 66.0, 105.0, 242.0, 556.0, 1907.0, 7813.0, 55627.0, 2012839.0, 2047259.0, 57127.0, 7660.0, 1870.0, 581.0, 225.0, 119.0, 63.0, 36.0, 26.0, 21.0, 9.0, 7.0, 1.0, 7.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.265625, -17.712158203125, -17.15869140625, -16.605224609375, -16.0517578125, -15.498291015625, -14.94482421875, -14.391357421875, -13.837890625, -13.284423828125, -12.73095703125, -12.177490234375, -11.6240234375, -11.070556640625, -10.51708984375, -9.963623046875, -9.41015625, -8.856689453125, -8.30322265625, -7.749755859375, -7.1962890625, -6.642822265625, -6.08935546875, -5.535888671875, -4.982421875, -4.428955078125, -3.87548828125, -3.322021484375, -2.7685546875, -2.215087890625, -1.66162109375, -1.108154296875, -0.5546875, -0.001220703125, 0.55224609375, 1.105712890625, 1.6591796875, 2.212646484375, 2.76611328125, 3.319580078125, 3.873046875, 4.426513671875, 4.97998046875, 5.533447265625, 6.0869140625, 6.640380859375, 7.19384765625, 7.747314453125, 8.30078125, 8.854248046875, 9.40771484375, 9.961181640625, 10.5146484375, 11.068115234375, 11.62158203125, 12.175048828125, 12.728515625, 13.281982421875, 13.83544921875, 14.388916015625, 14.9423828125, 15.495849609375, 16.04931640625, 16.602783203125, 17.15625]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 9.0, 9.0, 11.0, 42.0, 42.0, 49.0, 94.0, 102.0, 124.0, 106.0, 119.0, 101.0, 64.0, 43.0, 21.0, 26.0, 12.0, 9.0, 6.0, 4.0, 3.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.13043212890625, -43.909393310546875, -41.688358306884766, -39.46731948852539, -37.24628448486328, -35.025245666503906, -32.80420684814453, -30.583171844482422, -28.36213493347168, -26.141098022460938, -23.920061111450195, -21.699024200439453, -19.477985382080078, -17.25695037841797, -15.035911560058594, -12.814874649047852, -10.59383773803711, -8.372800827026367, -6.151763439178467, -3.9307260513305664, -1.7096891403198242, 0.511347770690918, 2.7323856353759766, 4.953422546386719, 7.174459457397461, 9.395496368408203, 11.616533279418945, 13.837571144104004, 16.058609008789062, 18.279644012451172, 20.500682830810547, 22.72171974182129, 24.94275665283203, 27.163793563842773, 29.384830474853516, 31.60586929321289, 33.826904296875, 36.047943115234375, 38.26898193359375, 40.49001693725586, 42.71105194091797, 44.932090759277344, 47.15312576293945, 49.37416458129883, 51.59519958496094, 53.81623840332031, 56.03727722167969, 58.2583122253418, 60.47935104370117, 62.70038986206055, 64.92142486572266, 67.14246368408203, 69.3635025024414, 71.58453369140625, 73.80557250976562, 76.026611328125, 78.24765014648438, 80.46868896484375, 82.68972778320312, 84.91075897216797, 87.13179779052734, 89.35283660888672, 91.5738754272461, 93.79490661621094, 96.01594543457031]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 5.0, 8.0, 6.0, 7.0, 9.0, 11.0, 15.0, 23.0, 19.0, 35.0, 30.0, 28.0, 29.0, 28.0, 29.0, 37.0, 38.0, 45.0, 42.0, 37.0, 36.0, 51.0, 49.0, 54.0, 25.0, 32.0, 38.0, 36.0, 19.0, 28.0, 15.0, 24.0, 26.0, 17.0, 8.0, 10.0, 17.0, 7.0, 7.0, 7.0, 6.0, 3.0, 8.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.2600212097168, -36.14570617675781, -35.03139114379883, -33.91707992553711, -32.802764892578125, -31.68844985961914, -30.574134826660156, -29.459819793701172, -28.34550666809082, -27.231191635131836, -26.116878509521484, -25.0025634765625, -23.888248443603516, -22.773935317993164, -21.65962028503418, -20.545307159423828, -19.430992126464844, -18.31667709350586, -17.202363967895508, -16.088048934936523, -14.973734855651855, -13.859420776367188, -12.745105743408203, -11.630791664123535, -10.516477584838867, -9.4021635055542, -8.287849426269531, -7.173534393310547, -6.059220314025879, -4.944906234741211, -3.8305916786193848, -2.7162771224975586, -1.6019668579101562, -0.4876525402069092, 0.6266617774963379, 1.740976095199585, 2.855290412902832, 3.9696044921875, 5.083919048309326, 6.198233604431152, 7.31254768371582, 8.426861763000488, 9.541175842285156, 10.65549087524414, 11.769804954528809, 12.884119033813477, 13.998434066772461, 15.112748146057129, 16.227062225341797, 17.34137725830078, 18.455690383911133, 19.570005416870117, 20.68431854248047, 21.798633575439453, 22.912948608398438, 24.027263641357422, 25.141576766967773, 26.255891799926758, 27.37020492553711, 28.484519958496094, 29.598834991455078, 30.71314811706543, 31.827463150024414, 32.941776275634766, 34.05609130859375]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 7.0, 3.0, 5.0, 7.0, 16.0, 8.0, 10.0, 15.0, 19.0, 13.0, 28.0, 25.0, 23.0, 30.0, 28.0, 21.0, 30.0, 28.0, 32.0, 49.0, 31.0, 41.0, 54.0, 33.0, 35.0, 42.0, 42.0, 43.0, 36.0, 17.0, 20.0, 27.0, 16.0, 22.0, 22.0, 16.0, 19.0, 12.0, 14.0, 9.0, 9.0, 4.0, 12.0, 9.0, 7.0, 8.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0], "bins": [-51.21875, -49.6982421875, -48.177734375, -46.6572265625, -45.13671875, -43.6162109375, -42.095703125, -40.5751953125, -39.0546875, -37.5341796875, -36.013671875, -34.4931640625, -32.97265625, -31.4521484375, -29.931640625, -28.4111328125, -26.890625, -25.3701171875, -23.849609375, -22.3291015625, -20.80859375, -19.2880859375, -17.767578125, -16.2470703125, -14.7265625, -13.2060546875, -11.685546875, -10.1650390625, -8.64453125, -7.1240234375, -5.603515625, -4.0830078125, -2.5625, -1.0419921875, 0.478515625, 1.9990234375, 3.51953125, 5.0400390625, 6.560546875, 8.0810546875, 9.6015625, 11.1220703125, 12.642578125, 14.1630859375, 15.68359375, 17.2041015625, 18.724609375, 20.2451171875, 21.765625, 23.2861328125, 24.806640625, 26.3271484375, 27.84765625, 29.3681640625, 30.888671875, 32.4091796875, 33.9296875, 35.4501953125, 36.970703125, 38.4912109375, 40.01171875, 41.5322265625, 43.052734375, 44.5732421875, 46.09375]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 6.0, 6.0, 9.0, 17.0, 19.0, 30.0, 45.0, 55.0, 68.0, 130.0, 155.0, 242.0, 370.0, 539.0, 779.0, 1154.0, 1831.0, 2662.0, 3944.0, 6076.0, 9229.0, 14296.0, 22274.0, 35213.0, 58977.0, 109843.0, 271639.0, 251689.0, 104950.0, 56906.0, 33803.0, 21172.0, 13535.0, 8866.0, 5912.0, 3970.0, 2674.0, 1790.0, 1215.0, 814.0, 534.0, 388.0, 263.0, 155.0, 108.0, 70.0, 43.0, 34.0, 24.0, 16.0, 9.0, 5.0, 3.0, 3.0, 0.0, 6.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-8.96875, -8.66943359375, -8.3701171875, -8.07080078125, -7.771484375, -7.47216796875, -7.1728515625, -6.87353515625, -6.57421875, -6.27490234375, -5.9755859375, -5.67626953125, -5.376953125, -5.07763671875, -4.7783203125, -4.47900390625, -4.1796875, -3.88037109375, -3.5810546875, -3.28173828125, -2.982421875, -2.68310546875, -2.3837890625, -2.08447265625, -1.78515625, -1.48583984375, -1.1865234375, -0.88720703125, -0.587890625, -0.28857421875, 0.0107421875, 0.31005859375, 0.609375, 0.90869140625, 1.2080078125, 1.50732421875, 1.806640625, 2.10595703125, 2.4052734375, 2.70458984375, 3.00390625, 3.30322265625, 3.6025390625, 3.90185546875, 4.201171875, 4.50048828125, 4.7998046875, 5.09912109375, 5.3984375, 5.69775390625, 5.9970703125, 6.29638671875, 6.595703125, 6.89501953125, 7.1943359375, 7.49365234375, 7.79296875, 8.09228515625, 8.3916015625, 8.69091796875, 8.990234375, 9.28955078125, 9.5888671875, 9.88818359375, 10.1875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 6.0, 5.0, 6.0, 7.0, 13.0, 7.0, 11.0, 18.0, 21.0, 22.0, 27.0, 22.0, 32.0, 27.0, 33.0, 30.0, 40.0, 41.0, 44.0, 40.0, 39.0, 1067.0, 48.0, 42.0, 49.0, 43.0, 30.0, 38.0, 25.0, 27.0, 24.0, 29.0, 25.0, 21.0, 12.0, 13.0, 14.0, 9.0, 6.0, 1.0, 2.0, 9.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.5, -31.3828125, -30.265625, -29.1484375, -28.03125, -26.9140625, -25.796875, -24.6796875, -23.5625, -22.4453125, -21.328125, -20.2109375, -19.09375, -17.9765625, -16.859375, -15.7421875, -14.625, -13.5078125, -12.390625, -11.2734375, -10.15625, -9.0390625, -7.921875, -6.8046875, -5.6875, -4.5703125, -3.453125, -2.3359375, -1.21875, -0.1015625, 1.015625, 2.1328125, 3.25, 4.3671875, 5.484375, 6.6015625, 7.71875, 8.8359375, 9.953125, 11.0703125, 12.1875, 13.3046875, 14.421875, 15.5390625, 16.65625, 17.7734375, 18.890625, 20.0078125, 21.125, 22.2421875, 23.359375, 24.4765625, 25.59375, 26.7109375, 27.828125, 28.9453125, 30.0625, 31.1796875, 32.296875, 33.4140625, 34.53125, 35.6484375, 36.765625, 37.8828125, 39.0]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 2.0, 9.0, 16.0, 33.0, 33.0, 55.0, 90.0, 128.0, 178.0, 242.0, 370.0, 583.0, 834.0, 1242.0, 2029.0, 2892.0, 4796.0, 7184.0, 11535.0, 18688.0, 30218.0, 50916.0, 90169.0, 187289.0, 1370702.0, 134962.0, 71996.0, 41803.0, 25061.0, 15605.0, 9856.0, 6154.0, 4017.0, 2556.0, 1680.0, 1072.0, 737.0, 475.0, 301.0, 212.0, 128.0, 81.0, 65.0, 41.0, 31.0, 21.0, 17.0, 7.0, 8.0, 6.0, 6.0, 4.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-10.4453125, -10.1116943359375, -9.778076171875, -9.4444580078125, -9.11083984375, -8.7772216796875, -8.443603515625, -8.1099853515625, -7.7763671875, -7.4427490234375, -7.109130859375, -6.7755126953125, -6.44189453125, -6.1082763671875, -5.774658203125, -5.4410400390625, -5.107421875, -4.7738037109375, -4.440185546875, -4.1065673828125, -3.77294921875, -3.4393310546875, -3.105712890625, -2.7720947265625, -2.4384765625, -2.1048583984375, -1.771240234375, -1.4376220703125, -1.10400390625, -0.7703857421875, -0.436767578125, -0.1031494140625, 0.23046875, 0.5640869140625, 0.897705078125, 1.2313232421875, 1.56494140625, 1.8985595703125, 2.232177734375, 2.5657958984375, 2.8994140625, 3.2330322265625, 3.566650390625, 3.9002685546875, 4.23388671875, 4.5675048828125, 4.901123046875, 5.2347412109375, 5.568359375, 5.9019775390625, 6.235595703125, 6.5692138671875, 6.90283203125, 7.2364501953125, 7.570068359375, 7.9036865234375, 8.2373046875, 8.5709228515625, 8.904541015625, 9.2381591796875, 9.57177734375, 9.9053955078125, 10.239013671875, 10.5726318359375, 10.90625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 11.0, 9.0, 9.0, 16.0, 25.0, 23.0, 42.0, 43.0, 63.0, 79.0, 105.0, 111.0, 108.0, 92.0, 70.0, 42.0, 34.0, 22.0, 22.0, 16.0, 11.0, 11.0, 11.0, 7.0, 2.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0081787109375, -0.007948577404022217, -0.007718443870544434, -0.00748831033706665, -0.007258176803588867, -0.007028043270111084, -0.006797909736633301, -0.006567776203155518, -0.006337642669677734, -0.006107509136199951, -0.005877375602722168, -0.005647242069244385, -0.0054171085357666016, -0.005186975002288818, -0.004956841468811035, -0.004726707935333252, -0.004496574401855469, -0.0042664408683776855, -0.004036307334899902, -0.003806173801422119, -0.003576040267944336, -0.0033459067344665527, -0.0031157732009887695, -0.0028856396675109863, -0.002655506134033203, -0.00242537260055542, -0.0021952390670776367, -0.0019651055335998535, -0.0017349720001220703, -0.0015048384666442871, -0.001274704933166504, -0.0010445713996887207, -0.0008144378662109375, -0.0005843043327331543, -0.0003541707992553711, -0.0001240372657775879, 0.00010609626770019531, 0.0003362298011779785, 0.0005663633346557617, 0.0007964968681335449, 0.0010266304016113281, 0.0012567639350891113, 0.0014868974685668945, 0.0017170310020446777, 0.001947164535522461, 0.002177298069000244, 0.0024074316024780273, 0.0026375651359558105, 0.0028676986694335938, 0.003097832202911377, 0.00332796573638916, 0.0035580992698669434, 0.0037882328033447266, 0.00401836633682251, 0.004248499870300293, 0.004478633403778076, 0.004708766937255859, 0.004938900470733643, 0.005169034004211426, 0.005399167537689209, 0.005629301071166992, 0.005859434604644775, 0.006089568138122559, 0.006319701671600342, 0.006549835205078125]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 5.0, 4.0, 8.0, 21.0, 21.0, 38.0, 46.0, 84.0, 141.0, 201.0, 394.0, 912.0, 3551.0, 29076.0, 571301.0, 416481.0, 21635.0, 2891.0, 811.0, 365.0, 224.0, 115.0, 87.0, 38.0, 35.0, 19.0, 16.0, 4.0, 6.0, 5.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06695556640625, -0.06464195251464844, -0.062328338623046875, -0.06001472473144531, -0.05770111083984375, -0.05538749694824219, -0.053073883056640625, -0.05076026916503906, -0.0484466552734375, -0.04613304138183594, -0.043819427490234375, -0.04150581359863281, -0.03919219970703125, -0.03687858581542969, -0.034564971923828125, -0.03225135803222656, -0.029937744140625, -0.027624130249023438, -0.025310516357421875, -0.022996902465820312, -0.02068328857421875, -0.018369674682617188, -0.016056060791015625, -0.013742446899414062, -0.0114288330078125, -0.009115219116210938, -0.006801605224609375, -0.0044879913330078125, -0.00217437744140625, 0.0001392364501953125, 0.002452850341796875, 0.0047664642333984375, 0.007080078125, 0.009393692016601562, 0.011707305908203125, 0.014020919799804688, 0.01633453369140625, 0.018648147583007812, 0.020961761474609375, 0.023275375366210938, 0.0255889892578125, 0.027902603149414062, 0.030216217041015625, 0.03252983093261719, 0.03484344482421875, 0.03715705871582031, 0.039470672607421875, 0.04178428649902344, 0.044097900390625, 0.04641151428222656, 0.048725128173828125, 0.05103874206542969, 0.05335235595703125, 0.05566596984863281, 0.057979583740234375, 0.06029319763183594, 0.0626068115234375, 0.06492042541503906, 0.06723403930664062, 0.06954765319824219, 0.07186126708984375, 0.07417488098144531, 0.07648849487304688, 0.07880210876464844, 0.08111572265625]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 12.0, 22.0, 55.0, 86.0, 157.0, 219.0, 214.0, 117.0, 68.0, 30.0, 18.0, 6.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016507407650351524, -0.016146620735526085, -0.015785833820700645, -0.015425046905875206, -0.015064259991049767, -0.014703472144901752, -0.014342685230076313, -0.013981898315250874, -0.013621111400425434, -0.013260324485599995, -0.012899537570774555, -0.012538750655949116, -0.012177962809801102, -0.011817175894975662, -0.011456388980150223, -0.011095602065324783, -0.010734815150499344, -0.010374028235673904, -0.010013241320848465, -0.009652454406023026, -0.009291667491197586, -0.008930879645049572, -0.008570092730224133, -0.008209305815398693, -0.007848518900573254, -0.007487731985747814, -0.007126945070922375, -0.006766157690435648, -0.0064053707756102085, -0.006044583860784769, -0.005683796480298042, -0.005323009565472603, -0.004962221719324589, -0.004601434804499149, -0.00424064788967371, -0.003879860509186983, -0.0035190735943615437, -0.003158286679536104, -0.002797499531880021, -0.002436712384223938, -0.0020759254693984985, -0.0017151384381577373, -0.001354351406916976, -0.0009935643756762147, -0.0006327773444354534, -0.00027199031319469213, 8.879671804606915e-05, 0.00044958386570215225, 0.0008103707805275917, 0.001171157811768353, 0.0015319448430091143, 0.0018927318742498755, 0.002253518905490637, 0.0026143058203160763, 0.0029750929679721594, 0.0033358801156282425, 0.003696667030453682, 0.004057453945279121, 0.004418240860104561, 0.004779028240591288, 0.005139815155416727, 0.0055006020702421665, 0.005861389450728893, 0.006222176365554333, 0.006582963280379772]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 10.0, 12.0, 7.0, 9.0, 12.0, 12.0, 16.0, 12.0, 18.0, 21.0, 22.0, 25.0, 20.0, 28.0, 27.0, 32.0, 32.0, 33.0, 50.0, 41.0, 28.0, 35.0, 35.0, 31.0, 43.0, 34.0, 42.0, 33.0, 26.0, 34.0, 31.0, 23.0, 20.0, 25.0, 15.0, 16.0, 13.0, 13.0, 14.0, 15.0, 6.0, 7.0, 6.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0025461912155151367, -0.0024674367159605026, -0.0023886822164058685, -0.0023099277168512344, -0.0022311732172966003, -0.0021524187177419662, -0.002073664218187332, -0.001994909718632698, -0.001916155219078064, -0.0018374007195234299, -0.0017586462199687958, -0.0016798917204141617, -0.0016011372208595276, -0.0015223827213048935, -0.0014436282217502594, -0.0013648737221956253, -0.0012861192226409912, -0.0012073647230863571, -0.001128610223531723, -0.001049855723977089, -0.0009711012244224548, -0.0008923467248678207, -0.0008135922253131866, -0.0007348377257585526, -0.0006560832262039185, -0.0005773287266492844, -0.0004985742270946503, -0.0004198197275400162, -0.0003410652279853821, -0.000262310728430748, -0.0001835562288761139, -0.0001048017293214798, -2.6047229766845703e-05, 5.270726978778839e-05, 0.00013146176934242249, 0.00021021626889705658, 0.0002889707684516907, 0.00036772526800632477, 0.00044647976756095886, 0.000525234267115593, 0.000603988766670227, 0.0006827432662248611, 0.0007614977657794952, 0.0008402522653341293, 0.0009190067648887634, 0.0009977612644433975, 0.0010765157639980316, 0.0011552702635526657, 0.0012340247631072998, 0.001312779262661934, 0.001391533762216568, 0.001470288261771202, 0.0015490427613258362, 0.0016277972608804703, 0.0017065517604351044, 0.0017853062599897385, 0.0018640607595443726, 0.0019428152590990067, 0.0020215697586536407, 0.002100324258208275, 0.002179078757762909, 0.002257833257317543, 0.002336587756872177, 0.0024153422564268112, 0.0024940967559814453]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 7.0, 3.0, 5.0, 7.0, 16.0, 8.0, 10.0, 15.0, 19.0, 13.0, 28.0, 25.0, 23.0, 30.0, 28.0, 21.0, 30.0, 28.0, 32.0, 49.0, 31.0, 41.0, 54.0, 33.0, 35.0, 42.0, 42.0, 43.0, 37.0, 16.0, 20.0, 27.0, 16.0, 22.0, 22.0, 16.0, 19.0, 12.0, 14.0, 9.0, 8.0, 5.0, 12.0, 9.0, 7.0, 8.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0], "bins": [-51.21875, -49.6982421875, -48.177734375, -46.6572265625, -45.13671875, -43.6162109375, -42.095703125, -40.5751953125, -39.0546875, -37.5341796875, -36.013671875, -34.4931640625, -32.97265625, -31.4521484375, -29.931640625, -28.4111328125, -26.890625, -25.3701171875, -23.849609375, -22.3291015625, -20.80859375, -19.2880859375, -17.767578125, -16.2470703125, -14.7265625, -13.2060546875, -11.685546875, -10.1650390625, -8.64453125, -7.1240234375, -5.603515625, -4.0830078125, -2.5625, -1.0419921875, 0.478515625, 1.9990234375, 3.51953125, 5.0400390625, 6.560546875, 8.0810546875, 9.6015625, 11.1220703125, 12.642578125, 14.1630859375, 15.68359375, 17.2041015625, 18.724609375, 20.2451171875, 21.765625, 23.2861328125, 24.806640625, 26.3271484375, 27.84765625, 29.3681640625, 30.888671875, 32.4091796875, 33.9296875, 35.4501953125, 36.970703125, 38.4912109375, 40.01171875, 41.5322265625, 43.052734375, 44.5732421875, 46.09375]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 6.0, 6.0, 5.0, 9.0, 10.0, 11.0, 20.0, 21.0, 28.0, 38.0, 58.0, 87.0, 121.0, 192.0, 277.0, 494.0, 793.0, 1408.0, 2505.0, 5064.0, 12021.0, 39819.0, 194555.0, 588296.0, 149866.0, 32461.0, 10298.0, 4611.0, 2221.0, 1240.0, 694.0, 453.0, 278.0, 172.0, 105.0, 74.0, 51.0, 36.0, 39.0, 31.0, 26.0, 20.0, 7.0, 12.0, 7.0, 4.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.59375, -14.1436767578125, -13.693603515625, -13.2435302734375, -12.79345703125, -12.3433837890625, -11.893310546875, -11.4432373046875, -10.9931640625, -10.5430908203125, -10.093017578125, -9.6429443359375, -9.19287109375, -8.7427978515625, -8.292724609375, -7.8426513671875, -7.392578125, -6.9425048828125, -6.492431640625, -6.0423583984375, -5.59228515625, -5.1422119140625, -4.692138671875, -4.2420654296875, -3.7919921875, -3.3419189453125, -2.891845703125, -2.4417724609375, -1.99169921875, -1.5416259765625, -1.091552734375, -0.6414794921875, -0.19140625, 0.2586669921875, 0.708740234375, 1.1588134765625, 1.60888671875, 2.0589599609375, 2.509033203125, 2.9591064453125, 3.4091796875, 3.8592529296875, 4.309326171875, 4.7593994140625, 5.20947265625, 5.6595458984375, 6.109619140625, 6.5596923828125, 7.009765625, 7.4598388671875, 7.909912109375, 8.3599853515625, 8.81005859375, 9.2601318359375, 9.710205078125, 10.1602783203125, 10.6103515625, 11.0604248046875, 11.510498046875, 11.9605712890625, 12.41064453125, 12.8607177734375, 13.310791015625, 13.7608642578125, 14.2109375]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 10.0, 14.0, 17.0, 26.0, 29.0, 27.0, 50.0, 44.0, 40.0, 57.0, 80.0, 144.0, 2056.0, 67.0, 68.0, 59.0, 65.0, 54.0, 35.0, 21.0, 28.0, 19.0, 8.0, 6.0, 8.0, 6.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-137.75, -134.0390625, -130.328125, -126.6171875, -122.90625, -119.1953125, -115.484375, -111.7734375, -108.0625, -104.3515625, -100.640625, -96.9296875, -93.21875, -89.5078125, -85.796875, -82.0859375, -78.375, -74.6640625, -70.953125, -67.2421875, -63.53125, -59.8203125, -56.109375, -52.3984375, -48.6875, -44.9765625, -41.265625, -37.5546875, -33.84375, -30.1328125, -26.421875, -22.7109375, -19.0, -15.2890625, -11.578125, -7.8671875, -4.15625, -0.4453125, 3.265625, 6.9765625, 10.6875, 14.3984375, 18.109375, 21.8203125, 25.53125, 29.2421875, 32.953125, 36.6640625, 40.375, 44.0859375, 47.796875, 51.5078125, 55.21875, 58.9296875, 62.640625, 66.3515625, 70.0625, 73.7734375, 77.484375, 81.1953125, 84.90625, 88.6171875, 92.328125, 96.0390625, 99.75]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 4.0, 4.0, 4.0, 6.0, 5.0, 13.0, 25.0, 39.0, 59.0, 86.0, 151.0, 198.0, 404.0, 927.0, 2502.0, 14027.0, 2670694.0, 441668.0, 10847.0, 2227.0, 855.0, 368.0, 212.0, 128.0, 84.0, 61.0, 40.0, 21.0, 13.0, 8.0, 9.0, 1.0, 4.0, 4.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-35.3125, -34.2724609375, -33.232421875, -32.1923828125, -31.15234375, -30.1123046875, -29.072265625, -28.0322265625, -26.9921875, -25.9521484375, -24.912109375, -23.8720703125, -22.83203125, -21.7919921875, -20.751953125, -19.7119140625, -18.671875, -17.6318359375, -16.591796875, -15.5517578125, -14.51171875, -13.4716796875, -12.431640625, -11.3916015625, -10.3515625, -9.3115234375, -8.271484375, -7.2314453125, -6.19140625, -5.1513671875, -4.111328125, -3.0712890625, -2.03125, -0.9912109375, 0.048828125, 1.0888671875, 2.12890625, 3.1689453125, 4.208984375, 5.2490234375, 6.2890625, 7.3291015625, 8.369140625, 9.4091796875, 10.44921875, 11.4892578125, 12.529296875, 13.5693359375, 14.609375, 15.6494140625, 16.689453125, 17.7294921875, 18.76953125, 19.8095703125, 20.849609375, 21.8896484375, 22.9296875, 23.9697265625, 25.009765625, 26.0498046875, 27.08984375, 28.1298828125, 29.169921875, 30.2099609375, 31.25]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 0.0, 4.0, 2.0, 7.0, 11.0, 29.0, 33.0, 88.0, 137.0, 174.0, 173.0, 151.0, 76.0, 45.0, 31.0, 15.0, 7.0, 6.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-125.33549499511719, -120.71463012695312, -116.0937728881836, -111.47290802001953, -106.85205078125, -102.23118591308594, -97.61032104492188, -92.98946380615234, -88.36860656738281, -83.74774169921875, -79.12688446044922, -74.50601959228516, -69.88516235351562, -65.26429748535156, -60.643436431884766, -56.02257537841797, -51.401710510253906, -46.78084945678711, -42.15998840332031, -37.53912353515625, -32.91826629638672, -28.29740333557129, -23.67654037475586, -19.055679321289062, -14.434818267822266, -9.813957214355469, -5.1930952072143555, -0.5722332000732422, 4.048627853393555, 8.669488906860352, 13.290351867675781, 17.911212921142578, 22.532073974609375, 27.152935028076172, 31.77379608154297, 36.39466094970703, 41.01551818847656, 45.636383056640625, 50.25724411010742, 54.87810516357422, 59.498966217041016, 64.11982727050781, 68.74069213867188, 73.3615493774414, 77.98241424560547, 82.603271484375, 87.22413635253906, 91.84500122070312, 96.46585845947266, 101.08672332763672, 105.70758056640625, 110.32844543457031, 114.94930267333984, 119.5701675415039, 124.19102478027344, 128.8118896484375, 133.43275451660156, 138.05361938476562, 142.6744842529297, 147.2953338623047, 151.91619873046875, 156.5370635986328, 161.15792846679688, 165.77877807617188, 170.39964294433594]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 6.0, 6.0, 7.0, 6.0, 6.0, 19.0, 21.0, 19.0, 16.0, 33.0, 22.0, 26.0, 35.0, 40.0, 42.0, 59.0, 69.0, 44.0, 41.0, 57.0, 51.0, 37.0, 37.0, 48.0, 38.0, 45.0, 29.0, 19.0, 22.0, 25.0, 15.0, 14.0, 5.0, 8.0, 11.0, 6.0, 12.0, 2.0, 1.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.93501281738281, -87.40480041503906, -83.87458038330078, -80.34436798095703, -76.81415557861328, -73.283935546875, -69.75372314453125, -66.2235107421875, -62.69329833984375, -59.163082122802734, -55.632869720458984, -52.10265350341797, -48.57244110107422, -45.0422248840332, -41.51200866699219, -37.98179626464844, -34.45158004760742, -30.92136573791504, -27.391151428222656, -23.86093521118164, -20.33072280883789, -16.800506591796875, -13.270292282104492, -9.74007797241211, -6.209863662719727, -2.6796491146087646, 0.8505654335021973, 4.380780220031738, 7.910994529724121, 11.44120979309082, 14.971424102783203, 18.501638412475586, 22.03185272216797, 25.56206703186035, 29.092281341552734, 32.62249755859375, 36.1527099609375, 39.682926177978516, 43.21314239501953, 46.74335479736328, 50.27356719970703, 53.80378341674805, 57.3339958190918, 60.86421203613281, 64.39442443847656, 67.92463684082031, 71.4548568725586, 74.98506927490234, 78.51528930664062, 82.04550170898438, 85.57572174072266, 89.1059341430664, 92.63614654541016, 96.16636657714844, 99.69657897949219, 103.22679138183594, 106.75700378417969, 110.28721618652344, 113.81743621826172, 117.34764862060547, 120.87786102294922, 124.4080810546875, 127.93829345703125, 131.468505859375, 134.99871826171875]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 5.0, 6.0, 1.0, 9.0, 17.0, 20.0, 43.0, 74.0, 115.0, 152.0, 209.0, 305.0, 414.0, 580.0, 852.0, 1868.0, 1040751.0, 1029.0, 575.0, 447.0, 331.0, 242.0, 152.0, 124.0, 77.0, 50.0, 37.0, 28.0, 14.0, 18.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-60.856773376464844, -59.302391052246094, -57.748008728027344, -56.19363021850586, -54.63924789428711, -53.08486557006836, -51.530487060546875, -49.976104736328125, -48.421722412109375, -46.867340087890625, -45.312957763671875, -43.75857925415039, -42.20419692993164, -40.64981460571289, -39.095436096191406, -37.541053771972656, -35.986671447753906, -34.432289123535156, -32.877906799316406, -31.323528289794922, -29.769145965576172, -28.214763641357422, -26.660383224487305, -25.106002807617188, -23.551620483398438, -21.997238159179688, -20.44285774230957, -18.888477325439453, -17.334095001220703, -15.77971363067627, -14.225332260131836, -12.670950889587402, -11.116569519042969, -9.562188148498535, -8.007806777954102, -6.453425407409668, -4.899044036865234, -3.344662666320801, -1.7902812957763672, -0.2358999252319336, 1.3184814453125, 2.8728628158569336, 4.427244186401367, 5.981625556945801, 7.536006927490234, 9.090388298034668, 10.644769668579102, 12.199151039123535, 13.753532409667969, 15.307913780212402, 16.862295150756836, 18.416675567626953, 19.971057891845703, 21.525440216064453, 23.07982063293457, 24.634201049804688, 26.188583374023438, 27.742965698242188, 29.297346115112305, 30.851726531982422, 32.40610885620117, 33.96049118041992, 35.514869689941406, 37.069252014160156, 38.623634338378906]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 4.0, 3.0, 10.0, 10.0, 5.0, 15.0, 13.0, 14.0, 33.0, 94.0, 788.0, 51461884.0, 132.0, 54.0, 26.0, 15.0, 13.0, 6.0, 6.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 7.0, 11.0, 1.0, 7.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4968.0, -4745.13671875, -4522.27392578125, -4299.41064453125, -4076.5478515625, -3853.6845703125, -3630.821533203125, -3407.95849609375, -3185.095458984375, -2962.232421875, -2739.369384765625, -2516.50634765625, -2293.64306640625, -2070.7802734375, -1847.9169921875, -1625.053955078125, -1402.19091796875, -1179.327880859375, -956.4647827148438, -733.6016845703125, -510.7386474609375, -287.8756103515625, -65.012451171875, 157.8505859375, 380.713623046875, 603.57666015625, 826.4397583007812, 1049.3028564453125, 1272.1658935546875, 1495.0289306640625, 1717.89208984375, 1940.755126953125, 2163.6181640625, 2386.481201171875, 2609.34423828125, 2832.20751953125, 3055.0703125, 3277.93359375, 3500.796630859375, 3723.65966796875, 3946.522705078125, 4169.3857421875, 4392.2490234375, 4615.11181640625, 4837.97509765625, 5060.837890625, 5283.701171875, 5506.564453125, 5729.42724609375, 5952.29052734375, 6175.1533203125, 6398.0166015625, 6620.87939453125, 6843.74267578125, 7066.60546875, 7289.46875, 7512.33203125, 7735.1953125, 7958.05810546875, 8180.92138671875, 8403.7841796875, 8626.6474609375, 8849.5107421875, 9072.373046875, 9295.236328125]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [3.0, 3.0, 4.0, 4.0, 5.0, 8.0, 8.0, 12.0, 14.0, 25.0, 18.0, 39.0, 74.0, 98.0, 151.0, 209.0, 314.0, 438.0, 615.0, 925.0, 1367.0, 2144.0, 3208.0, 4785.0, 7548.0, 12009.0, 19528.0, 31893.0, 52397.0, 90096.0, 158237.0, 310697.0, 2760143.0, 2145167.0, 306827.0, 156984.0, 88785.0, 52008.0, 31377.0, 19361.0, 11900.0, 7618.0, 4900.0, 3221.0, 2069.0, 1325.0, 872.0, 596.0, 442.0, 280.0, 223.0, 131.0, 96.0, 87.0, 48.0, 36.0, 26.0, 19.0, 7.0, 8.0, 9.0, 6.0, 4.0, 5.0], "bins": [-6.625, -6.4241943359375, -6.223388671875, -6.0225830078125, -5.82177734375, -5.6209716796875, -5.420166015625, -5.2193603515625, -5.0185546875, -4.8177490234375, -4.616943359375, -4.4161376953125, -4.21533203125, -4.0145263671875, -3.813720703125, -3.6129150390625, -3.412109375, -3.2113037109375, -3.010498046875, -2.8096923828125, -2.60888671875, -2.4080810546875, -2.207275390625, -2.0064697265625, -1.8056640625, -1.6048583984375, -1.404052734375, -1.2032470703125, -1.00244140625, -0.8016357421875, -0.600830078125, -0.4000244140625, -0.19921875, 0.0015869140625, 0.202392578125, 0.4031982421875, 0.60400390625, 0.8048095703125, 1.005615234375, 1.2064208984375, 1.4072265625, 1.6080322265625, 1.808837890625, 2.0096435546875, 2.21044921875, 2.4112548828125, 2.612060546875, 2.8128662109375, 3.013671875, 3.2144775390625, 3.415283203125, 3.6160888671875, 3.81689453125, 4.0177001953125, 4.218505859375, 4.4193115234375, 4.6201171875, 4.8209228515625, 5.021728515625, 5.2225341796875, 5.42333984375, 5.6241455078125, 5.824951171875, 6.0257568359375, 6.2265625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 6.0, 5.0, 9.0, 4.0, 11.0, 12.0, 20.0, 23.0, 24.0, 24.0, 22.0, 38.0, 44.0, 45.0, 40.0, 51.0, 70.0, 178.0, 742.0, 210.0, 76.0, 47.0, 42.0, 39.0, 26.0, 32.0, 35.0, 26.0, 24.0, 23.0, 13.0, 15.0, 17.0, 8.0, 5.0, 4.0, 3.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.1953125, -13.7156982421875, -13.236083984375, -12.7564697265625, -12.27685546875, -11.7972412109375, -11.317626953125, -10.8380126953125, -10.3583984375, -9.8787841796875, -9.399169921875, -8.9195556640625, -8.43994140625, -7.9603271484375, -7.480712890625, -7.0010986328125, -6.521484375, -6.0418701171875, -5.562255859375, -5.0826416015625, -4.60302734375, -4.1234130859375, -3.643798828125, -3.1641845703125, -2.6845703125, -2.2049560546875, -1.725341796875, -1.2457275390625, -0.76611328125, -0.2864990234375, 0.193115234375, 0.6727294921875, 1.15234375, 1.6319580078125, 2.111572265625, 2.5911865234375, 3.07080078125, 3.5504150390625, 4.030029296875, 4.5096435546875, 4.9892578125, 5.4688720703125, 5.948486328125, 6.4281005859375, 6.90771484375, 7.3873291015625, 7.866943359375, 8.3465576171875, 8.826171875, 9.3057861328125, 9.785400390625, 10.2650146484375, 10.74462890625, 11.2242431640625, 11.703857421875, 12.1834716796875, 12.6630859375, 13.1427001953125, 13.622314453125, 14.1019287109375, 14.58154296875, 15.0611572265625, 15.540771484375, 16.0203857421875, 16.5]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 3.0, 12.0, 23.0, 11.0, 16.0, 9.0, 51.0, 57.0, 77.0, 129.0, 193.0, 245.0, 358.0, 535.0, 799.0, 1119.0, 1670.0, 2523.0, 3654.0, 5293.0, 8007.0, 11870.0, 17405.0, 26334.0, 39824.0, 61866.0, 97560.0, 163871.0, 311694.0, 1071535.0, 3534047.0, 408597.0, 198721.0, 115139.0, 71533.0, 45982.0, 29547.0, 19961.0, 13027.0, 9127.0, 5934.0, 4198.0, 2754.0, 1916.0, 1334.0, 904.0, 634.0, 379.0, 313.0, 242.0, 122.0, 93.0, 73.0, 50.0, 24.0, 21.0, 6.0, 4.0, 12.0, 7.0, 6.0, 1.0, 2.0], "bins": [-5.58984375, -5.41046142578125, -5.2310791015625, -5.05169677734375, -4.872314453125, -4.69293212890625, -4.5135498046875, -4.33416748046875, -4.15478515625, -3.97540283203125, -3.7960205078125, -3.61663818359375, -3.437255859375, -3.25787353515625, -3.0784912109375, -2.89910888671875, -2.7197265625, -2.54034423828125, -2.3609619140625, -2.18157958984375, -2.002197265625, -1.82281494140625, -1.6434326171875, -1.46405029296875, -1.28466796875, -1.10528564453125, -0.9259033203125, -0.74652099609375, -0.567138671875, -0.38775634765625, -0.2083740234375, -0.02899169921875, 0.150390625, 0.32977294921875, 0.5091552734375, 0.68853759765625, 0.867919921875, 1.04730224609375, 1.2266845703125, 1.40606689453125, 1.58544921875, 1.76483154296875, 1.9442138671875, 2.12359619140625, 2.302978515625, 2.48236083984375, 2.6617431640625, 2.84112548828125, 3.0205078125, 3.19989013671875, 3.3792724609375, 3.55865478515625, 3.738037109375, 3.91741943359375, 4.0968017578125, 4.27618408203125, 4.45556640625, 4.63494873046875, 4.8143310546875, 4.99371337890625, 5.173095703125, 5.35247802734375, 5.5318603515625, 5.71124267578125, 5.890625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 9.0, 5.0, 5.0, 8.0, 9.0, 19.0, 9.0, 20.0, 16.0, 27.0, 21.0, 28.0, 24.0, 32.0, 25.0, 47.0, 41.0, 46.0, 51.0, 77.0, 231.0, 605.0, 168.0, 87.0, 67.0, 52.0, 40.0, 34.0, 35.0, 14.0, 20.0, 26.0, 21.0, 12.0, 15.0, 16.0, 21.0, 11.0, 3.0, 10.0, 8.0, 4.0, 4.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.3359375, -9.0391845703125, -8.742431640625, -8.4456787109375, -8.14892578125, -7.8521728515625, -7.555419921875, -7.2586669921875, -6.9619140625, -6.6651611328125, -6.368408203125, -6.0716552734375, -5.77490234375, -5.4781494140625, -5.181396484375, -4.8846435546875, -4.587890625, -4.2911376953125, -3.994384765625, -3.6976318359375, -3.40087890625, -3.1041259765625, -2.807373046875, -2.5106201171875, -2.2138671875, -1.9171142578125, -1.620361328125, -1.3236083984375, -1.02685546875, -0.7301025390625, -0.433349609375, -0.1365966796875, 0.16015625, 0.4569091796875, 0.753662109375, 1.0504150390625, 1.34716796875, 1.6439208984375, 1.940673828125, 2.2374267578125, 2.5341796875, 2.8309326171875, 3.127685546875, 3.4244384765625, 3.72119140625, 4.0179443359375, 4.314697265625, 4.6114501953125, 4.908203125, 5.2049560546875, 5.501708984375, 5.7984619140625, 6.09521484375, 6.3919677734375, 6.688720703125, 6.9854736328125, 7.2822265625, 7.5789794921875, 7.875732421875, 8.1724853515625, 8.46923828125, 8.7659912109375, 9.062744140625, 9.3594970703125, 9.65625]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 11.0, 17.0, 5.0, 26.0, 21.0, 36.0, 16.0, 92.0, 65.0, 136.0, 210.0, 297.0, 415.0, 622.0, 947.0, 1686.0, 2602.0, 5148.0, 11866.0, 36143.0, 260002.0, 5887625.0, 53491.0, 15276.0, 6424.0, 3120.0, 1886.0, 1071.0, 649.0, 434.0, 358.0, 241.0, 174.0, 99.0, 57.0, 34.0, 43.0, 19.0, 46.0, 10.0, 13.0, 8.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-25.78125, -24.92578125, -24.0703125, -23.21484375, -22.359375, -21.50390625, -20.6484375, -19.79296875, -18.9375, -18.08203125, -17.2265625, -16.37109375, -15.515625, -14.66015625, -13.8046875, -12.94921875, -12.09375, -11.23828125, -10.3828125, -9.52734375, -8.671875, -7.81640625, -6.9609375, -6.10546875, -5.25, -4.39453125, -3.5390625, -2.68359375, -1.828125, -0.97265625, -0.1171875, 0.73828125, 1.59375, 2.44921875, 3.3046875, 4.16015625, 5.015625, 5.87109375, 6.7265625, 7.58203125, 8.4375, 9.29296875, 10.1484375, 11.00390625, 11.859375, 12.71484375, 13.5703125, 14.42578125, 15.28125, 16.13671875, 16.9921875, 17.84765625, 18.703125, 19.55859375, 20.4140625, 21.26953125, 22.125, 22.98046875, 23.8359375, 24.69140625, 25.546875, 26.40234375, 27.2578125, 28.11328125, 28.96875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 2.0, 5.0, 3.0, 10.0, 9.0, 12.0, 15.0, 22.0, 17.0, 24.0, 30.0, 32.0, 41.0, 37.0, 51.0, 56.0, 95.0, 176.0, 394.0, 418.0, 128.0, 90.0, 59.0, 54.0, 42.0, 32.0, 25.0, 29.0, 19.0, 26.0, 23.0, 11.0, 11.0, 9.0, 6.0, 3.0, 8.0, 1.0, 0.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.859375, -6.595703125, -6.33203125, -6.068359375, -5.8046875, -5.541015625, -5.27734375, -5.013671875, -4.75, -4.486328125, -4.22265625, -3.958984375, -3.6953125, -3.431640625, -3.16796875, -2.904296875, -2.640625, -2.376953125, -2.11328125, -1.849609375, -1.5859375, -1.322265625, -1.05859375, -0.794921875, -0.53125, -0.267578125, -0.00390625, 0.259765625, 0.5234375, 0.787109375, 1.05078125, 1.314453125, 1.578125, 1.841796875, 2.10546875, 2.369140625, 2.6328125, 2.896484375, 3.16015625, 3.423828125, 3.6875, 3.951171875, 4.21484375, 4.478515625, 4.7421875, 5.005859375, 5.26953125, 5.533203125, 5.796875, 6.060546875, 6.32421875, 6.587890625, 6.8515625, 7.115234375, 7.37890625, 7.642578125, 7.90625, 8.169921875, 8.43359375, 8.697265625, 8.9609375, 9.224609375, 9.48828125, 9.751953125, 10.015625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 10.0, 8.0, 16.0, 10.0, 21.0, 44.0, 76.0, 172.0, 341.0, 131.0, 69.0, 40.0, 24.0, 15.0, 12.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-31.486644744873047, -30.686426162719727, -29.886205673217773, -29.085987091064453, -28.2857666015625, -27.48554801940918, -26.68532943725586, -25.885108947753906, -25.084888458251953, -24.284669876098633, -23.48444938659668, -22.68423080444336, -21.884010314941406, -21.083791732788086, -20.283573150634766, -19.483352661132812, -18.683134078979492, -17.882915496826172, -17.08269500732422, -16.2824764251709, -15.482255935668945, -14.682037353515625, -13.881817817687988, -13.081598281860352, -12.281378746032715, -11.481159210205078, -10.680939674377441, -9.880720138549805, -9.080501556396484, -8.280281066894531, -7.480062484741211, -6.679842948913574, -5.8796234130859375, -5.079403877258301, -4.279184341430664, -3.4789652824401855, -2.678745746612549, -1.878526210784912, -1.0783071517944336, -0.2780876159667969, 0.5221319198608398, 1.322351336479187, 2.122570753097534, 2.922790050506592, 3.7230095863342285, 4.523229122161865, 5.323448181152344, 6.1236677169799805, 6.923887252807617, 7.724106788635254, 8.52432632446289, 9.324544906616211, 10.124765396118164, 10.924983978271484, 11.725203514099121, 12.525423049926758, 13.325642585754395, 14.125862121582031, 14.926081657409668, 15.726301193237305, 16.526519775390625, 17.326740264892578, 18.1269588470459, 18.92717742919922, 19.727397918701172]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 6.0, 6.0, 7.0, 11.0, 12.0, 13.0, 10.0, 19.0, 22.0, 24.0, 24.0, 24.0, 28.0, 28.0, 35.0, 41.0, 38.0, 31.0, 39.0, 36.0, 45.0, 40.0, 37.0, 41.0, 36.0, 30.0, 35.0, 31.0, 36.0, 39.0, 25.0, 21.0, 20.0, 23.0, 16.0, 9.0, 16.0, 13.0, 6.0, 6.0, 7.0, 4.0, 6.0, 3.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.237184524536133, -8.926107406616211, -8.615030288696289, -8.303953170776367, -7.992876052856445, -7.681798934936523, -7.37072229385376, -7.059645175933838, -6.748568058013916, -6.437490940093994, -6.126413822174072, -5.81533670425415, -5.504260063171387, -5.193182945251465, -4.882105827331543, -4.571028709411621, -4.259951591491699, -3.9488744735717773, -3.6377973556518555, -3.3267204761505127, -3.015643358230591, -2.704566240310669, -2.393489360809326, -2.0824122428894043, -1.7713351249694824, -1.4602580070495605, -1.1491810083389282, -0.8381039500236511, -0.527026891708374, -0.21594977378845215, 0.09512722492218018, 0.4062042236328125, 0.717280387878418, 1.0283575057983398, 1.3394345045089722, 1.6505115032196045, 1.9615886211395264, 2.2726657390594482, 2.583742618560791, 2.894819736480713, 3.2058968544006348, 3.5169739723205566, 3.8280510902404785, 4.1391282081604, 4.450204849243164, 4.761281967163086, 5.072359085083008, 5.38343620300293, 5.694513320922852, 6.005590438842773, 6.316667556762695, 6.627744674682617, 6.938821792602539, 7.249898910522461, 7.560975551605225, 7.8720526695251465, 8.183130264282227, 8.494207382202148, 8.80528450012207, 9.116361618041992, 9.427438735961914, 9.738515853881836, 10.049592971801758, 10.36067008972168, 10.671746253967285]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 1.0, 6.0, 10.0, 8.0, 9.0, 17.0, 11.0, 18.0, 31.0, 42.0, 66.0, 74.0, 120.0, 141.0, 214.0, 313.0, 450.0, 694.0, 1202.0, 2232.0, 4459.0, 11905.0, 57596.0, 4069441.0, 27917.0, 8222.0, 3614.0, 1998.0, 1183.0, 712.0, 483.0, 329.0, 210.0, 150.0, 110.0, 65.0, 57.0, 48.0, 27.0, 26.0, 13.0, 16.0, 6.0, 8.0, 6.0, 7.0, 1.0, 7.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.030517578125, -0.02957296371459961, -0.02862834930419922, -0.027683734893798828, -0.026739120483398438, -0.025794506072998047, -0.024849891662597656, -0.023905277252197266, -0.022960662841796875, -0.022016048431396484, -0.021071434020996094, -0.020126819610595703, -0.019182205200195312, -0.018237590789794922, -0.01729297637939453, -0.01634836196899414, -0.01540374755859375, -0.01445913314819336, -0.013514518737792969, -0.012569904327392578, -0.011625289916992188, -0.010680675506591797, -0.009736061096191406, -0.008791446685791016, -0.007846832275390625, -0.006902217864990234, -0.005957603454589844, -0.005012989044189453, -0.0040683746337890625, -0.003123760223388672, -0.0021791458129882812, -0.0012345314025878906, -0.0002899169921875, 0.0006546974182128906, 0.0015993118286132812, 0.002543926239013672, 0.0034885406494140625, 0.004433155059814453, 0.005377769470214844, 0.006322383880615234, 0.007266998291015625, 0.008211612701416016, 0.009156227111816406, 0.010100841522216797, 0.011045455932617188, 0.011990070343017578, 0.012934684753417969, 0.01387929916381836, 0.01482391357421875, 0.01576852798461914, 0.01671314239501953, 0.017657756805419922, 0.018602371215820312, 0.019546985626220703, 0.020491600036621094, 0.021436214447021484, 0.022380828857421875, 0.023325443267822266, 0.024270057678222656, 0.025214672088623047, 0.026159286499023438, 0.027103900909423828, 0.02804851531982422, 0.02899312973022461, 0.029937744140625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 9.0, 4.0, 6.0, 11.0, 7.0, 10.0, 14.0, 19.0, 774.0, 26.0, 18.0, 14.0, 13.0, 12.0, 12.0, 6.0, 5.0, 6.0, 3.0, 3.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0025920867919921875, -0.0024993717670440674, -0.0024066567420959473, -0.002313941717147827, -0.002221226692199707, -0.002128511667251587, -0.002035796642303467, -0.0019430816173553467, -0.0018503665924072266, -0.0017576515674591064, -0.0016649365425109863, -0.0015722215175628662, -0.001479506492614746, -0.001386791467666626, -0.0012940764427185059, -0.0012013614177703857, -0.0011086463928222656, -0.0010159313678741455, -0.0009232163429260254, -0.0008305013179779053, -0.0007377862930297852, -0.000645071268081665, -0.0005523562431335449, -0.0004596412181854248, -0.0003669261932373047, -0.00027421116828918457, -0.00018149614334106445, -8.878111839294434e-05, 3.933906555175781e-06, 9.66489315032959e-05, 0.00018936395645141602, 0.00028207898139953613, 0.00037479400634765625, 0.00046750903129577637, 0.0005602240562438965, 0.0006529390811920166, 0.0007456541061401367, 0.0008383691310882568, 0.000931084156036377, 0.001023799180984497, 0.0011165142059326172, 0.0012092292308807373, 0.0013019442558288574, 0.0013946592807769775, 0.0014873743057250977, 0.0015800893306732178, 0.0016728043556213379, 0.001765519380569458, 0.0018582344055175781, 0.0019509494304656982, 0.0020436644554138184, 0.0021363794803619385, 0.0022290945053100586, 0.0023218095302581787, 0.002414524555206299, 0.002507239580154419, 0.002599954605102539, 0.002692669630050659, 0.0027853846549987793, 0.0028780996799468994, 0.0029708147048950195, 0.0030635297298431396, 0.0031562447547912598, 0.00324895977973938, 0.0033416748046875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 2.0, 2.0, 4.0, 7.0, 10.0, 14.0, 10.0, 17.0, 22.0, 30.0, 53.0, 84.0, 114.0, 158.0, 296.0, 525.0, 1074.0, 2667.0, 9863.0, 100972.0, 3995357.0, 70202.0, 8214.0, 2365.0, 919.0, 483.0, 281.0, 177.0, 118.0, 78.0, 47.0, 36.0, 19.0, 15.0, 19.0, 8.0, 8.0, 9.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038421630859375, -0.03696870803833008, -0.035515785217285156, -0.034062862396240234, -0.03260993957519531, -0.03115701675415039, -0.02970409393310547, -0.028251171112060547, -0.026798248291015625, -0.025345325469970703, -0.02389240264892578, -0.02243947982788086, -0.020986557006835938, -0.019533634185791016, -0.018080711364746094, -0.016627788543701172, -0.01517486572265625, -0.013721942901611328, -0.012269020080566406, -0.010816097259521484, -0.009363174438476562, -0.00791025161743164, -0.006457328796386719, -0.005004405975341797, -0.003551483154296875, -0.002098560333251953, -0.0006456375122070312, 0.0008072853088378906, 0.0022602081298828125, 0.0037131309509277344, 0.005166053771972656, 0.006618976593017578, 0.0080718994140625, 0.009524822235107422, 0.010977745056152344, 0.012430667877197266, 0.013883590698242188, 0.01533651351928711, 0.01678943634033203, 0.018242359161376953, 0.019695281982421875, 0.021148204803466797, 0.02260112762451172, 0.02405405044555664, 0.025506973266601562, 0.026959896087646484, 0.028412818908691406, 0.029865741729736328, 0.03131866455078125, 0.03277158737182617, 0.034224510192871094, 0.035677433013916016, 0.03713035583496094, 0.03858327865600586, 0.04003620147705078, 0.0414891242980957, 0.042942047119140625, 0.04439496994018555, 0.04584789276123047, 0.04730081558227539, 0.04875373840332031, 0.050206661224365234, 0.051659584045410156, 0.05311250686645508, 0.0545654296875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 5.0, 5.0, 17.0, 14.0, 23.0, 30.0, 32.0, 44.0, 64.0, 99.0, 180.0, 382.0, 2038.0, 534.0, 211.0, 135.0, 70.0, 55.0, 36.0, 23.0, 22.0, 11.0, 10.0, 10.0, 5.0, 7.0, 0.0, 3.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006481170654296875, -0.006293833255767822, -0.0061064958572387695, -0.005919158458709717, -0.005731821060180664, -0.005544483661651611, -0.005357146263122559, -0.005169808864593506, -0.004982471466064453, -0.0047951340675354, -0.004607796669006348, -0.004420459270477295, -0.004233121871948242, -0.0040457844734191895, -0.0038584470748901367, -0.003671109676361084, -0.0034837722778320312, -0.0032964348793029785, -0.0031090974807739258, -0.002921760082244873, -0.0027344226837158203, -0.0025470852851867676, -0.002359747886657715, -0.002172410488128662, -0.0019850730895996094, -0.0017977356910705566, -0.001610398292541504, -0.0014230608940124512, -0.0012357234954833984, -0.0010483860969543457, -0.000861048698425293, -0.0006737112998962402, -0.0004863739013671875, -0.00029903650283813477, -0.00011169910430908203, 7.56382942199707e-05, 0.00026297569274902344, 0.00045031309127807617, 0.0006376504898071289, 0.0008249878883361816, 0.0010123252868652344, 0.0011996626853942871, 0.0013870000839233398, 0.0015743374824523926, 0.0017616748809814453, 0.001949012279510498, 0.0021363496780395508, 0.0023236870765686035, 0.0025110244750976562, 0.002698361873626709, 0.0028856992721557617, 0.0030730366706848145, 0.003260374069213867, 0.00344771146774292, 0.0036350488662719727, 0.0038223862648010254, 0.004009723663330078, 0.004197061061859131, 0.004384398460388184, 0.004571735858917236, 0.004759073257446289, 0.004946410655975342, 0.0051337480545043945, 0.005321085453033447, 0.0055084228515625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 6.0, 42.0, 143.0, 498.0, 236.0, 43.0, 20.0, 7.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04315029829740524, -0.0403917171061039, -0.03763313218951225, -0.03487455099821091, -0.03211596608161926, -0.029357384890317917, -0.02659880369901657, -0.023840220645070076, -0.02108163759112358, -0.018323054537177086, -0.015564472414553165, -0.012805890291929245, -0.01004730723798275, -0.007288724184036255, -0.004530142992734909, -0.001771559938788414, 0.000987023115158081, 0.003745605703443289, 0.0065041882917284966, 0.009262770414352417, 0.012021353468298912, 0.014779936522245407, 0.017538517713546753, 0.020297100767493248, 0.023055683821439743, 0.025814266875386238, 0.028572849929332733, 0.03133143112063408, 0.034090012311935425, 0.03684859722852707, 0.039607178419828415, 0.04236575961112976, 0.04512433707714081, 0.047882918268442154, 0.0506415031850338, 0.053400084376335144, 0.05615866929292679, 0.058917250484228134, 0.06167583167552948, 0.06443441659212112, 0.06719300150871277, 0.06995158642530441, 0.07271016389131546, 0.0754687488079071, 0.07822733372449875, 0.0809859186410904, 0.08374449610710144, 0.08650308102369308, 0.08926165848970413, 0.09202024340629578, 0.09477882087230682, 0.09753740578889847, 0.10029599070549011, 0.10305456817150116, 0.1058131530880928, 0.10857173800468445, 0.1113303154706955, 0.11408890038728714, 0.11684747785329819, 0.11960606276988983, 0.12236464768648148, 0.12512323260307312, 0.12788181006908417, 0.13064038753509521, 0.13339897990226746]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 4.0, 7.0, 9.0, 11.0, 15.0, 18.0, 35.0, 39.0, 50.0, 47.0, 75.0, 69.0, 81.0, 76.0, 69.0, 62.0, 64.0, 46.0, 53.0, 41.0, 28.0, 15.0, 21.0, 14.0, 10.0, 7.0, 12.0, 2.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.023454368114471436, -0.022792736068367958, -0.02213110402226448, -0.021469471976161003, -0.020807839930057526, -0.020146207883954048, -0.01948457583785057, -0.018822943791747093, -0.018161311745643616, -0.017499679699540138, -0.01683804765343666, -0.016176415607333183, -0.015514783561229706, -0.014853151515126228, -0.01419151946902275, -0.013529887422919273, -0.012868255376815796, -0.012206623330712318, -0.011544991284608841, -0.010883359238505363, -0.010221727192401886, -0.009560095146298409, -0.008898463100194931, -0.008236831054091454, -0.007575199007987976, -0.006913566961884499, -0.006251934915781021, -0.005590302869677544, -0.004928670823574066, -0.004267038777470589, -0.003605406731367111, -0.0029437746852636337, -0.0022821426391601562, -0.0016205105930566788, -0.0009588785469532013, -0.0002972465008497238, 0.00036438554525375366, 0.0010260175913572311, 0.0016876496374607086, 0.002349281683564186, 0.0030109137296676636, 0.003672545775771141, 0.0043341778218746185, 0.004995809867978096, 0.0056574419140815735, 0.006319073960185051, 0.0069807060062885284, 0.007642338052392006, 0.008303970098495483, 0.008965602144598961, 0.009627234190702438, 0.010288866236805916, 0.010950498282909393, 0.01161213032901287, 0.012273762375116348, 0.012935394421219826, 0.013597026467323303, 0.01425865851342678, 0.014920290559530258, 0.015581922605633736, 0.016243554651737213, 0.01690518669784069, 0.017566818743944168, 0.018228450790047646, 0.018890082836151123]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 3.0, 10.0, 12.0, 12.0, 30.0, 34.0, 41.0, 55.0, 72.0, 102.0, 141.0, 183.0, 272.0, 390.0, 560.0, 839.0, 1366.0, 2108.0, 3458.0, 6354.0, 12152.0, 29357.0, 891614.0, 61333.0, 17316.0, 8351.0, 4576.0, 2687.0, 1687.0, 1084.0, 731.0, 470.0, 324.0, 223.0, 160.0, 130.0, 71.0, 68.0, 54.0, 36.0, 23.0, 23.0, 11.0, 9.0, 7.0, 9.0, 4.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0306396484375, -0.029674053192138672, -0.028708457946777344, -0.027742862701416016, -0.026777267456054688, -0.02581167221069336, -0.02484607696533203, -0.023880481719970703, -0.022914886474609375, -0.021949291229248047, -0.02098369598388672, -0.02001810073852539, -0.019052505493164062, -0.018086910247802734, -0.017121315002441406, -0.016155719757080078, -0.01519012451171875, -0.014224529266357422, -0.013258934020996094, -0.012293338775634766, -0.011327743530273438, -0.01036214828491211, -0.009396553039550781, -0.008430957794189453, -0.007465362548828125, -0.006499767303466797, -0.005534172058105469, -0.004568576812744141, -0.0036029815673828125, -0.0026373863220214844, -0.0016717910766601562, -0.0007061958312988281, 0.0002593994140625, 0.0012249946594238281, 0.0021905899047851562, 0.0031561851501464844, 0.0041217803955078125, 0.005087375640869141, 0.006052970886230469, 0.007018566131591797, 0.007984161376953125, 0.008949756622314453, 0.009915351867675781, 0.01088094711303711, 0.011846542358398438, 0.012812137603759766, 0.013777732849121094, 0.014743328094482422, 0.01570892333984375, 0.016674518585205078, 0.017640113830566406, 0.018605709075927734, 0.019571304321289062, 0.02053689956665039, 0.02150249481201172, 0.022468090057373047, 0.023433685302734375, 0.024399280548095703, 0.02536487579345703, 0.02633047103881836, 0.027296066284179688, 0.028261661529541016, 0.029227256774902344, 0.030192852020263672, 0.031158447265625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 6.0, 6.0, 4.0, 6.0, 7.0, 13.0, 14.0, 10.0, 27.0, 444.0, 341.0, 16.0, 22.0, 9.0, 9.0, 15.0, 8.0, 4.0, 7.0, 3.0, 4.0, 1.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002429962158203125, -0.0023435354232788086, -0.002257108688354492, -0.0021706819534301758, -0.0020842552185058594, -0.001997828483581543, -0.0019114017486572266, -0.0018249750137329102, -0.0017385482788085938, -0.0016521215438842773, -0.001565694808959961, -0.0014792680740356445, -0.0013928413391113281, -0.0013064146041870117, -0.0012199878692626953, -0.001133561134338379, -0.0010471343994140625, -0.0009607076644897461, -0.0008742809295654297, -0.0007878541946411133, -0.0007014274597167969, -0.0006150007247924805, -0.0005285739898681641, -0.00044214725494384766, -0.00035572052001953125, -0.00026929378509521484, -0.00018286705017089844, -9.644031524658203e-05, -1.0013580322265625e-05, 7.641315460205078e-05, 0.0001628398895263672, 0.0002492666244506836, 0.000335693359375, 0.0004221200942993164, 0.0005085468292236328, 0.0005949735641479492, 0.0006814002990722656, 0.000767827033996582, 0.0008542537689208984, 0.0009406805038452148, 0.0010271072387695312, 0.0011135339736938477, 0.001199960708618164, 0.0012863874435424805, 0.0013728141784667969, 0.0014592409133911133, 0.0015456676483154297, 0.001632094383239746, 0.0017185211181640625, 0.001804947853088379, 0.0018913745880126953, 0.0019778013229370117, 0.002064228057861328, 0.0021506547927856445, 0.002237081527709961, 0.0023235082626342773, 0.0024099349975585938, 0.00249636173248291, 0.0025827884674072266, 0.002669215202331543, 0.0027556419372558594, 0.0028420686721801758, 0.002928495407104492, 0.0030149221420288086, 0.003101348876953125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 8.0, 9.0, 15.0, 13.0, 17.0, 23.0, 26.0, 38.0, 81.0, 125.0, 186.0, 267.0, 437.0, 770.0, 1288.0, 2422.0, 5758.0, 19671.0, 591616.0, 396772.0, 18020.0, 5463.0, 2310.0, 1322.0, 710.0, 376.0, 264.0, 185.0, 135.0, 85.0, 59.0, 29.0, 14.0, 20.0, 9.0, 6.0, 6.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05535888671875, -0.05357170104980469, -0.051784515380859375, -0.04999732971191406, -0.04821014404296875, -0.04642295837402344, -0.044635772705078125, -0.04284858703613281, -0.0410614013671875, -0.03927421569824219, -0.037487030029296875, -0.03569984436035156, -0.03391265869140625, -0.03212547302246094, -0.030338287353515625, -0.028551101684570312, -0.026763916015625, -0.024976730346679688, -0.023189544677734375, -0.021402359008789062, -0.01961517333984375, -0.017827987670898438, -0.016040802001953125, -0.014253616333007812, -0.0124664306640625, -0.010679244995117188, -0.008892059326171875, -0.0071048736572265625, -0.00531768798828125, -0.0035305023193359375, -0.001743316650390625, 4.38690185546875e-05, 0.0018310546875, 0.0036182403564453125, 0.005405426025390625, 0.0071926116943359375, 0.00897979736328125, 0.010766983032226562, 0.012554168701171875, 0.014341354370117188, 0.0161285400390625, 0.017915725708007812, 0.019702911376953125, 0.021490097045898438, 0.02327728271484375, 0.025064468383789062, 0.026851654052734375, 0.028638839721679688, 0.030426025390625, 0.03221321105957031, 0.034000396728515625, 0.03578758239746094, 0.03757476806640625, 0.03936195373535156, 0.041149139404296875, 0.04293632507324219, 0.0447235107421875, 0.04651069641113281, 0.048297882080078125, 0.05008506774902344, 0.05187225341796875, 0.05365943908691406, 0.055446624755859375, 0.05723381042480469, 0.05902099609375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 8.0, 3.0, 12.0, 15.0, 11.0, 15.0, 14.0, 13.0, 25.0, 32.0, 37.0, 41.0, 28.0, 48.0, 48.0, 50.0, 49.0, 50.0, 56.0, 55.0, 46.0, 49.0, 47.0, 29.0, 30.0, 32.0, 30.0, 26.0, 19.0, 23.0, 16.0, 11.0, 12.0, 10.0, 7.0, 4.0, 1.0, 6.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.011871337890625, -0.011478781700134277, -0.011086225509643555, -0.010693669319152832, -0.01030111312866211, -0.009908556938171387, -0.009516000747680664, -0.009123444557189941, -0.008730888366699219, -0.008338332176208496, -0.007945775985717773, -0.007553219795227051, -0.007160663604736328, -0.0067681074142456055, -0.006375551223754883, -0.00598299503326416, -0.0055904388427734375, -0.005197882652282715, -0.004805326461791992, -0.0044127702713012695, -0.004020214080810547, -0.0036276578903198242, -0.0032351016998291016, -0.002842545509338379, -0.0024499893188476562, -0.0020574331283569336, -0.001664876937866211, -0.0012723207473754883, -0.0008797645568847656, -0.00048720836639404297, -9.465217590332031e-05, 0.00029790401458740234, 0.000690460205078125, 0.0010830163955688477, 0.0014755725860595703, 0.001868128776550293, 0.0022606849670410156, 0.0026532411575317383, 0.003045797348022461, 0.0034383535385131836, 0.0038309097290039062, 0.004223465919494629, 0.0046160221099853516, 0.005008578300476074, 0.005401134490966797, 0.0057936906814575195, 0.006186246871948242, 0.006578803062438965, 0.0069713592529296875, 0.00736391544342041, 0.007756471633911133, 0.008149027824401855, 0.008541584014892578, 0.0089341402053833, 0.009326696395874023, 0.009719252586364746, 0.010111808776855469, 0.010504364967346191, 0.010896921157836914, 0.011289477348327637, 0.01168203353881836, 0.012074589729309082, 0.012467145919799805, 0.012859702110290527, 0.01325225830078125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 9.0, 9.0, 14.0, 18.0, 30.0, 42.0, 55.0, 72.0, 112.0, 200.0, 328.0, 520.0, 1183.0, 3294.0, 15982.0, 904105.0, 110811.0, 7596.0, 2122.0, 873.0, 442.0, 237.0, 165.0, 100.0, 67.0, 42.0, 36.0, 22.0, 17.0, 15.0, 8.0, 7.0, 5.0, 2.0, 5.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0210113525390625, -0.020407676696777344, -0.019804000854492188, -0.01920032501220703, -0.018596649169921875, -0.01799297332763672, -0.017389297485351562, -0.016785621643066406, -0.01618194580078125, -0.015578269958496094, -0.014974594116210938, -0.014370918273925781, -0.013767242431640625, -0.013163566589355469, -0.012559890747070312, -0.011956214904785156, -0.0113525390625, -0.010748863220214844, -0.010145187377929688, -0.009541511535644531, -0.008937835693359375, -0.008334159851074219, -0.0077304840087890625, -0.007126808166503906, -0.00652313232421875, -0.005919456481933594, -0.0053157806396484375, -0.004712104797363281, -0.004108428955078125, -0.0035047531127929688, -0.0029010772705078125, -0.0022974014282226562, -0.0016937255859375, -0.0010900497436523438, -0.0004863739013671875, 0.00011730194091796875, 0.000720977783203125, 0.0013246536254882812, 0.0019283294677734375, 0.0025320053100585938, 0.00313568115234375, 0.0037393569946289062, 0.0043430328369140625, 0.004946708679199219, 0.005550384521484375, 0.006154060363769531, 0.0067577362060546875, 0.007361412048339844, 0.007965087890625, 0.008568763732910156, 0.009172439575195312, 0.009776115417480469, 0.010379791259765625, 0.010983467102050781, 0.011587142944335938, 0.012190818786621094, 0.01279449462890625, 0.013398170471191406, 0.014001846313476562, 0.014605522155761719, 0.015209197998046875, 0.01581287384033203, 0.016416549682617188, 0.017020225524902344, 0.0176239013671875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 6.0, 3.0, 7.0, 18.0, 15.0, 20.0, 12.0, 24.0, 39.0, 33.0, 60.0, 43.0, 79.0, 77.0, 94.0, 70.0, 68.0, 61.0, 61.0, 48.0, 38.0, 19.0, 31.0, 14.0, 12.0, 11.0, 11.0, 6.0, 5.0, 5.0, 3.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.59634780883789e-06, -9.250827133655548e-06, -8.905306458473206e-06, -8.559785783290863e-06, -8.21426510810852e-06, -7.868744432926178e-06, -7.5232237577438354e-06, -7.177703082561493e-06, -6.83218240737915e-06, -6.486661732196808e-06, -6.141141057014465e-06, -5.795620381832123e-06, -5.45009970664978e-06, -5.104579031467438e-06, -4.759058356285095e-06, -4.413537681102753e-06, -4.06801700592041e-06, -3.7224963307380676e-06, -3.376975655555725e-06, -3.0314549803733826e-06, -2.68593430519104e-06, -2.3404136300086975e-06, -1.994892954826355e-06, -1.6493722796440125e-06, -1.30385160446167e-06, -9.583309292793274e-07, -6.128102540969849e-07, -2.6728957891464233e-07, 7.82310962677002e-08, 4.237517714500427e-07, 7.692724466323853e-07, 1.1147931218147278e-06, 1.4603137969970703e-06, 1.8058344721794128e-06, 2.1513551473617554e-06, 2.496875822544098e-06, 2.8423964977264404e-06, 3.187917172908783e-06, 3.5334378480911255e-06, 3.878958523273468e-06, 4.2244791984558105e-06, 4.569999873638153e-06, 4.915520548820496e-06, 5.261041224002838e-06, 5.606561899185181e-06, 5.952082574367523e-06, 6.297603249549866e-06, 6.643123924732208e-06, 6.988644599914551e-06, 7.334165275096893e-06, 7.679685950279236e-06, 8.025206625461578e-06, 8.370727300643921e-06, 8.716247975826263e-06, 9.061768651008606e-06, 9.407289326190948e-06, 9.752810001373291e-06, 1.0098330676555634e-05, 1.0443851351737976e-05, 1.0789372026920319e-05, 1.1134892702102661e-05, 1.1480413377285004e-05, 1.1825934052467346e-05, 1.2171454727649689e-05, 1.2516975402832031e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 1.0, 2.0, 4.0, 6.0, 14.0, 13.0, 25.0, 34.0, 60.0, 87.0, 150.0, 240.0, 428.0, 789.0, 1790.0, 4825.0, 19860.0, 740286.0, 256884.0, 15773.0, 4017.0, 1562.0, 748.0, 357.0, 212.0, 119.0, 74.0, 55.0, 44.0, 32.0, 19.0, 15.0, 13.0, 5.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0309295654296875, -0.030044078826904297, -0.029158592224121094, -0.02827310562133789, -0.027387619018554688, -0.026502132415771484, -0.02561664581298828, -0.024731159210205078, -0.023845672607421875, -0.022960186004638672, -0.02207469940185547, -0.021189212799072266, -0.020303726196289062, -0.01941823959350586, -0.018532752990722656, -0.017647266387939453, -0.01676177978515625, -0.015876293182373047, -0.014990806579589844, -0.01410531997680664, -0.013219833374023438, -0.012334346771240234, -0.011448860168457031, -0.010563373565673828, -0.009677886962890625, -0.008792400360107422, -0.007906913757324219, -0.007021427154541016, -0.0061359405517578125, -0.005250453948974609, -0.004364967346191406, -0.003479480743408203, -0.002593994140625, -0.0017085075378417969, -0.0008230209350585938, 6.246566772460938e-05, 0.0009479522705078125, 0.0018334388732910156, 0.0027189254760742188, 0.003604412078857422, 0.004489898681640625, 0.005375385284423828, 0.006260871887207031, 0.007146358489990234, 0.008031845092773438, 0.00891733169555664, 0.009802818298339844, 0.010688304901123047, 0.01157379150390625, 0.012459278106689453, 0.013344764709472656, 0.01423025131225586, 0.015115737915039062, 0.016001224517822266, 0.01688671112060547, 0.017772197723388672, 0.018657684326171875, 0.019543170928955078, 0.02042865753173828, 0.021314144134521484, 0.022199630737304688, 0.02308511734008789, 0.023970603942871094, 0.024856090545654297, 0.0257415771484375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 1.0, 4.0, 8.0, 5.0, 4.0, 11.0, 7.0, 12.0, 17.0, 9.0, 26.0, 52.0, 162.0, 323.0, 188.0, 70.0, 30.0, 25.0, 12.0, 6.0, 6.0, 6.0, 4.0, 1.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.017669677734375, -0.01710963249206543, -0.01654958724975586, -0.01598954200744629, -0.015429496765136719, -0.014869451522827148, -0.014309406280517578, -0.013749361038208008, -0.013189315795898438, -0.012629270553588867, -0.012069225311279297, -0.011509180068969727, -0.010949134826660156, -0.010389089584350586, -0.009829044342041016, -0.009268999099731445, -0.008708953857421875, -0.008148908615112305, -0.007588863372802734, -0.007028818130493164, -0.006468772888183594, -0.0059087276458740234, -0.005348682403564453, -0.004788637161254883, -0.0042285919189453125, -0.003668546676635742, -0.003108501434326172, -0.0025484561920166016, -0.0019884109497070312, -0.001428365707397461, -0.0008683204650878906, -0.0003082752227783203, 0.00025177001953125, 0.0008118152618408203, 0.0013718605041503906, 0.001931905746459961, 0.0024919509887695312, 0.0030519962310791016, 0.003612041473388672, 0.004172086715698242, 0.0047321319580078125, 0.005292177200317383, 0.005852222442626953, 0.0064122676849365234, 0.006972312927246094, 0.007532358169555664, 0.008092403411865234, 0.008652448654174805, 0.009212493896484375, 0.009772539138793945, 0.010332584381103516, 0.010892629623413086, 0.011452674865722656, 0.012012720108032227, 0.012572765350341797, 0.013132810592651367, 0.013692855834960938, 0.014252901077270508, 0.014812946319580078, 0.015372991561889648, 0.01593303680419922, 0.01649308204650879, 0.01705312728881836, 0.01761317253112793, 0.0181732177734375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 2.0, 8.0, 12.0, 20.0, 46.0, 457.0, 360.0, 39.0, 21.0, 8.0, 6.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4165916442871094, -0.4005395770072937, -0.384487509727478, -0.36843544244766235, -0.3523833751678467, -0.336331307888031, -0.3202792704105377, -0.30422720313072205, -0.28817513585090637, -0.2721230685710907, -0.256071001291275, -0.24001894891262054, -0.22396688163280487, -0.2079148143529892, -0.19186276197433472, -0.17581069469451904, -0.15975862741470337, -0.1437065601348877, -0.12765449285507202, -0.11160244047641754, -0.09555037319660187, -0.0794983059167862, -0.06344624608755112, -0.04739418625831604, -0.031342118978500366, -0.01529005542397499, 0.0007620081305503845, 0.01681407168507576, 0.032866135239601135, 0.04891820251941681, 0.06497026234865189, 0.08102232217788696, 0.09707438945770264, 0.11312645673751831, 0.12917852401733398, 0.14523057639598846, 0.16128264367580414, 0.1773347109556198, 0.1933867633342743, 0.20943883061408997, 0.22549089789390564, 0.2415429651737213, 0.257595032453537, 0.27364709973335266, 0.28969913721084595, 0.3057512044906616, 0.3218032717704773, 0.33785533905029297, 0.35390740633010864, 0.3699594736099243, 0.38601154088974, 0.40206360816955566, 0.41811567544937134, 0.434167742729187, 0.4502197802066803, 0.46627184748649597, 0.48232391476631165, 0.4983759820461273, 0.5144280195236206, 0.5304800868034363, 0.546532154083252, 0.5625842213630676, 0.5786362886428833, 0.594688355922699, 0.6107404232025146]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 6.0, 2.0, 4.0, 5.0, 3.0, 4.0, 8.0, 13.0, 8.0, 18.0, 23.0, 36.0, 63.0, 118.0, 151.0, 180.0, 127.0, 90.0, 51.0, 27.0, 16.0, 12.0, 8.0, 8.0, 8.0, 2.0, 5.0, 0.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2642490267753601, -0.2569133937358856, -0.24957779049873352, -0.24224215745925903, -0.23490653932094574, -0.22757092118263245, -0.22023528814315796, -0.21289967000484467, -0.20556405186653137, -0.19822843372821808, -0.19089281558990479, -0.1835571825504303, -0.176221564412117, -0.1688859462738037, -0.16155031323432922, -0.15421469509601593, -0.14687907695770264, -0.13954345881938934, -0.13220784068107605, -0.12487220764160156, -0.11753658950328827, -0.11020097136497498, -0.10286534577608109, -0.0955297201871872, -0.0881941020488739, -0.08085848391056061, -0.07352285832166672, -0.06618723273277283, -0.058851614594459534, -0.05151599273085594, -0.04418037086725235, -0.03684474900364876, -0.029509127140045166, -0.022173505276441574, -0.014837883412837982, -0.00750226154923439, -0.00016663968563079834, 0.007168982177972794, 0.014504604041576385, 0.021840225905179977, 0.02917584776878357, 0.03651146963238716, 0.04384709149599075, 0.051182713359594345, 0.05851833522319794, 0.06585395336151123, 0.07318957895040512, 0.08052520453929901, 0.0878608226776123, 0.0951964408159256, 0.10253206640481949, 0.10986769199371338, 0.11720331013202667, 0.12453892827033997, 0.13187456130981445, 0.13921017944812775, 0.14654579758644104, 0.15388141572475433, 0.16121703386306763, 0.16855266690254211, 0.1758882850408554, 0.1832239031791687, 0.1905595362186432, 0.19789515435695648, 0.20523077249526978]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 6.0, 4.0, 1.0, 10.0, 6.0, 10.0, 16.0, 14.0, 26.0, 30.0, 65.0, 238.0, 3233.0, 4156485.0, 33120.0, 753.0, 93.0, 43.0, 23.0, 23.0, 14.0, 14.0, 15.0, 9.0, 3.0, 4.0, 2.0, 5.0, 3.0, 6.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.27734375, -3.17730712890625, -3.0772705078125, -2.97723388671875, -2.877197265625, -2.77716064453125, -2.6771240234375, -2.57708740234375, -2.47705078125, -2.37701416015625, -2.2769775390625, -2.17694091796875, -2.076904296875, -1.97686767578125, -1.8768310546875, -1.77679443359375, -1.6767578125, -1.57672119140625, -1.4766845703125, -1.37664794921875, -1.276611328125, -1.17657470703125, -1.0765380859375, -0.97650146484375, -0.87646484375, -0.77642822265625, -0.6763916015625, -0.57635498046875, -0.476318359375, -0.37628173828125, -0.2762451171875, -0.17620849609375, -0.076171875, 0.02386474609375, 0.1239013671875, 0.22393798828125, 0.323974609375, 0.42401123046875, 0.5240478515625, 0.62408447265625, 0.72412109375, 0.82415771484375, 0.9241943359375, 1.02423095703125, 1.124267578125, 1.22430419921875, 1.3243408203125, 1.42437744140625, 1.5244140625, 1.62445068359375, 1.7244873046875, 1.82452392578125, 1.924560546875, 2.02459716796875, 2.1246337890625, 2.22467041015625, 2.32470703125, 2.42474365234375, 2.5247802734375, 2.62481689453125, 2.724853515625, 2.82489013671875, 2.9249267578125, 3.02496337890625, 3.125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 8.0, 3.0, 6.0, 5.0, 4.0, 8.0, 11.0, 11.0, 9.0, 14.0, 29.0, 276.0, 442.0, 62.0, 13.0, 17.0, 13.0, 10.0, 9.0, 7.0, 6.0, 9.0, 4.0, 3.0, 2.0, 4.0, 6.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0022449493408203125, -0.0021733343601226807, -0.002101719379425049, -0.002030104398727417, -0.001958489418029785, -0.0018868744373321533, -0.0018152594566345215, -0.0017436444759368896, -0.0016720294952392578, -0.001600414514541626, -0.0015287995338439941, -0.0014571845531463623, -0.0013855695724487305, -0.0013139545917510986, -0.0012423396110534668, -0.001170724630355835, -0.0010991096496582031, -0.0010274946689605713, -0.0009558796882629395, -0.0008842647075653076, -0.0008126497268676758, -0.0007410347461700439, -0.0006694197654724121, -0.0005978047847747803, -0.0005261898040771484, -0.0004545748233795166, -0.00038295984268188477, -0.00031134486198425293, -0.0002397298812866211, -0.00016811490058898926, -9.649991989135742e-05, -2.4884939193725586e-05, 4.673004150390625e-05, 0.00011834502220153809, 0.00018996000289916992, 0.00026157498359680176, 0.0003331899642944336, 0.00040480494499206543, 0.00047641992568969727, 0.0005480349063873291, 0.0006196498870849609, 0.0006912648677825928, 0.0007628798484802246, 0.0008344948291778564, 0.0009061098098754883, 0.0009777247905731201, 0.001049339771270752, 0.0011209547519683838, 0.0011925697326660156, 0.0012641847133636475, 0.0013357996940612793, 0.0014074146747589111, 0.001479029655456543, 0.0015506446361541748, 0.0016222596168518066, 0.0016938745975494385, 0.0017654895782470703, 0.0018371045589447021, 0.001908719539642334, 0.001980334520339966, 0.0020519495010375977, 0.0021235644817352295, 0.0021951794624328613, 0.002266794443130493, 0.002338409423828125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 2.0, 3.0, 7.0, 11.0, 10.0, 17.0, 20.0, 28.0, 37.0, 51.0, 67.0, 69.0, 82.0, 110.0, 125.0, 187.0, 1524.0, 4082424.0, 107701.0, 814.0, 230.0, 132.0, 122.0, 99.0, 83.0, 69.0, 51.0, 36.0, 36.0, 26.0, 29.0, 20.0, 14.0, 13.0, 9.0, 10.0, 6.0, 5.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5634765625, -0.5463333129882812, -0.5291900634765625, -0.5120468139648438, -0.494903564453125, -0.47776031494140625, -0.4606170654296875, -0.44347381591796875, -0.42633056640625, -0.40918731689453125, -0.3920440673828125, -0.37490081787109375, -0.357757568359375, -0.34061431884765625, -0.3234710693359375, -0.30632781982421875, -0.2891845703125, -0.27204132080078125, -0.2548980712890625, -0.23775482177734375, -0.220611572265625, -0.20346832275390625, -0.1863250732421875, -0.16918182373046875, -0.15203857421875, -0.13489532470703125, -0.1177520751953125, -0.10060882568359375, -0.083465576171875, -0.06632232666015625, -0.0491790771484375, -0.03203582763671875, -0.014892578125, 0.00225067138671875, 0.0193939208984375, 0.03653717041015625, 0.053680419921875, 0.07082366943359375, 0.0879669189453125, 0.10511016845703125, 0.12225341796875, 0.13939666748046875, 0.1565399169921875, 0.17368316650390625, 0.190826416015625, 0.20796966552734375, 0.2251129150390625, 0.24225616455078125, 0.2593994140625, 0.27654266357421875, 0.2936859130859375, 0.31082916259765625, 0.327972412109375, 0.34511566162109375, 0.3622589111328125, 0.37940216064453125, 0.39654541015625, 0.41368865966796875, 0.4308319091796875, 0.44797515869140625, 0.465118408203125, 0.48226165771484375, 0.4994049072265625, 0.5165481567382812, 0.53369140625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 5.0, 3.0, 3.0, 7.0, 7.0, 10.0, 11.0, 22.0, 28.0, 37.0, 45.0, 68.0, 69.0, 80.0, 109.0, 140.0, 164.0, 193.0, 295.0, 1218.0, 296.0, 247.0, 190.0, 156.0, 143.0, 112.0, 85.0, 68.0, 47.0, 40.0, 37.0, 28.0, 26.0, 22.0, 13.0, 14.0, 11.0, 10.0, 7.0, 5.0, 4.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004302978515625, -0.004170775413513184, -0.004038572311401367, -0.003906369209289551, -0.0037741661071777344, -0.003641963005065918, -0.0035097599029541016, -0.003377556800842285, -0.0032453536987304688, -0.0031131505966186523, -0.002980947494506836, -0.0028487443923950195, -0.002716541290283203, -0.0025843381881713867, -0.0024521350860595703, -0.002319931983947754, -0.0021877288818359375, -0.002055525779724121, -0.0019233226776123047, -0.0017911195755004883, -0.0016589164733886719, -0.0015267133712768555, -0.001394510269165039, -0.0012623071670532227, -0.0011301040649414062, -0.0009979009628295898, -0.0008656978607177734, -0.000733494758605957, -0.0006012916564941406, -0.0004690885543823242, -0.0003368854522705078, -0.0002046823501586914, -7.2479248046875e-05, 5.9723854064941406e-05, 0.0001919269561767578, 0.0003241300582885742, 0.0004563331604003906, 0.000588536262512207, 0.0007207393646240234, 0.0008529424667358398, 0.0009851455688476562, 0.0011173486709594727, 0.001249551773071289, 0.0013817548751831055, 0.0015139579772949219, 0.0016461610794067383, 0.0017783641815185547, 0.001910567283630371, 0.0020427703857421875, 0.002174973487854004, 0.0023071765899658203, 0.0024393796920776367, 0.002571582794189453, 0.0027037858963012695, 0.002835988998413086, 0.0029681921005249023, 0.0031003952026367188, 0.003232598304748535, 0.0033648014068603516, 0.003497004508972168, 0.0036292076110839844, 0.0037614107131958008, 0.003893613815307617, 0.004025816917419434, 0.00415802001953125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 17.0, 747.0, 208.0, 28.0, 11.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05087721720337868, -0.0319625586271286, -0.013047903776168823, 0.005866754800081253, 0.02478140965104103, 0.04369606450200081, 0.06261073052883148, 0.08152538537979126, 0.10044004023075104, 0.11935469508171082, 0.1382693499326706, 0.15718400478363037, 0.17609867453575134, 0.19501331448554993, 0.2139279842376709, 0.23284263908863068, 0.25175729393959045, 0.2706719636917114, 0.28958660364151, 0.308501273393631, 0.32741591334342957, 0.34633058309555054, 0.3652452230453491, 0.3841598927974701, 0.4030745327472687, 0.42198920249938965, 0.44090384244918823, 0.4598185122013092, 0.4787331521511078, 0.49764782190322876, 0.5165624618530273, 0.5354771614074707, 0.5543918013572693, 0.5733064413070679, 0.5922211408615112, 0.6111357808113098, 0.6300504207611084, 0.648965060710907, 0.6678797602653503, 0.6867944002151489, 0.7057090401649475, 0.7246236801147461, 0.7435383796691895, 0.762453019618988, 0.7813676595687866, 0.8002822995185852, 0.8191969990730286, 0.8381116390228271, 0.8570263385772705, 0.8759409785270691, 0.8948556780815125, 0.913770318031311, 0.9326849579811096, 0.9515995979309082, 0.9705142974853516, 0.9894289374351501, 1.0083435773849487, 1.027258276939392, 1.046172857284546, 1.0650875568389893, 1.0840022563934326, 1.1029168367385864, 1.1218315362930298, 1.1407461166381836, 1.159660816192627]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 3.0, 11.0, 2.0, 8.0, 13.0, 15.0, 20.0, 27.0, 26.0, 41.0, 60.0, 55.0, 68.0, 60.0, 70.0, 82.0, 70.0, 61.0, 64.0, 50.0, 39.0, 40.0, 28.0, 30.0, 10.0, 13.0, 18.0, 10.0, 6.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.061509907245635986, -0.05964859575033188, -0.05778728798031807, -0.05592598021030426, -0.05406466871500015, -0.052203357219696045, -0.050342049449682236, -0.048480741679668427, -0.04661943018436432, -0.04475811868906021, -0.0428968109190464, -0.04103550314903259, -0.039174191653728485, -0.03731288015842438, -0.03545157238841057, -0.03359026461839676, -0.03172895312309265, -0.029867643490433693, -0.028006333857774734, -0.026145024225115776, -0.024283714592456818, -0.02242240495979786, -0.0205610953271389, -0.018699785694479942, -0.016838476061820984, -0.014977166429162025, -0.013115856796503067, -0.011254547163844109, -0.00939323753118515, -0.007531927898526192, -0.005670618265867233, -0.003809308633208275, -0.0019479990005493164, -8.668936789035797e-05, 0.0017746202647686005, 0.003635929897427559, 0.005497239530086517, 0.007358549162745476, 0.009219858795404434, 0.011081168428063393, 0.012942478060722351, 0.01480378769338131, 0.016665097326040268, 0.018526406958699226, 0.020387716591358185, 0.022249026224017143, 0.0241103358566761, 0.02597164548933506, 0.02783295512199402, 0.029694264754652977, 0.031555574387311935, 0.033416882157325745, 0.03527819365262985, 0.03713950514793396, 0.03900081291794777, 0.04086212068796158, 0.042723432183265686, 0.044584743678569794, 0.0464460514485836, 0.04830735921859741, 0.05016867071390152, 0.05202998220920563, 0.05389128997921944, 0.055752597749233246, 0.057613909244537354]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 8.0, 13.0, 21.0, 19.0, 33.0, 34.0, 54.0, 63.0, 120.0, 206.0, 286.0, 454.0, 684.0, 1151.0, 2132.0, 4030.0, 8322.0, 20365.0, 203337.0, 762379.0, 25011.0, 9601.0, 4550.0, 2295.0, 1234.0, 740.0, 461.0, 330.0, 208.0, 141.0, 76.0, 51.0, 45.0, 42.0, 23.0, 13.0, 8.0, 3.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04931640625, -0.04762125015258789, -0.04592609405517578, -0.04423093795776367, -0.04253578186035156, -0.04084062576293945, -0.039145469665527344, -0.037450313568115234, -0.035755157470703125, -0.034060001373291016, -0.032364845275878906, -0.030669689178466797, -0.028974533081054688, -0.027279376983642578, -0.02558422088623047, -0.02388906478881836, -0.02219390869140625, -0.02049875259399414, -0.01880359649658203, -0.017108440399169922, -0.015413284301757812, -0.013718128204345703, -0.012022972106933594, -0.010327816009521484, -0.008632659912109375, -0.006937503814697266, -0.005242347717285156, -0.003547191619873047, -0.0018520355224609375, -0.00015687942504882812, 0.0015382766723632812, 0.0032334327697753906, 0.0049285888671875, 0.006623744964599609, 0.008318901062011719, 0.010014057159423828, 0.011709213256835938, 0.013404369354248047, 0.015099525451660156, 0.016794681549072266, 0.018489837646484375, 0.020184993743896484, 0.021880149841308594, 0.023575305938720703, 0.025270462036132812, 0.026965618133544922, 0.02866077423095703, 0.03035593032836914, 0.03205108642578125, 0.03374624252319336, 0.03544139862060547, 0.03713655471801758, 0.03883171081542969, 0.0405268669128418, 0.042222023010253906, 0.043917179107666016, 0.045612335205078125, 0.047307491302490234, 0.049002647399902344, 0.05069780349731445, 0.05239295959472656, 0.05408811569213867, 0.05578327178955078, 0.05747842788696289, 0.059173583984375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 5.0, 4.0, 3.0, 4.0, 8.0, 6.0, 12.0, 18.0, 14.0, 28.0, 134.0, 418.0, 215.0, 53.0, 13.0, 15.0, 17.0, 8.0, 9.0, 4.0, 7.0, 3.0, 3.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0036563873291015625, -0.00357075035572052, -0.0034851133823394775, -0.003399476408958435, -0.0033138394355773926, -0.00322820246219635, -0.0031425654888153076, -0.003056928515434265, -0.0029712915420532227, -0.00288565456867218, -0.0028000175952911377, -0.002714380621910095, -0.0026287436485290527, -0.0025431066751480103, -0.0024574697017669678, -0.0023718327283859253, -0.002286195755004883, -0.0022005587816238403, -0.002114921808242798, -0.0020292848348617554, -0.0019436478614807129, -0.0018580108880996704, -0.001772373914718628, -0.0016867369413375854, -0.001601099967956543, -0.0015154629945755005, -0.001429826021194458, -0.0013441890478134155, -0.001258552074432373, -0.0011729151010513306, -0.001087278127670288, -0.0010016411542892456, -0.0009160041809082031, -0.0008303672075271606, -0.0007447302341461182, -0.0006590932607650757, -0.0005734562873840332, -0.0004878193140029907, -0.00040218234062194824, -0.00031654536724090576, -0.00023090839385986328, -0.0001452714204788208, -5.963444709777832e-05, 2.600252628326416e-05, 0.00011163949966430664, 0.00019727647304534912, 0.0002829134464263916, 0.0003685504198074341, 0.00045418739318847656, 0.000539824366569519, 0.0006254613399505615, 0.000711098313331604, 0.0007967352867126465, 0.000882372260093689, 0.0009680092334747314, 0.001053646206855774, 0.0011392831802368164, 0.0012249201536178589, 0.0013105571269989014, 0.0013961941003799438, 0.0014818310737609863, 0.0015674680471420288, 0.0016531050205230713, 0.0017387419939041138, 0.0018243789672851562]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 4.0, 4.0, 8.0, 6.0, 9.0, 17.0, 11.0, 10.0, 18.0, 17.0, 23.0, 20.0, 25.0, 36.0, 23.0, 41.0, 45.0, 72.0, 300.0, 1728.0, 23055.0, 1002002.0, 18928.0, 1495.0, 243.0, 79.0, 46.0, 37.0, 36.0, 31.0, 36.0, 25.0, 19.0, 14.0, 13.0, 12.0, 13.0, 9.0, 8.0, 8.0, 5.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.10009765625, -0.09691715240478516, -0.09373664855957031, -0.09055614471435547, -0.08737564086914062, -0.08419513702392578, -0.08101463317871094, -0.0778341293334961, -0.07465362548828125, -0.0714731216430664, -0.06829261779785156, -0.06511211395263672, -0.061931610107421875, -0.05875110626220703, -0.05557060241699219, -0.052390098571777344, -0.0492095947265625, -0.046029090881347656, -0.04284858703613281, -0.03966808319091797, -0.036487579345703125, -0.03330707550048828, -0.030126571655273438, -0.026946067810058594, -0.02376556396484375, -0.020585060119628906, -0.017404556274414062, -0.014224052429199219, -0.011043548583984375, -0.007863044738769531, -0.0046825408935546875, -0.0015020370483398438, 0.001678466796875, 0.004858970642089844, 0.008039474487304688, 0.011219978332519531, 0.014400482177734375, 0.01758098602294922, 0.020761489868164062, 0.023941993713378906, 0.02712249755859375, 0.030303001403808594, 0.03348350524902344, 0.03666400909423828, 0.039844512939453125, 0.04302501678466797, 0.04620552062988281, 0.049386024475097656, 0.0525665283203125, 0.055747032165527344, 0.05892753601074219, 0.06210803985595703, 0.06528854370117188, 0.06846904754638672, 0.07164955139160156, 0.0748300552368164, 0.07801055908203125, 0.0811910629272461, 0.08437156677246094, 0.08755207061767578, 0.09073257446289062, 0.09391307830810547, 0.09709358215332031, 0.10027408599853516, 0.10345458984375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 8.0, 7.0, 6.0, 8.0, 11.0, 10.0, 14.0, 15.0, 14.0, 13.0, 12.0, 34.0, 27.0, 33.0, 27.0, 40.0, 42.0, 52.0, 31.0, 47.0, 52.0, 30.0, 39.0, 39.0, 41.0, 44.0, 36.0, 38.0, 31.0, 23.0, 22.0, 24.0, 27.0, 18.0, 9.0, 22.0, 11.0, 9.0, 9.0, 7.0, 6.0, 5.0, 3.0, 4.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00580596923828125, -0.005625486373901367, -0.005445003509521484, -0.0052645206451416016, -0.005084037780761719, -0.004903554916381836, -0.004723072052001953, -0.00454258918762207, -0.0043621063232421875, -0.004181623458862305, -0.004001140594482422, -0.003820657730102539, -0.0036401748657226562, -0.0034596920013427734, -0.0032792091369628906, -0.003098726272583008, -0.002918243408203125, -0.002737760543823242, -0.0025572776794433594, -0.0023767948150634766, -0.0021963119506835938, -0.002015829086303711, -0.0018353462219238281, -0.0016548633575439453, -0.0014743804931640625, -0.0012938976287841797, -0.0011134147644042969, -0.0009329319000244141, -0.0007524490356445312, -0.0005719661712646484, -0.0003914833068847656, -0.0002110004425048828, -3.0517578125e-05, 0.0001499652862548828, 0.0003304481506347656, 0.0005109310150146484, 0.0006914138793945312, 0.0008718967437744141, 0.0010523796081542969, 0.0012328624725341797, 0.0014133453369140625, 0.0015938282012939453, 0.0017743110656738281, 0.001954793930053711, 0.0021352767944335938, 0.0023157596588134766, 0.0024962425231933594, 0.002676725387573242, 0.002857208251953125, 0.003037691116333008, 0.0032181739807128906, 0.0033986568450927734, 0.0035791397094726562, 0.003759622573852539, 0.003940105438232422, 0.004120588302612305, 0.0043010711669921875, 0.00448155403137207, 0.004662036895751953, 0.004842519760131836, 0.005023002624511719, 0.0052034854888916016, 0.005383968353271484, 0.005564451217651367, 0.00574493408203125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 2.0, 5.0, 5.0, 7.0, 5.0, 8.0, 15.0, 22.0, 20.0, 22.0, 60.0, 139.0, 1227.0, 943641.0, 102195.0, 871.0, 144.0, 44.0, 36.0, 25.0, 11.0, 14.0, 10.0, 10.0, 4.0, 2.0, 1.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09539794921875, -0.0923147201538086, -0.08923149108886719, -0.08614826202392578, -0.08306503295898438, -0.07998180389404297, -0.07689857482910156, -0.07381534576416016, -0.07073211669921875, -0.06764888763427734, -0.06456565856933594, -0.06148242950439453, -0.058399200439453125, -0.05531597137451172, -0.05223274230957031, -0.049149513244628906, -0.0460662841796875, -0.042983055114746094, -0.03989982604980469, -0.03681659698486328, -0.033733367919921875, -0.03065013885498047, -0.027566909790039062, -0.024483680725097656, -0.02140045166015625, -0.018317222595214844, -0.015233993530273438, -0.012150764465332031, -0.009067535400390625, -0.005984306335449219, -0.0029010772705078125, 0.00018215179443359375, 0.003265380859375, 0.006348609924316406, 0.009431838989257812, 0.012515068054199219, 0.015598297119140625, 0.01868152618408203, 0.021764755249023438, 0.024847984313964844, 0.02793121337890625, 0.031014442443847656, 0.03409767150878906, 0.03718090057373047, 0.040264129638671875, 0.04334735870361328, 0.04643058776855469, 0.049513816833496094, 0.0525970458984375, 0.055680274963378906, 0.05876350402832031, 0.06184673309326172, 0.06492996215820312, 0.06801319122314453, 0.07109642028808594, 0.07417964935302734, 0.07726287841796875, 0.08034610748291016, 0.08342933654785156, 0.08651256561279297, 0.08959579467773438, 0.09267902374267578, 0.09576225280761719, 0.0988454818725586, 0.1019287109375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 8.0, 4.0, 6.0, 10.0, 11.0, 14.0, 24.0, 28.0, 61.0, 83.0, 289.0, 258.0, 66.0, 39.0, 26.0, 16.0, 19.0, 17.0, 7.0, 7.0, 6.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00020933151245117188, -0.00020456314086914062, -0.00019979476928710938, -0.00019502639770507812, -0.00019025802612304688, -0.00018548965454101562, -0.00018072128295898438, -0.00017595291137695312, -0.00017118453979492188, -0.00016641616821289062, -0.00016164779663085938, -0.00015687942504882812, -0.00015211105346679688, -0.00014734268188476562, -0.00014257431030273438, -0.00013780593872070312, -0.00013303756713867188, -0.00012826919555664062, -0.00012350082397460938, -0.00011873245239257812, -0.00011396408081054688, -0.00010919570922851562, -0.00010442733764648438, -9.965896606445312e-05, -9.489059448242188e-05, -9.012222290039062e-05, -8.535385131835938e-05, -8.058547973632812e-05, -7.581710815429688e-05, -7.104873657226562e-05, -6.628036499023438e-05, -6.151199340820312e-05, -5.6743621826171875e-05, -5.1975250244140625e-05, -4.7206878662109375e-05, -4.2438507080078125e-05, -3.7670135498046875e-05, -3.2901763916015625e-05, -2.8133392333984375e-05, -2.3365020751953125e-05, -1.8596649169921875e-05, -1.3828277587890625e-05, -9.059906005859375e-06, -4.291534423828125e-06, 4.76837158203125e-07, 5.245208740234375e-06, 1.0013580322265625e-05, 1.4781951904296875e-05, 1.9550323486328125e-05, 2.4318695068359375e-05, 2.9087066650390625e-05, 3.3855438232421875e-05, 3.8623809814453125e-05, 4.3392181396484375e-05, 4.8160552978515625e-05, 5.2928924560546875e-05, 5.7697296142578125e-05, 6.246566772460938e-05, 6.723403930664062e-05, 7.200241088867188e-05, 7.677078247070312e-05, 8.153915405273438e-05, 8.630752563476562e-05, 9.107589721679688e-05, 9.584426879882812e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 6.0, 2.0, 8.0, 12.0, 28.0, 38.0, 52.0, 113.0, 306.0, 1029.0, 5871.0, 880770.0, 154203.0, 4670.0, 890.0, 269.0, 122.0, 60.0, 26.0, 20.0, 15.0, 8.0, 12.0, 6.0, 7.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08489990234375, -0.0814962387084961, -0.07809257507324219, -0.07468891143798828, -0.07128524780273438, -0.06788158416748047, -0.06447792053222656, -0.061074256896972656, -0.05767059326171875, -0.054266929626464844, -0.05086326599121094, -0.04745960235595703, -0.044055938720703125, -0.04065227508544922, -0.03724861145019531, -0.033844947814941406, -0.0304412841796875, -0.027037620544433594, -0.023633956909179688, -0.02023029327392578, -0.016826629638671875, -0.013422966003417969, -0.010019302368164062, -0.006615638732910156, -0.00321197509765625, 0.00019168853759765625, 0.0035953521728515625, 0.006999015808105469, 0.010402679443359375, 0.013806343078613281, 0.017210006713867188, 0.020613670349121094, 0.024017333984375, 0.027420997619628906, 0.030824661254882812, 0.03422832489013672, 0.037631988525390625, 0.04103565216064453, 0.04443931579589844, 0.047842979431152344, 0.05124664306640625, 0.054650306701660156, 0.05805397033691406, 0.06145763397216797, 0.06486129760742188, 0.06826496124267578, 0.07166862487792969, 0.0750722885131836, 0.0784759521484375, 0.0818796157836914, 0.08528327941894531, 0.08868694305419922, 0.09209060668945312, 0.09549427032470703, 0.09889793395996094, 0.10230159759521484, 0.10570526123046875, 0.10910892486572266, 0.11251258850097656, 0.11591625213623047, 0.11931991577148438, 0.12272357940673828, 0.1261272430419922, 0.1295309066772461, 0.1329345703125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 7.0, 5.0, 7.0, 12.0, 20.0, 31.0, 49.0, 136.0, 544.0, 99.0, 33.0, 18.0, 17.0, 5.0, 6.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0232696533203125, -0.022275209426879883, -0.021280765533447266, -0.02028632164001465, -0.01929187774658203, -0.018297433853149414, -0.017302989959716797, -0.01630854606628418, -0.015314102172851562, -0.014319658279418945, -0.013325214385986328, -0.012330770492553711, -0.011336326599121094, -0.010341882705688477, -0.00934743881225586, -0.008352994918823242, -0.007358551025390625, -0.006364107131958008, -0.005369663238525391, -0.0043752193450927734, -0.0033807754516601562, -0.002386331558227539, -0.0013918876647949219, -0.0003974437713623047, 0.0005970001220703125, 0.0015914440155029297, 0.002585887908935547, 0.003580331802368164, 0.004574775695800781, 0.0055692195892333984, 0.006563663482666016, 0.007558107376098633, 0.00855255126953125, 0.009546995162963867, 0.010541439056396484, 0.011535882949829102, 0.012530326843261719, 0.013524770736694336, 0.014519214630126953, 0.01551365852355957, 0.016508102416992188, 0.017502546310424805, 0.018496990203857422, 0.01949143409729004, 0.020485877990722656, 0.021480321884155273, 0.02247476577758789, 0.023469209671020508, 0.024463653564453125, 0.025458097457885742, 0.02645254135131836, 0.027446985244750977, 0.028441429138183594, 0.02943587303161621, 0.030430316925048828, 0.031424760818481445, 0.03241920471191406, 0.03341364860534668, 0.0344080924987793, 0.035402536392211914, 0.03639698028564453, 0.03739142417907715, 0.038385868072509766, 0.03938031196594238, 0.040374755859375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 8.0, 25.0, 171.0, 689.0, 90.0, 20.0, 6.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.7421064376831055, -0.7279297709465027, -0.7137531042098999, -0.6995764374732971, -0.6853997707366943, -0.6712231040000916, -0.6570464372634888, -0.642869770526886, -0.6286931037902832, -0.6145164370536804, -0.6003397703170776, -0.5861631035804749, -0.5719864368438721, -0.5578097701072693, -0.5436331033706665, -0.5294564366340637, -0.5152798295021057, -0.5011031627655029, -0.48692649602890015, -0.47274982929229736, -0.4585731625556946, -0.4443964958190918, -0.430219829082489, -0.4160431921482086, -0.40186649560928345, -0.38768982887268066, -0.3735131621360779, -0.3593364953994751, -0.3451598286628723, -0.33098316192626953, -0.31680649518966675, -0.30262985825538635, -0.2884531617164612, -0.2742764949798584, -0.2600998282432556, -0.24592316150665283, -0.23174650967121124, -0.21756984293460846, -0.20339317619800568, -0.1892165243625641, -0.1750398576259613, -0.16086319088935852, -0.14668652415275574, -0.13250985741615295, -0.11833320558071136, -0.10415653884410858, -0.0899798721075058, -0.07580321282148361, -0.061626553535461426, -0.04744989052414894, -0.033273227512836456, -0.019096560776233673, -0.004919897764921188, 0.009256765246391296, 0.02343343198299408, 0.037610091269016266, 0.05178675800561905, 0.06596342474222183, 0.08014008402824402, 0.0943167507648468, 0.10849341750144958, 0.12267007678747177, 0.13684675097465515, 0.15102340281009674, 0.16520006954669952]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 6.0, 4.0, 5.0, 8.0, 5.0, 9.0, 17.0, 29.0, 26.0, 57.0, 54.0, 76.0, 84.0, 99.0, 102.0, 97.0, 84.0, 69.0, 56.0, 26.0, 22.0, 16.0, 18.0, 3.0, 10.0, 3.0, 4.0, 4.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.058924734592437744, -0.05648486316204071, -0.05404499173164368, -0.051605116575956345, -0.04916524514555931, -0.04672537371516228, -0.044285498559474945, -0.04184562712907791, -0.03940575569868088, -0.036965884268283844, -0.03452601283788681, -0.03208613768219948, -0.029646266251802444, -0.02720639482140541, -0.024766521528363228, -0.022326648235321045, -0.01988677680492401, -0.017446905374526978, -0.015007032081484795, -0.012567159719765186, -0.010127287358045578, -0.00768741499632597, -0.005247542634606361, -0.0028076693415641785, -0.0003677979111671448, 0.0020720744505524635, 0.004511946812272072, 0.00695181917399168, 0.009391691535711288, 0.011831563897430897, 0.014271436259150505, 0.016711309552192688, 0.01915118098258972, 0.021591052412986755, 0.02403092570602894, 0.02647079899907112, 0.028910670429468155, 0.03135054185986519, 0.03379041701555252, 0.036230288445949554, 0.03867015987634659, 0.04111003130674362, 0.043549902737140656, 0.04598977789282799, 0.04842964932322502, 0.050869520753622055, 0.05330939590930939, 0.05574926733970642, 0.058189138770103455, 0.06062901020050049, 0.06306888163089752, 0.06550875306129456, 0.06794862449169159, 0.07038850337266922, 0.07282837480306625, 0.07526824623346329, 0.07770811766386032, 0.08014798909425735, 0.08258786052465439, 0.08502773195505142, 0.08746761083602905, 0.08990748226642609, 0.09234735369682312, 0.09478722512722015, 0.09722709655761719]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 2.0, 6.0, 6.0, 4.0, 8.0, 6.0, 8.0, 14.0, 12.0, 14.0, 24.0, 24.0, 10.0, 32.0, 36.0, 50794.0, 4143032.0, 42.0, 42.0, 14.0, 24.0, 6.0, 10.0, 22.0, 20.0, 14.0, 4.0, 8.0, 2.0, 8.0, 6.0, 0.0, 0.0, 6.0, 4.0, 0.0, 4.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0], "bins": [-1.748046875, -1.6934661865234375, -1.638885498046875, -1.5843048095703125, -1.52972412109375, -1.4751434326171875, -1.420562744140625, -1.3659820556640625, -1.3114013671875, -1.2568206787109375, -1.202239990234375, -1.1476593017578125, -1.09307861328125, -1.0384979248046875, -0.983917236328125, -0.9293365478515625, -0.874755859375, -0.8201751708984375, -0.765594482421875, -0.7110137939453125, -0.65643310546875, -0.6018524169921875, -0.547271728515625, -0.4926910400390625, -0.4381103515625, -0.3835296630859375, -0.328948974609375, -0.2743682861328125, -0.21978759765625, -0.1652069091796875, -0.110626220703125, -0.0560455322265625, -0.00146484375, 0.0531158447265625, 0.107696533203125, 0.1622772216796875, 0.21685791015625, 0.2714385986328125, 0.326019287109375, 0.3805999755859375, 0.4351806640625, 0.4897613525390625, 0.544342041015625, 0.5989227294921875, 0.65350341796875, 0.7080841064453125, 0.762664794921875, 0.8172454833984375, 0.871826171875, 0.9264068603515625, 0.980987548828125, 1.0355682373046875, 1.09014892578125, 1.1447296142578125, 1.199310302734375, 1.2538909912109375, 1.3084716796875, 1.3630523681640625, 1.417633056640625, 1.4722137451171875, 1.52679443359375, 1.5813751220703125, 1.635955810546875, 1.6905364990234375, 1.7451171875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 3.0, 4.0, 4.0, 2.0, 6.0, 12.0, 9.0, 5.0, 7.0, 18.0, 25.0, 38.0, 103.0, 190.0, 207.0, 148.0, 72.0, 33.0, 31.0, 4.0, 9.0, 11.0, 5.0, 7.0, 5.0, 13.0, 4.0, 1.0, 2.0, 2.0, 8.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0015239715576171875, -0.0014755427837371826, -0.0014271140098571777, -0.0013786852359771729, -0.001330256462097168, -0.001281827688217163, -0.0012333989143371582, -0.0011849701404571533, -0.0011365413665771484, -0.0010881125926971436, -0.0010396838188171387, -0.0009912550449371338, -0.0009428262710571289, -0.000894397497177124, -0.0008459687232971191, -0.0007975399494171143, -0.0007491111755371094, -0.0007006824016571045, -0.0006522536277770996, -0.0006038248538970947, -0.0005553960800170898, -0.000506967306137085, -0.0004585385322570801, -0.0004101097583770752, -0.0003616809844970703, -0.00031325221061706543, -0.00026482343673706055, -0.00021639466285705566, -0.00016796588897705078, -0.0001195371150970459, -7.110834121704102e-05, -2.2679567337036133e-05, 2.574920654296875e-05, 7.417798042297363e-05, 0.00012260675430297852, 0.0001710355281829834, 0.00021946430206298828, 0.00026789307594299316, 0.00031632184982299805, 0.00036475062370300293, 0.0004131793975830078, 0.0004616081714630127, 0.0005100369453430176, 0.0005584657192230225, 0.0006068944931030273, 0.0006553232669830322, 0.0007037520408630371, 0.000752180814743042, 0.0008006095886230469, 0.0008490383625030518, 0.0008974671363830566, 0.0009458959102630615, 0.0009943246841430664, 0.0010427534580230713, 0.0010911822319030762, 0.001139611005783081, 0.001188039779663086, 0.0012364685535430908, 0.0012848973274230957, 0.0013333261013031006, 0.0013817548751831055, 0.0014301836490631104, 0.0014786124229431152, 0.0015270411968231201, 0.001575469970703125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 3.0, 1.0, 7.0, 5.0, 14.0, 11.0, 20.0, 22.0, 54.0, 94.0, 230.0, 2057.0, 4190836.0, 587.0, 146.0, 85.0, 42.0, 24.0, 20.0, 7.0, 9.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.80908203125, -0.7899398803710938, -0.7707977294921875, -0.7516555786132812, -0.732513427734375, -0.7133712768554688, -0.6942291259765625, -0.6750869750976562, -0.65594482421875, -0.6368026733398438, -0.6176605224609375, -0.5985183715820312, -0.579376220703125, -0.5602340698242188, -0.5410919189453125, -0.5219497680664062, -0.5028076171875, -0.48366546630859375, -0.4645233154296875, -0.44538116455078125, -0.426239013671875, -0.40709686279296875, -0.3879547119140625, -0.36881256103515625, -0.34967041015625, -0.33052825927734375, -0.3113861083984375, -0.29224395751953125, -0.273101806640625, -0.25395965576171875, -0.2348175048828125, -0.21567535400390625, -0.196533203125, -0.17739105224609375, -0.1582489013671875, -0.13910675048828125, -0.119964599609375, -0.10082244873046875, -0.0816802978515625, -0.06253814697265625, -0.04339599609375, -0.02425384521484375, -0.0051116943359375, 0.01403045654296875, 0.033172607421875, 0.05231475830078125, 0.0714569091796875, 0.09059906005859375, 0.1097412109375, 0.12888336181640625, 0.1480255126953125, 0.16716766357421875, 0.186309814453125, 0.20545196533203125, 0.2245941162109375, 0.24373626708984375, 0.26287841796875, 0.28202056884765625, 0.3011627197265625, 0.32030487060546875, 0.339447021484375, 0.35858917236328125, 0.3777313232421875, 0.39687347412109375, 0.416015625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 9.0, 10.0, 22.0, 29.0, 106.0, 311.0, 2361.0, 930.0, 207.0, 55.0, 22.0, 11.0, 5.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.019012451171875, -0.018645524978637695, -0.01827859878540039, -0.017911672592163086, -0.01754474639892578, -0.017177820205688477, -0.016810894012451172, -0.016443967819213867, -0.016077041625976562, -0.015710115432739258, -0.015343189239501953, -0.014976263046264648, -0.014609336853027344, -0.014242410659790039, -0.013875484466552734, -0.01350855827331543, -0.013141632080078125, -0.01277470588684082, -0.012407779693603516, -0.012040853500366211, -0.011673927307128906, -0.011307001113891602, -0.010940074920654297, -0.010573148727416992, -0.010206222534179688, -0.009839296340942383, -0.009472370147705078, -0.009105443954467773, -0.008738517761230469, -0.008371591567993164, -0.00800466537475586, -0.007637739181518555, -0.00727081298828125, -0.006903886795043945, -0.006536960601806641, -0.006170034408569336, -0.005803108215332031, -0.0054361820220947266, -0.005069255828857422, -0.004702329635620117, -0.0043354034423828125, -0.003968477249145508, -0.003601551055908203, -0.0032346248626708984, -0.0028676986694335938, -0.002500772476196289, -0.0021338462829589844, -0.0017669200897216797, -0.001399993896484375, -0.0010330677032470703, -0.0006661415100097656, -0.00029921531677246094, 6.771087646484375e-05, 0.00043463706970214844, 0.0008015632629394531, 0.0011684894561767578, 0.0015354156494140625, 0.0019023418426513672, 0.002269268035888672, 0.0026361942291259766, 0.0030031204223632812, 0.003370046615600586, 0.0037369728088378906, 0.004103899002075195, 0.0044708251953125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 325.0, 693.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9341109991073608, -1.898314356803894, -1.8625178337097168, -1.82672119140625, -1.7909245491027832, -1.755128026008606, -1.7193313837051392, -1.683534860610962, -1.6477382183074951, -1.6119415760040283, -1.576145052909851, -1.5403484106063843, -1.504551887512207, -1.4687552452087402, -1.4329586029052734, -1.3971619606018066, -1.3613654375076294, -1.3255687952041626, -1.2897722721099854, -1.2539756298065186, -1.2181789875030518, -1.1823824644088745, -1.1465858221054077, -1.1107892990112305, -1.0749926567077637, -1.0391960144042969, -1.0033994913101196, -0.9676028490066528, -0.9318062663078308, -0.8960096836090088, -0.860213041305542, -0.82441645860672, -0.7886199951171875, -0.7528234124183655, -0.7170268297195435, -0.6812301874160767, -0.6454336047172546, -0.6096370220184326, -0.5738403797149658, -0.5380437970161438, -0.5022472143173218, -0.46645063161849976, -0.43065401911735535, -0.39485740661621094, -0.3590608239173889, -0.3232642412185669, -0.2874676287174225, -0.2516710162162781, -0.21587443351745605, -0.18007783591747284, -0.14428123831748962, -0.10848464071750641, -0.0726880431175232, -0.03689144551753998, -0.0010948479175567627, 0.034701764583587646, 0.07049834728240967, 0.10629494488239288, 0.1420915424823761, 0.17788814008235931, 0.21368473768234253, 0.24948133528232574, 0.28527793288230896, 0.32107454538345337, 0.3568711280822754]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 15.0, 22.0, 86.0, 212.0, 283.0, 210.0, 119.0, 43.0, 20.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.39581185579299927, -0.3881129026412964, -0.3804139196872711, -0.37271496653556824, -0.36501598358154297, -0.3573170304298401, -0.3496180772781372, -0.34191909432411194, -0.33422014117240906, -0.3265211880207062, -0.3188222050666809, -0.311123251914978, -0.30342426896095276, -0.2957253158092499, -0.2880263328552246, -0.28032737970352173, -0.27262842655181885, -0.26492947340011597, -0.2572304904460907, -0.24953153729438782, -0.24183256924152374, -0.23413360118865967, -0.2264346331357956, -0.21873566508293152, -0.21103668212890625, -0.20333771407604218, -0.1956387460231781, -0.18793979287147522, -0.18024082481861115, -0.17254185676574707, -0.164842888712883, -0.15714392066001892, -0.14944496750831604, -0.14174599945545197, -0.1340470314025879, -0.126348078250885, -0.11864911019802094, -0.11095014214515686, -0.10325117409229279, -0.09555220603942871, -0.08785324543714523, -0.08015427738428116, -0.07245531678199768, -0.0647563487291336, -0.05705738440155983, -0.04935842007398605, -0.04165945202112198, -0.0339604876935482, -0.026261523365974426, -0.01856255903840065, -0.010863592848181725, -0.003164626657962799, 0.004534337669610977, 0.012233301997184753, 0.019932270050048828, 0.027631234377622604, 0.03533019870519638, 0.04302916303277016, 0.05072812736034393, 0.05842709541320801, 0.06612606346607208, 0.07382502406835556, 0.08152399212121964, 0.08922295272350311, 0.09692192077636719]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 5.0, 12.0, 12.0, 15.0, 18.0, 15.0, 26.0, 24.0, 47.0, 42.0, 51.0, 52.0, 64.0, 73.0, 77459.0, 970172.0, 99.0, 53.0, 47.0, 40.0, 38.0, 29.0, 27.0, 18.0, 28.0, 18.0, 15.0, 12.0, 10.0, 5.0, 2.0, 4.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.36572265625, -0.3539581298828125, -0.342193603515625, -0.3304290771484375, -0.31866455078125, -0.3069000244140625, -0.295135498046875, -0.2833709716796875, -0.2716064453125, -0.2598419189453125, -0.248077392578125, -0.2363128662109375, -0.22454833984375, -0.2127838134765625, -0.201019287109375, -0.1892547607421875, -0.177490234375, -0.1657257080078125, -0.153961181640625, -0.1421966552734375, -0.13043212890625, -0.1186676025390625, -0.106903076171875, -0.0951385498046875, -0.0833740234375, -0.0716094970703125, -0.059844970703125, -0.0480804443359375, -0.03631591796875, -0.0245513916015625, -0.012786865234375, -0.0010223388671875, 0.0107421875, 0.0225067138671875, 0.034271240234375, 0.0460357666015625, 0.05780029296875, 0.0695648193359375, 0.081329345703125, 0.0930938720703125, 0.1048583984375, 0.1166229248046875, 0.128387451171875, 0.1401519775390625, 0.15191650390625, 0.1636810302734375, 0.175445556640625, 0.1872100830078125, 0.198974609375, 0.2107391357421875, 0.222503662109375, 0.2342681884765625, 0.24603271484375, 0.2577972412109375, 0.269561767578125, 0.2813262939453125, 0.2930908203125, 0.3048553466796875, 0.316619873046875, 0.3283843994140625, 0.34014892578125, 0.3519134521484375, 0.363677978515625, 0.3754425048828125, 0.38720703125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 84.0, 689.0, 235.0, 12.0], "bins": [-0.08319091796875, -0.08184072375297546, -0.08049052953720093, -0.07914033532142639, -0.07779014110565186, -0.07643994688987732, -0.07508975267410278, -0.07373955845832825, -0.07238936424255371, -0.07103917002677917, -0.06968897581100464, -0.0683387815952301, -0.06698858737945557, -0.06563839316368103, -0.0642881989479065, -0.06293800473213196, -0.06158781051635742, -0.060237616300582886, -0.05888742208480835, -0.057537227869033813, -0.05618703365325928, -0.05483683943748474, -0.053486645221710205, -0.05213645100593567, -0.05078625679016113, -0.0494360625743866, -0.04808586835861206, -0.046735674142837524, -0.04538547992706299, -0.04403528571128845, -0.042685091495513916, -0.04133489727973938, -0.039984703063964844, -0.03863450884819031, -0.03728431463241577, -0.035934120416641235, -0.0345839262008667, -0.03323373198509216, -0.03188353776931763, -0.03053334355354309, -0.029183149337768555, -0.02783295512199402, -0.026482760906219482, -0.025132566690444946, -0.02378237247467041, -0.022432178258895874, -0.021081984043121338, -0.019731789827346802, -0.018381595611572266, -0.01703140139579773, -0.015681207180023193, -0.014331012964248657, -0.012980818748474121, -0.011630624532699585, -0.010280430316925049, -0.008930236101150513, -0.0075800418853759766, -0.00622984766960144, -0.004879653453826904, -0.003529459238052368, -0.002179265022277832, -0.0008290708065032959, 0.0005211234092712402, 0.0018713176250457764, 0.0032215118408203125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 1.0, 2.0, 6.0, 7.0, 8.0, 11.0, 12.0, 12.0, 17.0, 28.0, 53.0, 72.0, 99.0, 184.0, 543.0, 3334.0, 76045.0, 943129.0, 22474.0, 1681.0, 392.0, 154.0, 101.0, 50.0, 34.0, 29.0, 25.0, 14.0, 8.0, 8.0, 8.0, 2.0, 2.0, 6.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.164306640625, -0.1585102081298828, -0.15271377563476562, -0.14691734313964844, -0.14112091064453125, -0.13532447814941406, -0.12952804565429688, -0.12373161315917969, -0.1179351806640625, -0.11213874816894531, -0.10634231567382812, -0.10054588317871094, -0.09474945068359375, -0.08895301818847656, -0.08315658569335938, -0.07736015319824219, -0.071563720703125, -0.06576728820800781, -0.059970855712890625, -0.05417442321777344, -0.04837799072265625, -0.04258155822753906, -0.036785125732421875, -0.030988693237304688, -0.0251922607421875, -0.019395828247070312, -0.013599395751953125, -0.0078029632568359375, -0.00200653076171875, 0.0037899017333984375, 0.009586334228515625, 0.015382766723632812, 0.02117919921875, 0.026975631713867188, 0.032772064208984375, 0.03856849670410156, 0.04436492919921875, 0.05016136169433594, 0.055957794189453125, 0.06175422668457031, 0.0675506591796875, 0.07334709167480469, 0.07914352416992188, 0.08493995666503906, 0.09073638916015625, 0.09653282165527344, 0.10232925415039062, 0.10812568664550781, 0.113922119140625, 0.11971855163574219, 0.12551498413085938, 0.13131141662597656, 0.13710784912109375, 0.14290428161621094, 0.14870071411132812, 0.1544971466064453, 0.1602935791015625, 0.1660900115966797, 0.17188644409179688, 0.17768287658691406, 0.18347930908203125, 0.18927574157714844, 0.19507217407226562, 0.2008686065673828, 0.2066650390625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 5.0, 1.0, 2.0, 1.0, 6.0, 9.0, 9.0, 18.0, 15.0, 21.0, 16.0, 30.0, 43.0, 46.0, 47.0, 71.0, 58.0, 69.0, 72.0, 81.0, 73.0, 57.0, 49.0, 43.0, 41.0, 28.0, 25.0, 20.0, 12.0, 16.0, 5.0, 3.0, 9.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.060150146484375, -0.05810213088989258, -0.056054115295410156, -0.054006099700927734, -0.05195808410644531, -0.04991006851196289, -0.04786205291748047, -0.04581403732299805, -0.043766021728515625, -0.0417180061340332, -0.03966999053955078, -0.03762197494506836, -0.03557395935058594, -0.033525943756103516, -0.031477928161621094, -0.029429912567138672, -0.02738189697265625, -0.025333881378173828, -0.023285865783691406, -0.021237850189208984, -0.019189834594726562, -0.01714181900024414, -0.015093803405761719, -0.013045787811279297, -0.010997772216796875, -0.008949756622314453, -0.006901741027832031, -0.004853725433349609, -0.0028057098388671875, -0.0007576942443847656, 0.0012903213500976562, 0.003338336944580078, 0.0053863525390625, 0.007434368133544922, 0.009482383728027344, 0.011530399322509766, 0.013578414916992188, 0.01562643051147461, 0.01767444610595703, 0.019722461700439453, 0.021770477294921875, 0.023818492889404297, 0.02586650848388672, 0.02791452407836914, 0.029962539672851562, 0.032010555267333984, 0.034058570861816406, 0.03610658645629883, 0.03815460205078125, 0.04020261764526367, 0.042250633239746094, 0.044298648834228516, 0.04634666442871094, 0.04839468002319336, 0.05044269561767578, 0.0524907112121582, 0.054538726806640625, 0.05658674240112305, 0.05863475799560547, 0.06068277359008789, 0.06273078918457031, 0.06477880477905273, 0.06682682037353516, 0.06887483596801758, 0.0709228515625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 4.0, 4.0, 9.0, 17.0, 20.0, 13.0, 19.0, 42.0, 89.0, 190.0, 447.0, 2209.0, 28252.0, 1001363.0, 13758.0, 1420.0, 338.0, 149.0, 69.0, 40.0, 27.0, 17.0, 13.0, 8.0, 10.0, 4.0, 9.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.29931640625, -0.29131126403808594, -0.2833061218261719, -0.2753009796142578, -0.26729583740234375, -0.2592906951904297, -0.2512855529785156, -0.24328041076660156, -0.2352752685546875, -0.22727012634277344, -0.21926498413085938, -0.2112598419189453, -0.20325469970703125, -0.1952495574951172, -0.18724441528320312, -0.17923927307128906, -0.171234130859375, -0.16322898864746094, -0.15522384643554688, -0.1472187042236328, -0.13921356201171875, -0.1312084197998047, -0.12320327758789062, -0.11519813537597656, -0.1071929931640625, -0.09918785095214844, -0.09118270874023438, -0.08317756652832031, -0.07517242431640625, -0.06716728210449219, -0.059162139892578125, -0.05115699768066406, -0.04315185546875, -0.03514671325683594, -0.027141571044921875, -0.019136428833007812, -0.01113128662109375, -0.0031261444091796875, 0.004878997802734375, 0.012884140014648438, 0.0208892822265625, 0.028894424438476562, 0.036899566650390625, 0.04490470886230469, 0.05290985107421875, 0.06091499328613281, 0.06892013549804688, 0.07692527770996094, 0.084930419921875, 0.09293556213378906, 0.10094070434570312, 0.10894584655761719, 0.11695098876953125, 0.12495613098144531, 0.13296127319335938, 0.14096641540527344, 0.1489715576171875, 0.15697669982910156, 0.16498184204101562, 0.1729869842529297, 0.18099212646484375, 0.1889972686767578, 0.19700241088867188, 0.20500755310058594, 0.2130126953125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 5.0, 3.0, 9.0, 11.0, 6.0, 19.0, 15.0, 44.0, 49.0, 73.0, 104.0, 112.0, 126.0, 142.0, 75.0, 61.0, 35.0, 26.0, 18.0, 12.0, 14.0, 4.0, 3.0, 10.0, 7.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3589859008789062e-05, -1.308973878622055e-05, -1.2589618563652039e-05, -1.2089498341083527e-05, -1.1589378118515015e-05, -1.1089257895946503e-05, -1.058913767337799e-05, -1.0089017450809479e-05, -9.588897228240967e-06, -9.088777005672455e-06, -8.588656783103943e-06, -8.088536560535431e-06, -7.588416337966919e-06, -7.088296115398407e-06, -6.588175892829895e-06, -6.088055670261383e-06, -5.587935447692871e-06, -5.087815225124359e-06, -4.587695002555847e-06, -4.087574779987335e-06, -3.5874545574188232e-06, -3.0873343348503113e-06, -2.5872141122817993e-06, -2.0870938897132874e-06, -1.5869736671447754e-06, -1.0868534445762634e-06, -5.867332220077515e-07, -8.66129994392395e-08, 4.1350722312927246e-07, 9.136274456977844e-07, 1.4137476682662964e-06, 1.9138678908348083e-06, 2.4139881134033203e-06, 2.9141083359718323e-06, 3.4142285585403442e-06, 3.914348781108856e-06, 4.414469003677368e-06, 4.91458922624588e-06, 5.414709448814392e-06, 5.914829671382904e-06, 6.414949893951416e-06, 6.915070116519928e-06, 7.41519033908844e-06, 7.915310561656952e-06, 8.415430784225464e-06, 8.915551006793976e-06, 9.415671229362488e-06, 9.915791451931e-06, 1.0415911674499512e-05, 1.0916031897068024e-05, 1.1416152119636536e-05, 1.1916272342205048e-05, 1.241639256477356e-05, 1.2916512787342072e-05, 1.3416633009910583e-05, 1.3916753232479095e-05, 1.4416873455047607e-05, 1.491699367761612e-05, 1.541711390018463e-05, 1.5917234122753143e-05, 1.6417354345321655e-05, 1.6917474567890167e-05, 1.741759479045868e-05, 1.791771501302719e-05, 1.8417835235595703e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 3.0, 4.0, 2.0, 7.0, 8.0, 7.0, 15.0, 15.0, 23.0, 57.0, 128.0, 425.0, 2649.0, 998172.0, 44887.0, 1597.0, 294.0, 123.0, 61.0, 20.0, 15.0, 18.0, 6.0, 8.0, 7.0, 6.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.80126953125, -0.7776107788085938, -0.7539520263671875, -0.7302932739257812, -0.706634521484375, -0.6829757690429688, -0.6593170166015625, -0.6356582641601562, -0.61199951171875, -0.5883407592773438, -0.5646820068359375, -0.5410232543945312, -0.517364501953125, -0.49370574951171875, -0.4700469970703125, -0.44638824462890625, -0.4227294921875, -0.39907073974609375, -0.3754119873046875, -0.35175323486328125, -0.328094482421875, -0.30443572998046875, -0.2807769775390625, -0.25711822509765625, -0.23345947265625, -0.20980072021484375, -0.1861419677734375, -0.16248321533203125, -0.138824462890625, -0.11516571044921875, -0.0915069580078125, -0.06784820556640625, -0.044189453125, -0.02053070068359375, 0.0031280517578125, 0.02678680419921875, 0.050445556640625, 0.07410430908203125, 0.0977630615234375, 0.12142181396484375, 0.14508056640625, 0.16873931884765625, 0.1923980712890625, 0.21605682373046875, 0.239715576171875, 0.26337432861328125, 0.2870330810546875, 0.31069183349609375, 0.3343505859375, 0.35800933837890625, 0.3816680908203125, 0.40532684326171875, 0.428985595703125, 0.45264434814453125, 0.4763031005859375, 0.49996185302734375, 0.52362060546875, 0.5472793579101562, 0.5709381103515625, 0.5945968627929688, 0.618255615234375, 0.6419143676757812, 0.6655731201171875, 0.6892318725585938, 0.712890625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 8.0, 12.0, 27.0, 91.0, 607.0, 168.0, 41.0, 14.0, 7.0, 4.0, 4.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.186767578125, -0.17814254760742188, -0.16951751708984375, -0.16089248657226562, -0.1522674560546875, -0.14364242553710938, -0.13501739501953125, -0.12639236450195312, -0.117767333984375, -0.10914230346679688, -0.10051727294921875, -0.09189224243164062, -0.0832672119140625, -0.07464218139648438, -0.06601715087890625, -0.057392120361328125, -0.04876708984375, -0.040142059326171875, -0.03151702880859375, -0.022891998291015625, -0.0142669677734375, -0.005641937255859375, 0.00298309326171875, 0.011608123779296875, 0.020233154296875, 0.028858184814453125, 0.03748321533203125, 0.046108245849609375, 0.0547332763671875, 0.06335830688476562, 0.07198333740234375, 0.08060836791992188, 0.0892333984375, 0.09785842895507812, 0.10648345947265625, 0.11510848999023438, 0.1237335205078125, 0.13235855102539062, 0.14098358154296875, 0.14960861206054688, 0.158233642578125, 0.16685867309570312, 0.17548370361328125, 0.18410873413085938, 0.1927337646484375, 0.20135879516601562, 0.20998382568359375, 0.21860885620117188, 0.22723388671875, 0.23585891723632812, 0.24448394775390625, 0.2531089782714844, 0.2617340087890625, 0.2703590393066406, 0.27898406982421875, 0.2876091003417969, 0.296234130859375, 0.3048591613769531, 0.31348419189453125, 0.3221092224121094, 0.3307342529296875, 0.3393592834472656, 0.34798431396484375, 0.3566093444824219, 0.365234375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 41.0, 945.0, 25.0, 4.0, 3.0], "bins": [-11.769240379333496, -11.573806762695312, -11.378374099731445, -11.182940483093262, -10.987507820129395, -10.792074203491211, -10.596641540527344, -10.40120792388916, -10.205775260925293, -10.01034164428711, -9.814908981323242, -9.619475364685059, -9.424042701721191, -9.228609085083008, -9.03317642211914, -8.837742805480957, -8.64231014251709, -8.446876525878906, -8.251443862915039, -8.056010246276855, -7.860577583312988, -7.665144443511963, -7.4697113037109375, -7.274278163909912, -7.0788445472717285, -6.883411407470703, -6.687978267669678, -6.492545127868652, -6.297111988067627, -6.101678848266602, -5.906245708465576, -5.710812568664551, -5.515379428863525, -5.3199462890625, -5.124513149261475, -4.929080009460449, -4.733646869659424, -4.538213729858398, -4.342780590057373, -4.147347450256348, -3.9519143104553223, -3.756481170654297, -3.5610480308532715, -3.365614891052246, -3.1701817512512207, -2.9747486114501953, -2.77931547164917, -2.5838823318481445, -2.388449192047119, -2.1930160522460938, -1.9975829124450684, -1.802149772644043, -1.6067166328430176, -1.4112834930419922, -1.2158502340316772, -1.0204170942306519, -0.8249838352203369, -0.6295506954193115, -0.43411752581596375, -0.23868435621261597, -0.043251216411590576, 0.15218192338943481, 0.347615122795105, 0.5430482625961304, 0.7384814023971558]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 12.0, 19.0, 51.0, 72.0, 126.0, 155.0, 159.0, 146.0, 100.0, 80.0, 44.0, 24.0, 16.0, 4.0, 0.0, 3.0, 1.0], "bins": [-2.0967516899108887, -2.058851718902588, -2.020951747894287, -1.9830516576766968, -1.9451515674591064, -1.9072515964508057, -1.8693515062332153, -1.8314515352249146, -1.7935514450073242, -1.7556514739990234, -1.717751383781433, -1.6798514127731323, -1.641951322555542, -1.6040513515472412, -1.5661512613296509, -1.52825129032135, -1.4903513193130493, -1.4524513483047485, -1.4145512580871582, -1.3766512870788574, -1.338751196861267, -1.3008512258529663, -1.262951135635376, -1.2250511646270752, -1.1871511936187744, -1.1492512226104736, -1.1113511323928833, -1.0734511613845825, -1.0355510711669922, -0.9976511001586914, -0.9597510695457458, -0.9218510389328003, -0.8839510083198547, -0.8460509777069092, -0.8081509470939636, -0.7702509164810181, -0.7323509454727173, -0.694450855255127, -0.6565508842468262, -0.6186508536338806, -0.5807508230209351, -0.5428507924079895, -0.504950761795044, -0.4670507609844208, -0.4291507303714752, -0.39125069975852966, -0.3533506989479065, -0.31545066833496094, -0.2775506377220154, -0.23965060710906982, -0.20175059139728546, -0.1638505756855011, -0.12595054507255554, -0.08805051445960999, -0.05015049874782562, -0.01225048303604126, 0.025649547576904297, 0.06354957073926926, 0.10144959390163422, 0.13934960961341858, 0.17724964022636414, 0.2151496708393097, 0.25304967164993286, 0.2909497022628784, 0.328849732875824]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 16.0, 23.0, 42.0, 77.0, 228.0, 770.0, 4184285.0, 8593.0, 205.0, 41.0, 7.0], "bins": [-2.6875, -2.642576217651367, -2.5976524353027344, -2.5527286529541016, -2.5078048706054688, -2.462881088256836, -2.417957305908203, -2.3730335235595703, -2.3281097412109375, -2.2831859588623047, -2.238262176513672, -2.193338394165039, -2.1484146118164062, -2.1034908294677734, -2.0585670471191406, -2.013643264770508, -1.968719482421875, -1.9237957000732422, -1.8788719177246094, -1.8339481353759766, -1.7890243530273438, -1.744100570678711, -1.6991767883300781, -1.6542530059814453, -1.6093292236328125, -1.5644054412841797, -1.5194816589355469, -1.474557876586914, -1.4296340942382812, -1.3847103118896484, -1.3397865295410156, -1.2948627471923828, -1.24993896484375, -1.2050151824951172, -1.1600914001464844, -1.1151676177978516, -1.0702438354492188, -1.025320053100586, -0.9803962707519531, -0.9354724884033203, -0.8905487060546875, -0.8456249237060547, -0.8007011413574219, -0.7557773590087891, -0.7108535766601562, -0.6659297943115234, -0.6210060119628906, -0.5760822296142578, -0.531158447265625, -0.4862346649169922, -0.4413108825683594, -0.39638710021972656, -0.35146331787109375, -0.30653953552246094, -0.2616157531738281, -0.2166919708251953, -0.1717681884765625, -0.1268444061279297, -0.08192062377929688, -0.03699684143066406, 0.00792694091796875, 0.05285072326660156, 0.09777450561523438, 0.1426982879638672, 0.1876220703125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 19.0, 81.0, 274.0, 388.0, 179.0, 60.0, 16.0], "bins": [-0.09686279296875, -0.09525567293167114, -0.09364855289459229, -0.09204143285751343, -0.09043431282043457, -0.08882719278335571, -0.08722007274627686, -0.085612952709198, -0.08400583267211914, -0.08239871263504028, -0.08079159259796143, -0.07918447256088257, -0.07757735252380371, -0.07597023248672485, -0.074363112449646, -0.07275599241256714, -0.07114887237548828, -0.06954175233840942, -0.06793463230133057, -0.06632751226425171, -0.06472039222717285, -0.063113272190094, -0.06150615215301514, -0.05989903211593628, -0.05829191207885742, -0.056684792041778564, -0.05507767200469971, -0.05347055196762085, -0.05186343193054199, -0.050256311893463135, -0.04864919185638428, -0.04704207181930542, -0.04543495178222656, -0.043827831745147705, -0.04222071170806885, -0.04061359167098999, -0.03900647163391113, -0.037399351596832275, -0.03579223155975342, -0.03418511152267456, -0.0325779914855957, -0.030970871448516846, -0.02936375141143799, -0.02775663137435913, -0.026149511337280273, -0.024542391300201416, -0.02293527126312256, -0.0213281512260437, -0.019721031188964844, -0.018113911151885986, -0.01650679111480713, -0.014899671077728271, -0.013292551040649414, -0.011685431003570557, -0.0100783109664917, -0.008471190929412842, -0.006864070892333984, -0.005256950855255127, -0.0036498308181762695, -0.002042710781097412, -0.0004355907440185547, 0.0011715292930603027, 0.00277864933013916, 0.004385769367218018, 0.005992889404296875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 13.0, 30.0, 38.0, 60.0, 138.0, 180.0, 255.0, 741.0, 4190456.0, 1728.0, 329.0, 141.0, 87.0, 41.0, 29.0, 10.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.51953125, -2.446746826171875, -2.37396240234375, -2.301177978515625, -2.2283935546875, -2.155609130859375, -2.08282470703125, -2.010040283203125, -1.937255859375, -1.864471435546875, -1.79168701171875, -1.718902587890625, -1.6461181640625, -1.573333740234375, -1.50054931640625, -1.427764892578125, -1.35498046875, -1.282196044921875, -1.20941162109375, -1.136627197265625, -1.0638427734375, -0.991058349609375, -0.91827392578125, -0.845489501953125, -0.772705078125, -0.699920654296875, -0.62713623046875, -0.554351806640625, -0.4815673828125, -0.408782958984375, -0.33599853515625, -0.263214111328125, -0.1904296875, -0.117645263671875, -0.04486083984375, 0.027923583984375, 0.1007080078125, 0.173492431640625, 0.24627685546875, 0.319061279296875, 0.391845703125, 0.464630126953125, 0.53741455078125, 0.610198974609375, 0.6829833984375, 0.755767822265625, 0.82855224609375, 0.901336669921875, 0.97412109375, 1.046905517578125, 1.11968994140625, 1.192474365234375, 1.2652587890625, 1.338043212890625, 1.41082763671875, 1.483612060546875, 1.556396484375, 1.629180908203125, 1.70196533203125, 1.774749755859375, 1.8475341796875, 1.920318603515625, 1.99310302734375, 2.065887451171875, 2.138671875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 5.0, 121.0, 3861.0, 83.0, 10.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51708984375, -0.5068149566650391, -0.4965400695800781, -0.4862651824951172, -0.47599029541015625, -0.4657154083251953, -0.4554405212402344, -0.44516563415527344, -0.4348907470703125, -0.42461585998535156, -0.4143409729003906, -0.4040660858154297, -0.39379119873046875, -0.3835163116455078, -0.3732414245605469, -0.36296653747558594, -0.352691650390625, -0.34241676330566406, -0.3321418762207031, -0.3218669891357422, -0.31159210205078125, -0.3013172149658203, -0.2910423278808594, -0.28076744079589844, -0.2704925537109375, -0.26021766662597656, -0.24994277954101562, -0.2396678924560547, -0.22939300537109375, -0.2191181182861328, -0.20884323120117188, -0.19856834411621094, -0.18829345703125, -0.17801856994628906, -0.16774368286132812, -0.1574687957763672, -0.14719390869140625, -0.1369190216064453, -0.12664413452148438, -0.11636924743652344, -0.1060943603515625, -0.09581947326660156, -0.08554458618164062, -0.07526969909667969, -0.06499481201171875, -0.05471992492675781, -0.044445037841796875, -0.03417015075683594, -0.023895263671875, -0.013620376586914062, -0.003345489501953125, 0.0069293975830078125, 0.01720428466796875, 0.027479171752929688, 0.037754058837890625, 0.04802894592285156, 0.0583038330078125, 0.06857872009277344, 0.07885360717773438, 0.08912849426269531, 0.09940338134765625, 0.10967826843261719, 0.11995315551757812, 0.13022804260253906, 0.1405029296875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 10.0, 686.0, 304.0, 14.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.677498817443848, -6.518243789672852, -6.3589887619018555, -6.199733734130859, -6.040478706359863, -5.881223678588867, -5.721968650817871, -5.562713623046875, -5.403458595275879, -5.244203567504883, -5.084948539733887, -4.925693511962891, -4.7664384841918945, -4.607183456420898, -4.447928428649902, -4.288673400878906, -4.129417896270752, -3.970162868499756, -3.8109078407287598, -3.6516528129577637, -3.4923977851867676, -3.3331427574157715, -3.1738874912261963, -3.0146324634552, -2.855377435684204, -2.696122407913208, -2.536867380142212, -2.377612352371216, -2.2183570861816406, -2.0591020584106445, -1.8998470306396484, -1.7405920028686523, -1.581336498260498, -1.422081470489502, -1.2628264427185059, -1.1035712957382202, -0.9443162679672241, -0.785061240196228, -0.6258061528205872, -0.4665510654449463, -0.3072960376739502, -0.1480409801006317, 0.011214077472686768, 0.17046913504600525, 0.32972419261932373, 0.4889792203903198, 0.6482343077659607, 0.8074893951416016, 0.9667444229125977, 1.1259994506835938, 1.2852544784545898, 1.4445096254348755, 1.6037646532058716, 1.7630196809768677, 1.9222748279571533, 2.0815298557281494, 2.2407848834991455, 2.4000399112701416, 2.5592949390411377, 2.718549966812134, 2.877805233001709, 3.037060260772705, 3.196315288543701, 3.3555703163146973, 3.5148253440856934]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 13.0, 20.0, 28.0, 61.0, 92.0, 145.0, 155.0, 151.0, 126.0, 88.0, 62.0, 37.0, 13.0, 8.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4944888353347778, -1.4473156929016113, -1.4001424312591553, -1.3529691696166992, -1.3057960271835327, -1.2586228847503662, -1.2114496231079102, -1.164276361465454, -1.1171032190322876, -1.069930076599121, -1.022756814956665, -0.9755836129188538, -0.9284104108810425, -0.8812372088432312, -0.8340640068054199, -0.7868908047676086, -0.7397176027297974, -0.6925444006919861, -0.6453711986541748, -0.5981979966163635, -0.5510247945785522, -0.503851592540741, -0.4566783905029297, -0.4095051884651184, -0.36233198642730713, -0.31515878438949585, -0.26798558235168457, -0.2208123803138733, -0.173639178276062, -0.12646597623825073, -0.07929277420043945, -0.032119572162628174, 0.015053749084472656, 0.062226951122283936, 0.10940015316009521, 0.1565733551979065, 0.20374655723571777, 0.25091975927352905, 0.29809296131134033, 0.3452661633491516, 0.3924393653869629, 0.43961256742477417, 0.48678576946258545, 0.5339589715003967, 0.581132173538208, 0.6283053755760193, 0.6754785776138306, 0.7226517796516418, 0.7698249816894531, 0.8169981837272644, 0.8641713857650757, 0.911344587802887, 0.9585177898406982, 1.0056910514831543, 1.0528641939163208, 1.1000373363494873, 1.1472105979919434, 1.1943838596343994, 1.241557002067566, 1.2887301445007324, 1.3359034061431885, 1.3830766677856445, 1.430249810218811, 1.4774229526519775, 1.5245962142944336]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 10.0, 8.0, 14.0, 28.0, 25.0, 36.0, 67.0, 115.0, 263.0, 806.0, 3600.0, 104248.0, 924191.0, 12968.0, 1356.0, 434.0, 165.0, 73.0, 36.0, 32.0, 16.0, 21.0, 6.0, 10.0, 9.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.642578125, -0.6232452392578125, -0.603912353515625, -0.5845794677734375, -0.56524658203125, -0.5459136962890625, -0.526580810546875, -0.5072479248046875, -0.4879150390625, -0.4685821533203125, -0.449249267578125, -0.4299163818359375, -0.41058349609375, -0.3912506103515625, -0.371917724609375, -0.3525848388671875, -0.333251953125, -0.3139190673828125, -0.294586181640625, -0.2752532958984375, -0.25592041015625, -0.2365875244140625, -0.217254638671875, -0.1979217529296875, -0.1785888671875, -0.1592559814453125, -0.139923095703125, -0.1205902099609375, -0.10125732421875, -0.0819244384765625, -0.062591552734375, -0.0432586669921875, -0.02392578125, -0.0045928955078125, 0.014739990234375, 0.0340728759765625, 0.05340576171875, 0.0727386474609375, 0.092071533203125, 0.1114044189453125, 0.1307373046875, 0.1500701904296875, 0.169403076171875, 0.1887359619140625, 0.20806884765625, 0.2274017333984375, 0.246734619140625, 0.2660675048828125, 0.285400390625, 0.3047332763671875, 0.324066162109375, 0.3433990478515625, 0.36273193359375, 0.3820648193359375, 0.401397705078125, 0.4207305908203125, 0.4400634765625, 0.4593963623046875, 0.478729248046875, 0.4980621337890625, 0.51739501953125, 0.5367279052734375, 0.556060791015625, 0.5753936767578125, 0.5947265625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 4.0, 18.0, 40.0, 86.0, 158.0, 223.0, 207.0, 141.0, 75.0, 35.0, 14.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1279296875, -0.12536191940307617, -0.12279415130615234, -0.12022638320922852, -0.11765861511230469, -0.11509084701538086, -0.11252307891845703, -0.1099553108215332, -0.10738754272460938, -0.10481977462768555, -0.10225200653076172, -0.09968423843383789, -0.09711647033691406, -0.09454870223999023, -0.0919809341430664, -0.08941316604614258, -0.08684539794921875, -0.08427762985229492, -0.0817098617553711, -0.07914209365844727, -0.07657432556152344, -0.07400655746459961, -0.07143878936767578, -0.06887102127075195, -0.06630325317382812, -0.0637354850769043, -0.06116771697998047, -0.05859994888305664, -0.05603218078613281, -0.053464412689208984, -0.050896644592285156, -0.04832887649536133, -0.0457611083984375, -0.04319334030151367, -0.040625572204589844, -0.038057804107666016, -0.03549003601074219, -0.03292226791381836, -0.03035449981689453, -0.027786731719970703, -0.025218963623046875, -0.022651195526123047, -0.02008342742919922, -0.01751565933227539, -0.014947891235351562, -0.012380123138427734, -0.009812355041503906, -0.007244586944580078, -0.00467681884765625, -0.002109050750732422, 0.00045871734619140625, 0.0030264854431152344, 0.0055942535400390625, 0.00816202163696289, 0.010729789733886719, 0.013297557830810547, 0.015865325927734375, 0.018433094024658203, 0.02100086212158203, 0.02356863021850586, 0.026136398315429688, 0.028704166412353516, 0.031271934509277344, 0.03383970260620117, 0.036407470703125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 9.0, 4.0, 6.0, 11.0, 14.0, 7.0, 22.0, 23.0, 50.0, 61.0, 81.0, 150.0, 406.0, 1578.0, 15243.0, 881380.0, 143232.0, 4864.0, 793.0, 267.0, 126.0, 67.0, 51.0, 30.0, 26.0, 8.0, 10.0, 9.0, 12.0, 6.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.375, -0.36421966552734375, -0.3534393310546875, -0.34265899658203125, -0.331878662109375, -0.32109832763671875, -0.3103179931640625, -0.29953765869140625, -0.28875732421875, -0.27797698974609375, -0.2671966552734375, -0.25641632080078125, -0.245635986328125, -0.23485565185546875, -0.2240753173828125, -0.21329498291015625, -0.2025146484375, -0.19173431396484375, -0.1809539794921875, -0.17017364501953125, -0.159393310546875, -0.14861297607421875, -0.1378326416015625, -0.12705230712890625, -0.11627197265625, -0.10549163818359375, -0.0947113037109375, -0.08393096923828125, -0.073150634765625, -0.06237030029296875, -0.0515899658203125, -0.04080963134765625, -0.030029296875, -0.01924896240234375, -0.0084686279296875, 0.00231170654296875, 0.013092041015625, 0.02387237548828125, 0.0346527099609375, 0.04543304443359375, 0.05621337890625, 0.06699371337890625, 0.0777740478515625, 0.08855438232421875, 0.099334716796875, 0.11011505126953125, 0.1208953857421875, 0.13167572021484375, 0.1424560546875, 0.15323638916015625, 0.1640167236328125, 0.17479705810546875, 0.185577392578125, 0.19635772705078125, 0.2071380615234375, 0.21791839599609375, 0.22869873046875, 0.23947906494140625, 0.2502593994140625, 0.26103973388671875, 0.271820068359375, 0.28260040283203125, 0.2933807373046875, 0.30416107177734375, 0.31494140625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 7.0, 7.0, 10.0, 14.0, 6.0, 24.0, 23.0, 36.0, 36.0, 34.0, 36.0, 49.0, 65.0, 59.0, 83.0, 69.0, 57.0, 61.0, 61.0, 53.0, 38.0, 32.0, 30.0, 34.0, 15.0, 15.0, 8.0, 13.0, 9.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1400146484375, -0.1360187530517578, -0.13202285766601562, -0.12802696228027344, -0.12403106689453125, -0.12003517150878906, -0.11603927612304688, -0.11204338073730469, -0.1080474853515625, -0.10405158996582031, -0.10005569458007812, -0.09605979919433594, -0.09206390380859375, -0.08806800842285156, -0.08407211303710938, -0.08007621765136719, -0.076080322265625, -0.07208442687988281, -0.06808853149414062, -0.06409263610839844, -0.06009674072265625, -0.05610084533691406, -0.052104949951171875, -0.04810905456542969, -0.0441131591796875, -0.04011726379394531, -0.036121368408203125, -0.03212547302246094, -0.02812957763671875, -0.024133682250976562, -0.020137786865234375, -0.016141891479492188, -0.01214599609375, -0.008150100708007812, -0.004154205322265625, -0.0001583099365234375, 0.00383758544921875, 0.007833480834960938, 0.011829376220703125, 0.015825271606445312, 0.0198211669921875, 0.023817062377929688, 0.027812957763671875, 0.03180885314941406, 0.03580474853515625, 0.03980064392089844, 0.043796539306640625, 0.04779243469238281, 0.051788330078125, 0.05578422546386719, 0.059780120849609375, 0.06377601623535156, 0.06777191162109375, 0.07176780700683594, 0.07576370239257812, 0.07975959777832031, 0.0837554931640625, 0.08775138854980469, 0.09174728393554688, 0.09574317932128906, 0.09973907470703125, 0.10373497009277344, 0.10773086547851562, 0.11172676086425781, 0.11572265625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 2.0, 3.0, 9.0, 4.0, 6.0, 11.0, 13.0, 21.0, 24.0, 35.0, 45.0, 97.0, 126.0, 212.0, 463.0, 939.0, 2423.0, 9458.0, 123884.0, 864822.0, 37343.0, 5290.0, 1713.0, 708.0, 351.0, 188.0, 113.0, 83.0, 53.0, 31.0, 20.0, 13.0, 17.0, 13.0, 2.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0], "bins": [-0.1285400390625, -0.12479496002197266, -0.12104988098144531, -0.11730480194091797, -0.11355972290039062, -0.10981464385986328, -0.10606956481933594, -0.1023244857788086, -0.09857940673828125, -0.0948343276977539, -0.09108924865722656, -0.08734416961669922, -0.08359909057617188, -0.07985401153564453, -0.07610893249511719, -0.07236385345458984, -0.0686187744140625, -0.06487369537353516, -0.06112861633300781, -0.05738353729248047, -0.053638458251953125, -0.04989337921142578, -0.04614830017089844, -0.042403221130371094, -0.03865814208984375, -0.034913063049316406, -0.031167984008789062, -0.02742290496826172, -0.023677825927734375, -0.01993274688720703, -0.016187667846679688, -0.012442588806152344, -0.008697509765625, -0.004952430725097656, -0.0012073516845703125, 0.0025377273559570312, 0.006282806396484375, 0.010027885437011719, 0.013772964477539062, 0.017518043518066406, 0.02126312255859375, 0.025008201599121094, 0.028753280639648438, 0.03249835968017578, 0.036243438720703125, 0.03998851776123047, 0.04373359680175781, 0.047478675842285156, 0.0512237548828125, 0.054968833923339844, 0.05871391296386719, 0.06245899200439453, 0.06620407104492188, 0.06994915008544922, 0.07369422912597656, 0.0774393081665039, 0.08118438720703125, 0.0849294662475586, 0.08867454528808594, 0.09241962432861328, 0.09616470336914062, 0.09990978240966797, 0.10365486145019531, 0.10739994049072266, 0.11114501953125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 7.0, 15.0, 9.0, 16.0, 26.0, 21.0, 32.0, 43.0, 64.0, 66.0, 59.0, 92.0, 105.0, 68.0, 95.0, 65.0, 64.0, 52.0, 30.0, 38.0, 13.0, 9.0, 9.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.47713851928711e-06, -9.141862392425537e-06, -8.806586265563965e-06, -8.471310138702393e-06, -8.13603401184082e-06, -7.800757884979248e-06, -7.465481758117676e-06, -7.1302056312561035e-06, -6.794929504394531e-06, -6.459653377532959e-06, -6.124377250671387e-06, -5.7891011238098145e-06, -5.453824996948242e-06, -5.11854887008667e-06, -4.783272743225098e-06, -4.447996616363525e-06, -4.112720489501953e-06, -3.777444362640381e-06, -3.4421682357788086e-06, -3.1068921089172363e-06, -2.771615982055664e-06, -2.436339855194092e-06, -2.1010637283325195e-06, -1.7657876014709473e-06, -1.430511474609375e-06, -1.0952353477478027e-06, -7.599592208862305e-07, -4.246830940246582e-07, -8.940696716308594e-08, 2.4586915969848633e-07, 5.811452865600586e-07, 9.164214134216309e-07, 1.2516975402832031e-06, 1.5869736671447754e-06, 1.9222497940063477e-06, 2.25752592086792e-06, 2.592802047729492e-06, 2.9280781745910645e-06, 3.2633543014526367e-06, 3.598630428314209e-06, 3.933906555175781e-06, 4.2691826820373535e-06, 4.604458808898926e-06, 4.939734935760498e-06, 5.27501106262207e-06, 5.610287189483643e-06, 5.945563316345215e-06, 6.280839443206787e-06, 6.616115570068359e-06, 6.951391696929932e-06, 7.286667823791504e-06, 7.621943950653076e-06, 7.957220077514648e-06, 8.29249620437622e-06, 8.627772331237793e-06, 8.963048458099365e-06, 9.298324584960938e-06, 9.63360071182251e-06, 9.968876838684082e-06, 1.0304152965545654e-05, 1.0639429092407227e-05, 1.0974705219268799e-05, 1.1309981346130371e-05, 1.1645257472991943e-05, 1.1980533599853516e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 6.0, 7.0, 0.0, 9.0, 17.0, 34.0, 73.0, 187.0, 590.0, 3356.0, 838742.0, 202729.0, 2141.0, 436.0, 127.0, 49.0, 18.0, 16.0, 9.0, 5.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.272705078125, -0.2632713317871094, -0.25383758544921875, -0.24440383911132812, -0.2349700927734375, -0.22553634643554688, -0.21610260009765625, -0.20666885375976562, -0.197235107421875, -0.18780136108398438, -0.17836761474609375, -0.16893386840820312, -0.1595001220703125, -0.15006637573242188, -0.14063262939453125, -0.13119888305664062, -0.12176513671875, -0.11233139038085938, -0.10289764404296875, -0.09346389770507812, -0.0840301513671875, -0.07459640502929688, -0.06516265869140625, -0.055728912353515625, -0.046295166015625, -0.036861419677734375, -0.02742767333984375, -0.017993927001953125, -0.0085601806640625, 0.000873565673828125, 0.01030731201171875, 0.019741058349609375, 0.0291748046875, 0.038608551025390625, 0.04804229736328125, 0.057476043701171875, 0.0669097900390625, 0.07634353637695312, 0.08577728271484375, 0.09521102905273438, 0.104644775390625, 0.11407852172851562, 0.12351226806640625, 0.13294601440429688, 0.1423797607421875, 0.15181350708007812, 0.16124725341796875, 0.17068099975585938, 0.18011474609375, 0.18954849243164062, 0.19898223876953125, 0.20841598510742188, 0.2178497314453125, 0.22728347778320312, 0.23671722412109375, 0.24615097045898438, 0.255584716796875, 0.2650184631347656, 0.27445220947265625, 0.2838859558105469, 0.2933197021484375, 0.3027534484863281, 0.31218719482421875, 0.3216209411621094, 0.3310546875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 5.0, 6.0, 8.0, 25.0, 27.0, 58.0, 129.0, 165.0, 249.0, 137.0, 85.0, 64.0, 23.0, 9.0, 9.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.17578125, -0.17206335067749023, -0.16834545135498047, -0.1646275520324707, -0.16090965270996094, -0.15719175338745117, -0.1534738540649414, -0.14975595474243164, -0.14603805541992188, -0.1423201560974121, -0.13860225677490234, -0.13488435745239258, -0.1311664581298828, -0.12744855880737305, -0.12373065948486328, -0.12001276016235352, -0.11629486083984375, -0.11257696151733398, -0.10885906219482422, -0.10514116287231445, -0.10142326354980469, -0.09770536422729492, -0.09398746490478516, -0.09026956558227539, -0.08655166625976562, -0.08283376693725586, -0.0791158676147461, -0.07539796829223633, -0.07168006896972656, -0.0679621696472168, -0.06424427032470703, -0.060526371002197266, -0.0568084716796875, -0.053090572357177734, -0.04937267303466797, -0.0456547737121582, -0.04193687438964844, -0.03821897506713867, -0.034501075744628906, -0.03078317642211914, -0.027065277099609375, -0.02334737777709961, -0.019629478454589844, -0.015911579132080078, -0.012193679809570312, -0.008475780487060547, -0.004757881164550781, -0.0010399818420410156, 0.00267791748046875, 0.006395816802978516, 0.010113716125488281, 0.013831615447998047, 0.017549514770507812, 0.021267414093017578, 0.024985313415527344, 0.02870321273803711, 0.032421112060546875, 0.03613901138305664, 0.039856910705566406, 0.04357481002807617, 0.04729270935058594, 0.0510106086730957, 0.05472850799560547, 0.058446407318115234, 0.062164306640625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 9.0, 24.0, 126.0, 579.0, 227.0, 31.0, 13.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.020843505859375, -1.9545860290527344, -1.8883285522460938, -1.8220710754394531, -1.7558135986328125, -1.6895561218261719, -1.6232987642288208, -1.5570412874221802, -1.4907838106155396, -1.424526333808899, -1.3582688570022583, -1.2920113801956177, -1.2257540225982666, -1.159496545791626, -1.0932390689849854, -1.0269815921783447, -0.9607241153717041, -0.8944666385650635, -0.8282091617584229, -0.761951744556427, -0.6956942677497864, -0.6294367909431458, -0.5631793737411499, -0.4969218969345093, -0.43066442012786865, -0.364406943321228, -0.2981494963169098, -0.23189203441143036, -0.16563457250595093, -0.0993770956993103, -0.033119648694992065, 0.03313779830932617, 0.0993952751159668, 0.16565273702144623, 0.23191019892692566, 0.2981676459312439, 0.3644251227378845, 0.43068259954452515, 0.4969400465488434, 0.5631974935531616, 0.6294549703598022, 0.6957124471664429, 0.7619699239730835, 0.8282273411750793, 0.89448481798172, 0.9607422947883606, 1.0269997119903564, 1.093257188796997, 1.1595146656036377, 1.2257721424102783, 1.292029619216919, 1.3582870960235596, 1.4245445728302002, 1.4908020496368408, 1.557059407234192, 1.6233168840408325, 1.6895743608474731, 1.7558318376541138, 1.8220893144607544, 1.888346791267395, 1.954604148864746, 2.0208616256713867, 2.0871191024780273, 2.153376579284668, 2.2196340560913086]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 5.0, 4.0, 7.0, 6.0, 9.0, 15.0, 12.0, 13.0, 26.0, 31.0, 39.0, 46.0, 48.0, 52.0, 59.0, 50.0, 66.0, 61.0, 72.0, 61.0, 55.0, 47.0, 40.0, 31.0, 32.0, 27.0, 22.0, 18.0, 13.0, 8.0, 12.0, 5.0, 4.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6824823617935181, -0.6587573289871216, -0.6350323557853699, -0.6113073229789734, -0.5875823497772217, -0.5638573169708252, -0.5401322841644287, -0.516407310962677, -0.4926823079586029, -0.4689573049545288, -0.4452323019504547, -0.4215072989463806, -0.39778226613998413, -0.3740572929382324, -0.35033226013183594, -0.32660725712776184, -0.30288225412368774, -0.27915725111961365, -0.25543224811553955, -0.23170723021030426, -0.20798222720623016, -0.18425722420215607, -0.16053220629692078, -0.13680720329284668, -0.11308220028877258, -0.08935719728469849, -0.06563218683004379, -0.0419071763753891, -0.018182173371315002, 0.005542829632759094, 0.029267847537994385, 0.05299285054206848, 0.07671791315078735, 0.10044291615486145, 0.12416792660951614, 0.14789293706417084, 0.17161794006824493, 0.19534294307231903, 0.21906796097755432, 0.24279296398162842, 0.2665179669857025, 0.2902429699897766, 0.3139679729938507, 0.3376929759979248, 0.3614180088043213, 0.385142982006073, 0.4088680148124695, 0.4325930178165436, 0.4563180208206177, 0.4800430238246918, 0.5037680268287659, 0.5274930596351624, 0.5512180328369141, 0.5749430656433105, 0.598668098449707, 0.6223930716514587, 0.6461180448532104, 0.6698430776596069, 0.6935680508613586, 0.7172930836677551, 0.7410180568695068, 0.7647430896759033, 0.7884681224822998, 0.8121930956840515, 0.835918128490448]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 6.0, 3.0, 3.0, 6.0, 6.0, 2.0, 6.0, 7.0, 5.0, 16.0, 13.0, 12.0, 12.0, 10.0, 25.0, 30.0, 37.0, 33.0, 51.0, 62.0, 92.0, 117.0, 185.0, 267.0, 458.0, 1223.0, 3494.0, 15754.0, 193403.0, 3890538.0, 75851.0, 9378.0, 2137.0, 656.0, 210.0, 103.0, 34.0, 17.0, 17.0, 7.0, 4.0], "bins": [-0.486572265625, -0.4772758483886719, -0.46797943115234375, -0.4586830139160156, -0.4493865966796875, -0.4400901794433594, -0.43079376220703125, -0.4214973449707031, -0.412200927734375, -0.4029045104980469, -0.39360809326171875, -0.3843116760253906, -0.3750152587890625, -0.3657188415527344, -0.35642242431640625, -0.3471260070800781, -0.33782958984375, -0.3285331726074219, -0.31923675537109375, -0.3099403381347656, -0.3006439208984375, -0.2913475036621094, -0.28205108642578125, -0.2727546691894531, -0.263458251953125, -0.2541618347167969, -0.24486541748046875, -0.23556900024414062, -0.2262725830078125, -0.21697616577148438, -0.20767974853515625, -0.19838333129882812, -0.1890869140625, -0.17979049682617188, -0.17049407958984375, -0.16119766235351562, -0.1519012451171875, -0.14260482788085938, -0.13330841064453125, -0.12401199340820312, -0.114715576171875, -0.10541915893554688, -0.09612274169921875, -0.08682632446289062, -0.0775299072265625, -0.06823348999023438, -0.05893707275390625, -0.049640655517578125, -0.04034423828125, -0.031047821044921875, -0.02175140380859375, -0.012454986572265625, -0.0031585693359375, 0.006137847900390625, 0.01543426513671875, 0.024730682373046875, 0.034027099609375, 0.043323516845703125, 0.05261993408203125, 0.061916351318359375, 0.0712127685546875, 0.08050918579101562, 0.08980560302734375, 0.09910202026367188, 0.1083984375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 7.0, 12.0, 40.0, 70.0, 118.0, 183.0, 203.0, 161.0, 100.0, 58.0, 33.0, 19.0, 3.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.1268310546875, -0.1244509220123291, -0.1220707893371582, -0.1196906566619873, -0.1173105239868164, -0.11493039131164551, -0.11255025863647461, -0.11017012596130371, -0.10778999328613281, -0.10540986061096191, -0.10302972793579102, -0.10064959526062012, -0.09826946258544922, -0.09588932991027832, -0.09350919723510742, -0.09112906455993652, -0.08874893188476562, -0.08636879920959473, -0.08398866653442383, -0.08160853385925293, -0.07922840118408203, -0.07684826850891113, -0.07446813583374023, -0.07208800315856934, -0.06970787048339844, -0.06732773780822754, -0.06494760513305664, -0.06256747245788574, -0.060187339782714844, -0.057807207107543945, -0.05542707443237305, -0.05304694175720215, -0.05066680908203125, -0.04828667640686035, -0.04590654373168945, -0.043526411056518555, -0.041146278381347656, -0.03876614570617676, -0.03638601303100586, -0.03400588035583496, -0.03162574768066406, -0.029245615005493164, -0.026865482330322266, -0.024485349655151367, -0.02210521697998047, -0.01972508430480957, -0.017344951629638672, -0.014964818954467773, -0.012584686279296875, -0.010204553604125977, -0.007824420928955078, -0.00544428825378418, -0.0030641555786132812, -0.0006840229034423828, 0.0016961097717285156, 0.004076242446899414, 0.0064563751220703125, 0.008836507797241211, 0.01121664047241211, 0.013596773147583008, 0.015976905822753906, 0.018357038497924805, 0.020737171173095703, 0.0231173038482666, 0.0254974365234375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 9.0, 15.0, 28.0, 49.0, 125.0, 315.0, 1315.0, 4090933.0, 100561.0, 658.0, 164.0, 73.0, 26.0, 8.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.83203125, -2.7753067016601562, -2.7185821533203125, -2.6618576049804688, -2.605133056640625, -2.5484085083007812, -2.4916839599609375, -2.4349594116210938, -2.37823486328125, -2.3215103149414062, -2.2647857666015625, -2.2080612182617188, -2.151336669921875, -2.0946121215820312, -2.0378875732421875, -1.9811630249023438, -1.9244384765625, -1.8677139282226562, -1.8109893798828125, -1.7542648315429688, -1.697540283203125, -1.6408157348632812, -1.5840911865234375, -1.5273666381835938, -1.47064208984375, -1.4139175415039062, -1.3571929931640625, -1.3004684448242188, -1.243743896484375, -1.1870193481445312, -1.1302947998046875, -1.0735702514648438, -1.016845703125, -0.9601211547851562, -0.9033966064453125, -0.8466720581054688, -0.789947509765625, -0.7332229614257812, -0.6764984130859375, -0.6197738647460938, -0.56304931640625, -0.5063247680664062, -0.4496002197265625, -0.39287567138671875, -0.336151123046875, -0.27942657470703125, -0.2227020263671875, -0.16597747802734375, -0.1092529296875, -0.05252838134765625, 0.0041961669921875, 0.06092071533203125, 0.117645263671875, 0.17436981201171875, 0.2310943603515625, 0.28781890869140625, 0.34454345703125, 0.40126800537109375, 0.4579925537109375, 0.5147171020507812, 0.571441650390625, 0.6281661987304688, 0.6848907470703125, 0.7416152954101562, 0.79833984375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 10.0, 8.0, 18.0, 47.0, 220.0, 3307.0, 341.0, 70.0, 26.0, 17.0, 8.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30615234375, -0.30022430419921875, -0.2942962646484375, -0.28836822509765625, -0.282440185546875, -0.27651214599609375, -0.2705841064453125, -0.26465606689453125, -0.25872802734375, -0.25279998779296875, -0.2468719482421875, -0.24094390869140625, -0.235015869140625, -0.22908782958984375, -0.2231597900390625, -0.21723175048828125, -0.2113037109375, -0.20537567138671875, -0.1994476318359375, -0.19351959228515625, -0.187591552734375, -0.18166351318359375, -0.1757354736328125, -0.16980743408203125, -0.16387939453125, -0.15795135498046875, -0.1520233154296875, -0.14609527587890625, -0.140167236328125, -0.13423919677734375, -0.1283111572265625, -0.12238311767578125, -0.116455078125, -0.11052703857421875, -0.1045989990234375, -0.09867095947265625, -0.092742919921875, -0.08681488037109375, -0.0808868408203125, -0.07495880126953125, -0.06903076171875, -0.06310272216796875, -0.0571746826171875, -0.05124664306640625, -0.045318603515625, -0.03939056396484375, -0.0334625244140625, -0.02753448486328125, -0.0216064453125, -0.01567840576171875, -0.0097503662109375, -0.00382232666015625, 0.002105712890625, 0.00803375244140625, 0.0139617919921875, 0.01988983154296875, 0.02581787109375, 0.03174591064453125, 0.0376739501953125, 0.04360198974609375, 0.049530029296875, 0.05545806884765625, 0.0613861083984375, 0.06731414794921875, 0.0732421875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 9.0, 42.0, 555.0, 377.0, 19.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7191885709762573, -0.6472967863082886, -0.5754050612449646, -0.5035132765769958, -0.4316215217113495, -0.3597297668457031, -0.2878379821777344, -0.2159462571144104, -0.14405447244644165, -0.07216271013021469, -0.00027094781398773193, 0.07162082195281982, 0.1435125768184662, 0.21540433168411255, 0.2872961163520813, 0.3591878414154053, 0.431079626083374, 0.5029714107513428, 0.5748631358146667, 0.6467549204826355, 0.7186466455459595, 0.7905384302139282, 0.862430214881897, 0.934321939945221, 1.006213665008545, 1.0781054496765137, 1.1499972343444824, 1.2218890190124512, 1.2937806844711304, 1.3656724691390991, 1.4375642538070679, 1.509455919265747, 1.5813477039337158, 1.6532394886016846, 1.7251312732696533, 1.797023057937622, 1.8689147233963013, 1.94080650806427, 2.012698173522949, 2.084589958190918, 2.1564817428588867, 2.2283735275268555, 2.300265312194824, 2.372157096862793, 2.4440488815307617, 2.5159406661987305, 2.587832450866699, 2.659723997116089, 2.7316160202026367, 2.8035078048706055, 2.875399589538574, 2.947291374206543, 3.0191831588745117, 3.0910749435424805, 3.162966728210449, 3.234858274459839, 3.3067500591278076, 3.3786418437957764, 3.450533628463745, 3.522425413131714, 3.5943171977996826, 3.6662087440490723, 3.738100528717041, 3.8099923133850098, 3.8818840980529785]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 11.0, 7.0, 22.0, 37.0, 45.0, 90.0, 90.0, 111.0, 120.0, 109.0, 86.0, 94.0, 61.0, 52.0, 27.0, 16.0, 9.0, 4.0, 6.0, 1.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8962656259536743, -0.8706783056259155, -0.8450910449028015, -0.8195037841796875, -0.7939164638519287, -0.7683291435241699, -0.7427418828010559, -0.7171546220779419, -0.6915673017501831, -0.6659799814224243, -0.6403927206993103, -0.6148054599761963, -0.5892181396484375, -0.5636308193206787, -0.5380435585975647, -0.5124562978744507, -0.4868689775466919, -0.4612816870212555, -0.4356943964958191, -0.4101071059703827, -0.3845198154449463, -0.3589325249195099, -0.3333452343940735, -0.3077579438686371, -0.2821706533432007, -0.2565833628177643, -0.23099607229232788, -0.20540878176689148, -0.17982149124145508, -0.15423420071601868, -0.12864691019058228, -0.10305961966514587, -0.07747238874435425, -0.05188509821891785, -0.026297807693481445, -0.0007105171680450439, 0.024876773357391357, 0.05046406388282776, 0.07605135440826416, 0.10163864493370056, 0.12722593545913696, 0.15281322598457336, 0.17840051651000977, 0.20398780703544617, 0.22957509756088257, 0.25516238808631897, 0.28074967861175537, 0.3063369691371918, 0.3319242596626282, 0.3575115501880646, 0.383098840713501, 0.4086861312389374, 0.4342734217643738, 0.4598607122898102, 0.4854480028152466, 0.5110353231430054, 0.5366225838661194, 0.5622098445892334, 0.5877971649169922, 0.613384485244751, 0.638971745967865, 0.664559006690979, 0.6901463270187378, 0.7157336473464966, 0.7413209080696106]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 1.0, 4.0, 6.0, 5.0, 10.0, 20.0, 16.0, 19.0, 38.0, 35.0, 53.0, 77.0, 115.0, 194.0, 318.0, 626.0, 1494.0, 5485.0, 30218.0, 465628.0, 503438.0, 31945.0, 5649.0, 1619.0, 662.0, 339.0, 175.0, 104.0, 81.0, 54.0, 33.0, 18.0, 20.0, 16.0, 9.0, 5.0, 7.0, 4.0, 7.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.370361328125, -0.360076904296875, -0.34979248046875, -0.339508056640625, -0.3292236328125, -0.318939208984375, -0.30865478515625, -0.298370361328125, -0.2880859375, -0.277801513671875, -0.26751708984375, -0.257232666015625, -0.2469482421875, -0.236663818359375, -0.22637939453125, -0.216094970703125, -0.205810546875, -0.195526123046875, -0.18524169921875, -0.174957275390625, -0.1646728515625, -0.154388427734375, -0.14410400390625, -0.133819580078125, -0.12353515625, -0.113250732421875, -0.10296630859375, -0.092681884765625, -0.0823974609375, -0.072113037109375, -0.06182861328125, -0.051544189453125, -0.041259765625, -0.030975341796875, -0.02069091796875, -0.010406494140625, -0.0001220703125, 0.010162353515625, 0.02044677734375, 0.030731201171875, 0.041015625, 0.051300048828125, 0.06158447265625, 0.071868896484375, 0.0821533203125, 0.092437744140625, 0.10272216796875, 0.113006591796875, 0.123291015625, 0.133575439453125, 0.14385986328125, 0.154144287109375, 0.1644287109375, 0.174713134765625, 0.18499755859375, 0.195281982421875, 0.20556640625, 0.215850830078125, 0.22613525390625, 0.236419677734375, 0.2467041015625, 0.256988525390625, 0.26727294921875, 0.277557373046875, 0.287841796875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 8.0, 10.0, 11.0, 31.0, 51.0, 81.0, 92.0, 136.0, 147.0, 152.0, 108.0, 76.0, 46.0, 29.0, 15.0, 7.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.12127685546875, -0.11877250671386719, -0.11626815795898438, -0.11376380920410156, -0.11125946044921875, -0.10875511169433594, -0.10625076293945312, -0.10374641418457031, -0.1012420654296875, -0.09873771667480469, -0.09623336791992188, -0.09372901916503906, -0.09122467041015625, -0.08872032165527344, -0.08621597290039062, -0.08371162414550781, -0.081207275390625, -0.07870292663574219, -0.07619857788085938, -0.07369422912597656, -0.07118988037109375, -0.06868553161621094, -0.06618118286132812, -0.06367683410644531, -0.0611724853515625, -0.05866813659667969, -0.056163787841796875, -0.05365943908691406, -0.05115509033203125, -0.04865074157714844, -0.046146392822265625, -0.04364204406738281, -0.0411376953125, -0.03863334655761719, -0.036128997802734375, -0.03362464904785156, -0.03112030029296875, -0.028615951538085938, -0.026111602783203125, -0.023607254028320312, -0.0211029052734375, -0.018598556518554688, -0.016094207763671875, -0.013589859008789062, -0.01108551025390625, -0.008581161499023438, -0.006076812744140625, -0.0035724639892578125, -0.001068115234375, 0.0014362335205078125, 0.003940582275390625, 0.0064449310302734375, 0.00894927978515625, 0.011453628540039062, 0.013957977294921875, 0.016462326049804688, 0.0189666748046875, 0.021471023559570312, 0.023975372314453125, 0.026479721069335938, 0.02898406982421875, 0.03148841857910156, 0.033992767333984375, 0.03649711608886719, 0.03900146484375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 8.0, 10.0, 9.0, 8.0, 13.0, 27.0, 31.0, 62.0, 95.0, 120.0, 206.0, 457.0, 1152.0, 3481.0, 14580.0, 118032.0, 792732.0, 99278.0, 13111.0, 3031.0, 1087.0, 446.0, 214.0, 99.0, 69.0, 49.0, 33.0, 31.0, 13.0, 12.0, 16.0, 10.0, 6.0, 4.0, 4.0, 3.0, 2.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1981201171875, -0.1911602020263672, -0.18420028686523438, -0.17724037170410156, -0.17028045654296875, -0.16332054138183594, -0.15636062622070312, -0.1494007110595703, -0.1424407958984375, -0.1354808807373047, -0.12852096557617188, -0.12156105041503906, -0.11460113525390625, -0.10764122009277344, -0.10068130493164062, -0.09372138977050781, -0.086761474609375, -0.07980155944824219, -0.07284164428710938, -0.06588172912597656, -0.05892181396484375, -0.05196189880371094, -0.045001983642578125, -0.03804206848144531, -0.0310821533203125, -0.024122238159179688, -0.017162322998046875, -0.010202407836914062, -0.00324249267578125, 0.0037174224853515625, 0.010677337646484375, 0.017637252807617188, 0.02459716796875, 0.03155708312988281, 0.038516998291015625, 0.04547691345214844, 0.05243682861328125, 0.05939674377441406, 0.06635665893554688, 0.07331657409667969, 0.0802764892578125, 0.08723640441894531, 0.09419631958007812, 0.10115623474121094, 0.10811614990234375, 0.11507606506347656, 0.12203598022460938, 0.1289958953857422, 0.135955810546875, 0.1429157257080078, 0.14987564086914062, 0.15683555603027344, 0.16379547119140625, 0.17075538635253906, 0.17771530151367188, 0.1846752166748047, 0.1916351318359375, 0.1985950469970703, 0.20555496215820312, 0.21251487731933594, 0.21947479248046875, 0.22643470764160156, 0.23339462280273438, 0.2403545379638672, 0.247314453125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 4.0, 4.0, 6.0, 9.0, 5.0, 11.0, 14.0, 17.0, 20.0, 36.0, 37.0, 32.0, 39.0, 34.0, 51.0, 61.0, 60.0, 55.0, 70.0, 68.0, 60.0, 46.0, 44.0, 36.0, 30.0, 30.0, 27.0, 23.0, 12.0, 16.0, 13.0, 11.0, 1.0, 2.0, 7.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.130126953125, -0.12544631958007812, -0.12076568603515625, -0.11608505249023438, -0.1114044189453125, -0.10672378540039062, -0.10204315185546875, -0.09736251831054688, -0.092681884765625, -0.08800125122070312, -0.08332061767578125, -0.07863998413085938, -0.0739593505859375, -0.06927871704101562, -0.06459808349609375, -0.059917449951171875, -0.05523681640625, -0.050556182861328125, -0.04587554931640625, -0.041194915771484375, -0.0365142822265625, -0.031833648681640625, -0.02715301513671875, -0.022472381591796875, -0.017791748046875, -0.013111114501953125, -0.00843048095703125, -0.003749847412109375, 0.0009307861328125, 0.005611419677734375, 0.01029205322265625, 0.014972686767578125, 0.0196533203125, 0.024333953857421875, 0.02901458740234375, 0.033695220947265625, 0.0383758544921875, 0.043056488037109375, 0.04773712158203125, 0.052417755126953125, 0.057098388671875, 0.061779022216796875, 0.06645965576171875, 0.07114028930664062, 0.0758209228515625, 0.08050155639648438, 0.08518218994140625, 0.08986282348632812, 0.09454345703125, 0.09922409057617188, 0.10390472412109375, 0.10858535766601562, 0.1132659912109375, 0.11794662475585938, 0.12262725830078125, 0.12730789184570312, 0.131988525390625, 0.13666915893554688, 0.14134979248046875, 0.14603042602539062, 0.1507110595703125, 0.15539169311523438, 0.16007232666015625, 0.16475296020507812, 0.16943359375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 6.0, 7.0, 12.0, 19.0, 25.0, 48.0, 87.0, 176.0, 482.0, 1675.0, 7844.0, 162903.0, 845574.0, 24828.0, 3342.0, 937.0, 294.0, 128.0, 67.0, 29.0, 24.0, 9.0, 9.0, 5.0, 5.0, 3.0, 4.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11431884765625, -0.11066055297851562, -0.10700225830078125, -0.10334396362304688, -0.0996856689453125, -0.09602737426757812, -0.09236907958984375, -0.08871078491210938, -0.085052490234375, -0.08139419555664062, -0.07773590087890625, -0.07407760620117188, -0.0704193115234375, -0.06676101684570312, -0.06310272216796875, -0.059444427490234375, -0.0557861328125, -0.052127838134765625, -0.04846954345703125, -0.044811248779296875, -0.0411529541015625, -0.037494659423828125, -0.03383636474609375, -0.030178070068359375, -0.026519775390625, -0.022861480712890625, -0.01920318603515625, -0.015544891357421875, -0.0118865966796875, -0.008228302001953125, -0.00457000732421875, -0.000911712646484375, 0.00274658203125, 0.006404876708984375, 0.01006317138671875, 0.013721466064453125, 0.0173797607421875, 0.021038055419921875, 0.02469635009765625, 0.028354644775390625, 0.032012939453125, 0.035671234130859375, 0.03932952880859375, 0.042987823486328125, 0.0466461181640625, 0.050304412841796875, 0.05396270751953125, 0.057621002197265625, 0.061279296875, 0.06493759155273438, 0.06859588623046875, 0.07225418090820312, 0.0759124755859375, 0.07957077026367188, 0.08322906494140625, 0.08688735961914062, 0.090545654296875, 0.09420394897460938, 0.09786224365234375, 0.10152053833007812, 0.1051788330078125, 0.10883712768554688, 0.11249542236328125, 0.11615371704101562, 0.11981201171875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 3.0, 6.0, 12.0, 13.0, 26.0, 20.0, 51.0, 65.0, 82.0, 110.0, 144.0, 106.0, 94.0, 97.0, 41.0, 39.0, 27.0, 24.0, 8.0, 11.0, 7.0, 7.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.728534698486328e-05, -1.6851350665092468e-05, -1.6417354345321655e-05, -1.5983358025550842e-05, -1.554936170578003e-05, -1.5115365386009216e-05, -1.4681369066238403e-05, -1.424737274646759e-05, -1.3813376426696777e-05, -1.3379380106925964e-05, -1.2945383787155151e-05, -1.2511387467384338e-05, -1.2077391147613525e-05, -1.1643394827842712e-05, -1.12093985080719e-05, -1.0775402188301086e-05, -1.0341405868530273e-05, -9.90740954875946e-06, -9.473413228988647e-06, -9.039416909217834e-06, -8.605420589447021e-06, -8.171424269676208e-06, -7.737427949905396e-06, -7.3034316301345825e-06, -6.8694353103637695e-06, -6.4354389905929565e-06, -6.0014426708221436e-06, -5.5674463510513306e-06, -5.133450031280518e-06, -4.699453711509705e-06, -4.265457391738892e-06, -3.831461071968079e-06, -3.3974647521972656e-06, -2.9634684324264526e-06, -2.5294721126556396e-06, -2.0954757928848267e-06, -1.6614794731140137e-06, -1.2274831533432007e-06, -7.934868335723877e-07, -3.594905138015747e-07, 7.450580596923828e-08, 5.085021257400513e-07, 9.424984455108643e-07, 1.3764947652816772e-06, 1.8104910850524902e-06, 2.2444874048233032e-06, 2.678483724594116e-06, 3.112480044364929e-06, 3.546476364135742e-06, 3.980472683906555e-06, 4.414469003677368e-06, 4.848465323448181e-06, 5.282461643218994e-06, 5.716457962989807e-06, 6.15045428276062e-06, 6.584450602531433e-06, 7.018446922302246e-06, 7.452443242073059e-06, 7.886439561843872e-06, 8.320435881614685e-06, 8.754432201385498e-06, 9.188428521156311e-06, 9.622424840927124e-06, 1.0056421160697937e-05, 1.049041748046875e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 3.0, 8.0, 10.0, 6.0, 14.0, 15.0, 24.0, 25.0, 51.0, 87.0, 90.0, 162.0, 279.0, 482.0, 989.0, 2445.0, 7721.0, 36880.0, 474577.0, 475318.0, 37114.0, 7756.0, 2330.0, 947.0, 477.0, 247.0, 153.0, 115.0, 55.0, 45.0, 38.0, 22.0, 16.0, 10.0, 22.0, 8.0, 5.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.060546875, -0.05865478515625, -0.0567626953125, -0.05487060546875, -0.052978515625, -0.05108642578125, -0.0491943359375, -0.04730224609375, -0.04541015625, -0.04351806640625, -0.0416259765625, -0.03973388671875, -0.037841796875, -0.03594970703125, -0.0340576171875, -0.03216552734375, -0.0302734375, -0.02838134765625, -0.0264892578125, -0.02459716796875, -0.022705078125, -0.02081298828125, -0.0189208984375, -0.01702880859375, -0.01513671875, -0.01324462890625, -0.0113525390625, -0.00946044921875, -0.007568359375, -0.00567626953125, -0.0037841796875, -0.00189208984375, 0.0, 0.00189208984375, 0.0037841796875, 0.00567626953125, 0.007568359375, 0.00946044921875, 0.0113525390625, 0.01324462890625, 0.01513671875, 0.01702880859375, 0.0189208984375, 0.02081298828125, 0.022705078125, 0.02459716796875, 0.0264892578125, 0.02838134765625, 0.0302734375, 0.03216552734375, 0.0340576171875, 0.03594970703125, 0.037841796875, 0.03973388671875, 0.0416259765625, 0.04351806640625, 0.04541015625, 0.04730224609375, 0.0491943359375, 0.05108642578125, 0.052978515625, 0.05487060546875, 0.0567626953125, 0.05865478515625, 0.060546875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 5.0, 4.0, 5.0, 11.0, 11.0, 28.0, 28.0, 37.0, 44.0, 57.0, 87.0, 87.0, 86.0, 104.0, 88.0, 73.0, 69.0, 39.0, 31.0, 19.0, 21.0, 17.0, 15.0, 8.0, 2.0, 3.0, 9.0, 4.0, 1.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048004150390625, -0.04659605026245117, -0.045187950134277344, -0.043779850006103516, -0.04237174987792969, -0.04096364974975586, -0.03955554962158203, -0.0381474494934082, -0.036739349365234375, -0.03533124923706055, -0.03392314910888672, -0.03251504898071289, -0.031106948852539062, -0.029698848724365234, -0.028290748596191406, -0.026882648468017578, -0.02547454833984375, -0.024066448211669922, -0.022658348083496094, -0.021250247955322266, -0.019842147827148438, -0.01843404769897461, -0.01702594757080078, -0.015617847442626953, -0.014209747314453125, -0.012801647186279297, -0.011393547058105469, -0.00998544692993164, -0.008577346801757812, -0.007169246673583984, -0.005761146545410156, -0.004353046417236328, -0.0029449462890625, -0.0015368461608886719, -0.00012874603271484375, 0.0012793540954589844, 0.0026874542236328125, 0.004095554351806641, 0.005503654479980469, 0.006911754608154297, 0.008319854736328125, 0.009727954864501953, 0.011136054992675781, 0.01254415512084961, 0.013952255249023438, 0.015360355377197266, 0.016768455505371094, 0.018176555633544922, 0.01958465576171875, 0.020992755889892578, 0.022400856018066406, 0.023808956146240234, 0.025217056274414062, 0.02662515640258789, 0.02803325653076172, 0.029441356658935547, 0.030849456787109375, 0.0322575569152832, 0.03366565704345703, 0.03507375717163086, 0.03648185729980469, 0.037889957427978516, 0.039298057556152344, 0.04070615768432617, 0.0421142578125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 7.0, 26.0, 81.0, 278.0, 431.0, 120.0, 38.0, 13.0, 4.0, 7.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.793364405632019, -1.7357144355773926, -1.6780643463134766, -1.62041437625885, -1.5627644062042236, -1.5051143169403076, -1.4474643468856812, -1.3898143768310547, -1.3321642875671387, -1.2745143175125122, -1.2168642282485962, -1.1592142581939697, -1.1015642881393433, -1.0439141988754272, -0.9862642288208008, -0.9286141991615295, -0.8709642291069031, -0.8133141994476318, -0.7556642293930054, -0.6980141997337341, -0.6403641700744629, -0.5827142000198364, -0.5250641703605652, -0.46741414070129395, -0.4097641408443451, -0.35211414098739624, -0.294464111328125, -0.23681411147117615, -0.1791640967130661, -0.12151408195495605, -0.0638640820980072, -0.006214052438735962, 0.05143594741821289, 0.10908596217632294, 0.16673597693443298, 0.22438597679138184, 0.2820360064506531, 0.33968600630760193, 0.3973360061645508, 0.454986035823822, 0.5126360654830933, 0.5702860951423645, 0.627936065196991, 0.6855860948562622, 0.7432361245155334, 0.8008861541748047, 0.8585361242294312, 0.9161861538887024, 0.9738361239433289, 1.0314861536026, 1.0891361236572266, 1.1467862129211426, 1.204436182975769, 1.2620861530303955, 1.3197362422943115, 1.377386212348938, 1.4350361824035645, 1.492686152458191, 1.550336241722107, 1.6079862117767334, 1.6656361818313599, 1.7232862710952759, 1.7809362411499023, 1.8385863304138184, 1.8962363004684448]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 9.0, 8.0, 5.0, 8.0, 18.0, 22.0, 19.0, 21.0, 24.0, 25.0, 44.0, 44.0, 40.0, 56.0, 45.0, 44.0, 69.0, 60.0, 50.0, 55.0, 39.0, 34.0, 36.0, 41.0, 41.0, 35.0, 18.0, 19.0, 14.0, 9.0, 8.0, 16.0, 6.0, 7.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6836400032043457, -0.6603651642799377, -0.6370903253555298, -0.6138154864311218, -0.5905406475067139, -0.5672657489776611, -0.5439909100532532, -0.5207160711288452, -0.49744123220443726, -0.4741663932800293, -0.45089155435562134, -0.427616685628891, -0.40434184670448303, -0.3810670077800751, -0.3577921390533447, -0.33451730012893677, -0.3112424612045288, -0.28796762228012085, -0.2646927833557129, -0.24141791462898254, -0.21814307570457458, -0.19486823678016663, -0.17159338295459747, -0.14831852912902832, -0.12504369020462036, -0.1017688438296318, -0.07849399745464325, -0.055219151079654694, -0.03194430470466614, -0.008669458329677582, 0.014605388045310974, 0.03788024187088013, 0.06115502119064331, 0.08442986756563187, 0.10770471394062042, 0.13097956776618958, 0.15425440669059753, 0.1775292456150055, 0.20080409944057465, 0.2240789532661438, 0.24735379219055176, 0.2706286311149597, 0.2939034700393677, 0.317178338766098, 0.340453177690506, 0.36372801661491394, 0.3870028853416443, 0.41027772426605225, 0.4335525631904602, 0.45682740211486816, 0.4801022410392761, 0.5033770799636841, 0.5266519784927368, 0.5499268174171448, 0.5732016563415527, 0.5964764952659607, 0.6197513341903687, 0.6430261731147766, 0.6663010120391846, 0.6895758509635925, 0.7128506898880005, 0.7361255884170532, 0.7594004273414612, 0.7826752662658691, 0.8059501051902771]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 8.0, 5.0, 11.0, 8.0, 19.0, 13.0, 30.0, 46.0, 58.0, 98.0, 145.0, 262.0, 494.0, 1088.0, 3395.0, 18091.0, 989444.0, 3152272.0, 23381.0, 3714.0, 1077.0, 341.0, 143.0, 67.0, 31.0, 19.0, 6.0, 8.0, 3.0, 0.0, 3.0], "bins": [-0.55029296875, -0.5392971038818359, -0.5283012390136719, -0.5173053741455078, -0.5063095092773438, -0.4953136444091797, -0.4843177795410156, -0.47332191467285156, -0.4623260498046875, -0.45133018493652344, -0.4403343200683594, -0.4293384552001953, -0.41834259033203125, -0.4073467254638672, -0.3963508605957031, -0.38535499572753906, -0.374359130859375, -0.36336326599121094, -0.3523674011230469, -0.3413715362548828, -0.33037567138671875, -0.3193798065185547, -0.3083839416503906, -0.29738807678222656, -0.2863922119140625, -0.27539634704589844, -0.2644004821777344, -0.2534046173095703, -0.24240875244140625, -0.2314128875732422, -0.22041702270507812, -0.20942115783691406, -0.19842529296875, -0.18742942810058594, -0.17643356323242188, -0.1654376983642578, -0.15444183349609375, -0.1434459686279297, -0.13245010375976562, -0.12145423889160156, -0.1104583740234375, -0.09946250915527344, -0.08846664428710938, -0.07747077941894531, -0.06647491455078125, -0.05547904968261719, -0.044483184814453125, -0.03348731994628906, -0.022491455078125, -0.011495590209960938, -0.000499725341796875, 0.010496139526367188, 0.02149200439453125, 0.03248786926269531, 0.043483734130859375, 0.05447959899902344, 0.0654754638671875, 0.07647132873535156, 0.08746719360351562, 0.09846305847167969, 0.10945892333984375, 0.12045478820800781, 0.13145065307617188, 0.14244651794433594, 0.1534423828125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 12.0, 19.0, 34.0, 75.0, 95.0, 129.0, 138.0, 153.0, 125.0, 71.0, 68.0, 33.0, 22.0, 10.0, 5.0, 4.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1217041015625, -0.11916065216064453, -0.11661720275878906, -0.1140737533569336, -0.11153030395507812, -0.10898685455322266, -0.10644340515136719, -0.10389995574951172, -0.10135650634765625, -0.09881305694580078, -0.09626960754394531, -0.09372615814208984, -0.09118270874023438, -0.0886392593383789, -0.08609580993652344, -0.08355236053466797, -0.0810089111328125, -0.07846546173095703, -0.07592201232910156, -0.0733785629272461, -0.07083511352539062, -0.06829166412353516, -0.06574821472167969, -0.06320476531982422, -0.06066131591796875, -0.05811786651611328, -0.05557441711425781, -0.053030967712402344, -0.050487518310546875, -0.047944068908691406, -0.04540061950683594, -0.04285717010498047, -0.040313720703125, -0.03777027130126953, -0.03522682189941406, -0.032683372497558594, -0.030139923095703125, -0.027596473693847656, -0.025053024291992188, -0.02250957489013672, -0.01996612548828125, -0.01742267608642578, -0.014879226684570312, -0.012335777282714844, -0.009792327880859375, -0.007248878479003906, -0.0047054290771484375, -0.0021619796752929688, 0.0003814697265625, 0.0029249191284179688, 0.0054683685302734375, 0.008011817932128906, 0.010555267333984375, 0.013098716735839844, 0.015642166137695312, 0.01818561553955078, 0.02072906494140625, 0.02327251434326172, 0.025815963745117188, 0.028359413146972656, 0.030902862548828125, 0.033446311950683594, 0.03598976135253906, 0.03853321075439453, 0.04107666015625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 7.0, 7.0, 13.0, 22.0, 49.0, 81.0, 140.0, 227.0, 698.0, 155814.0, 4035446.0, 1044.0, 317.0, 168.0, 84.0, 64.0, 41.0, 29.0, 15.0, 13.0, 3.0, 6.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.99853515625, -0.9629745483398438, -0.9274139404296875, -0.8918533325195312, -0.856292724609375, -0.8207321166992188, -0.7851715087890625, -0.7496109008789062, -0.71405029296875, -0.6784896850585938, -0.6429290771484375, -0.6073684692382812, -0.571807861328125, -0.5362472534179688, -0.5006866455078125, -0.46512603759765625, -0.4295654296875, -0.39400482177734375, -0.3584442138671875, -0.32288360595703125, -0.287322998046875, -0.25176239013671875, -0.2162017822265625, -0.18064117431640625, -0.14508056640625, -0.10951995849609375, -0.0739593505859375, -0.03839874267578125, -0.002838134765625, 0.03272247314453125, 0.0682830810546875, 0.10384368896484375, 0.139404296875, 0.17496490478515625, 0.2105255126953125, 0.24608612060546875, 0.281646728515625, 0.31720733642578125, 0.3527679443359375, 0.38832855224609375, 0.42388916015625, 0.45944976806640625, 0.4950103759765625, 0.5305709838867188, 0.566131591796875, 0.6016921997070312, 0.6372528076171875, 0.6728134155273438, 0.7083740234375, 0.7439346313476562, 0.7794952392578125, 0.8150558471679688, 0.850616455078125, 0.8861770629882812, 0.9217376708984375, 0.9572982788085938, 0.99285888671875, 1.0284194946289062, 1.0639801025390625, 1.0995407104492188, 1.135101318359375, 1.1706619262695312, 1.2062225341796875, 1.2417831420898438, 1.27734375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 30.0, 219.0, 3591.0, 192.0, 30.0, 12.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.157470703125, -0.14939498901367188, -0.14131927490234375, -0.13324356079101562, -0.1251678466796875, -0.11709213256835938, -0.10901641845703125, -0.10094070434570312, -0.092864990234375, -0.08478927612304688, -0.07671356201171875, -0.06863784790039062, -0.0605621337890625, -0.052486419677734375, -0.04441070556640625, -0.036334991455078125, -0.02825927734375, -0.020183563232421875, -0.01210784912109375, -0.004032135009765625, 0.0040435791015625, 0.012119293212890625, 0.02019500732421875, 0.028270721435546875, 0.036346435546875, 0.044422149658203125, 0.05249786376953125, 0.060573577880859375, 0.0686492919921875, 0.07672500610351562, 0.08480072021484375, 0.09287643432617188, 0.1009521484375, 0.10902786254882812, 0.11710357666015625, 0.12517929077148438, 0.1332550048828125, 0.14133071899414062, 0.14940643310546875, 0.15748214721679688, 0.165557861328125, 0.17363357543945312, 0.18170928955078125, 0.18978500366210938, 0.1978607177734375, 0.20593643188476562, 0.21401214599609375, 0.22208786010742188, 0.23016357421875, 0.23823928833007812, 0.24631500244140625, 0.2543907165527344, 0.2624664306640625, 0.2705421447753906, 0.27861785888671875, 0.2866935729980469, 0.294769287109375, 0.3028450012207031, 0.31092071533203125, 0.3189964294433594, 0.3270721435546875, 0.3351478576660156, 0.34322357177734375, 0.3512992858886719, 0.359375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 16.0, 990.0, 10.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.808521747589111, -7.66502571105957, -7.521529674530029, -7.37803316116333, -7.234537124633789, -7.091041088104248, -6.947545051574707, -6.804049015045166, -6.660552978515625, -6.517056941986084, -6.373560905456543, -6.230064392089844, -6.086568355560303, -5.943072319030762, -5.799576282501221, -5.65608024597168, -5.5125837326049805, -5.3690876960754395, -5.225591659545898, -5.082095146179199, -4.938599109649658, -4.795103073120117, -4.651607036590576, -4.508111000061035, -4.364614486694336, -4.221118450164795, -4.077622413635254, -3.934126138687134, -3.7906298637390137, -3.6471338272094727, -3.5036377906799316, -3.3601417541503906, -3.2166452407836914, -3.0731492042541504, -2.9296529293060303, -2.7861568927764893, -2.642660617828369, -2.499164581298828, -2.355668544769287, -2.212172508239746, -2.068676233291626, -1.9251800775527954, -1.7816839218139648, -1.6381878852844238, -1.4946917295455933, -1.3511955738067627, -1.2076995372772217, -1.0642033815383911, -0.9207072257995605, -0.77721107006073, -0.6337149739265442, -0.490218847990036, -0.34672272205352783, -0.20322656631469727, -0.059730470180511475, 0.08376562595367432, 0.22726178169250488, 0.37075790762901306, 0.5142540335655212, 0.657750129699707, 0.8012462854385376, 0.9447424411773682, 1.0882384777069092, 1.2317346334457397, 1.3752307891845703]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 8.0, 12.0, 13.0, 32.0, 38.0, 55.0, 80.0, 105.0, 121.0, 120.0, 110.0, 85.0, 82.0, 71.0, 35.0, 21.0, 11.0, 4.0, 0.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.5628576874732971, -0.548931360244751, -0.5350049734115601, -0.5210786461830139, -0.507152259349823, -0.49322590231895447, -0.47929954528808594, -0.4653732180595398, -0.4514468312263489, -0.43752047419548035, -0.4235941171646118, -0.4096677601337433, -0.39574140310287476, -0.3818150460720062, -0.3678886890411377, -0.35396236181259155, -0.340036004781723, -0.3261096477508545, -0.31218329071998596, -0.29825693368911743, -0.2843305766582489, -0.27040421962738037, -0.25647789239883423, -0.2425515204668045, -0.22862516343593597, -0.21469880640506744, -0.2007724493741989, -0.18684610724449158, -0.17291975021362305, -0.15899339318275452, -0.145067036151886, -0.13114067912101746, -0.11721432209014893, -0.1032879650592804, -0.08936160802841187, -0.07543525844812393, -0.0615089014172554, -0.04758254438638687, -0.03365619480609894, -0.019729837775230408, -0.0058034807443618774, 0.008122874423861504, 0.022049229592084885, 0.035975582897663116, 0.04990193992853165, 0.06382829695940018, 0.07775464653968811, 0.09168100357055664, 0.10560736060142517, 0.1195337176322937, 0.13346007466316223, 0.14738643169403076, 0.1613127887248993, 0.17523914575576782, 0.18916548788547516, 0.2030918449163437, 0.21701820194721222, 0.23094455897808075, 0.24487091600894928, 0.2587972581386566, 0.27272361516952515, 0.2866499722003937, 0.3005763292312622, 0.31450268626213074, 0.32842904329299927]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 5.0, 4.0, 4.0, 4.0, 10.0, 15.0, 14.0, 31.0, 38.0, 61.0, 85.0, 141.0, 246.0, 431.0, 858.0, 2269.0, 8879.0, 58292.0, 628254.0, 311125.0, 29383.0, 5336.0, 1572.0, 631.0, 345.0, 163.0, 111.0, 81.0, 51.0, 43.0, 25.0, 19.0, 13.0, 8.0, 5.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.291015625, -0.2835216522216797, -0.2760276794433594, -0.26853370666503906, -0.26103973388671875, -0.25354576110839844, -0.24605178833007812, -0.2385578155517578, -0.2310638427734375, -0.2235698699951172, -0.21607589721679688, -0.20858192443847656, -0.20108795166015625, -0.19359397888183594, -0.18610000610351562, -0.1786060333251953, -0.171112060546875, -0.1636180877685547, -0.15612411499023438, -0.14863014221191406, -0.14113616943359375, -0.13364219665527344, -0.12614822387695312, -0.11865425109863281, -0.1111602783203125, -0.10366630554199219, -0.09617233276367188, -0.08867835998535156, -0.08118438720703125, -0.07369041442871094, -0.06619644165039062, -0.05870246887207031, -0.05120849609375, -0.04371452331542969, -0.036220550537109375, -0.028726577758789062, -0.02123260498046875, -0.013738632202148438, -0.006244659423828125, 0.0012493133544921875, 0.0087432861328125, 0.016237258911132812, 0.023731231689453125, 0.031225204467773438, 0.03871917724609375, 0.04621315002441406, 0.053707122802734375, 0.06120109558105469, 0.068695068359375, 0.07618904113769531, 0.08368301391601562, 0.09117698669433594, 0.09867095947265625, 0.10616493225097656, 0.11365890502929688, 0.12115287780761719, 0.1286468505859375, 0.1361408233642578, 0.14363479614257812, 0.15112876892089844, 0.15862274169921875, 0.16611671447753906, 0.17361068725585938, 0.1811046600341797, 0.1885986328125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 10.0, 17.0, 31.0, 53.0, 73.0, 103.0, 106.0, 121.0, 143.0, 106.0, 79.0, 62.0, 35.0, 23.0, 18.0, 7.0, 5.0, 5.0, 4.0, 1.0, 3.0, 2.0], "bins": [-0.107421875, -0.10526108741760254, -0.10310029983520508, -0.10093951225280762, -0.09877872467041016, -0.0966179370880127, -0.09445714950561523, -0.09229636192321777, -0.09013557434082031, -0.08797478675842285, -0.08581399917602539, -0.08365321159362793, -0.08149242401123047, -0.07933163642883301, -0.07717084884643555, -0.07501006126403809, -0.07284927368164062, -0.07068848609924316, -0.0685276985168457, -0.06636691093444824, -0.06420612335205078, -0.06204533576965332, -0.05988454818725586, -0.0577237606048584, -0.05556297302246094, -0.05340218544006348, -0.051241397857666016, -0.049080610275268555, -0.046919822692871094, -0.04475903511047363, -0.04259824752807617, -0.04043745994567871, -0.03827667236328125, -0.03611588478088379, -0.03395509719848633, -0.03179430961608887, -0.029633522033691406, -0.027472734451293945, -0.025311946868896484, -0.023151159286499023, -0.020990371704101562, -0.0188295841217041, -0.01666879653930664, -0.01450800895690918, -0.012347221374511719, -0.010186433792114258, -0.008025646209716797, -0.005864858627319336, -0.003704071044921875, -0.001543283462524414, 0.0006175041198730469, 0.002778291702270508, 0.004939079284667969, 0.00709986686706543, 0.00926065444946289, 0.011421442031860352, 0.013582229614257812, 0.015743017196655273, 0.017903804779052734, 0.020064592361450195, 0.022225379943847656, 0.024386167526245117, 0.026546955108642578, 0.02870774269104004, 0.0308685302734375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 12.0, 5.0, 6.0, 10.0, 14.0, 28.0, 32.0, 57.0, 135.0, 263.0, 595.0, 1520.0, 6021.0, 39215.0, 728691.0, 249527.0, 17159.0, 3414.0, 1045.0, 386.0, 181.0, 98.0, 47.0, 31.0, 26.0, 15.0, 7.0, 6.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.306396484375, -0.2978401184082031, -0.28928375244140625, -0.2807273864746094, -0.2721710205078125, -0.2636146545410156, -0.25505828857421875, -0.24650192260742188, -0.237945556640625, -0.22938919067382812, -0.22083282470703125, -0.21227645874023438, -0.2037200927734375, -0.19516372680664062, -0.18660736083984375, -0.17805099487304688, -0.16949462890625, -0.16093826293945312, -0.15238189697265625, -0.14382553100585938, -0.1352691650390625, -0.12671279907226562, -0.11815643310546875, -0.10960006713867188, -0.101043701171875, -0.09248733520507812, -0.08393096923828125, -0.07537460327148438, -0.0668182373046875, -0.058261871337890625, -0.04970550537109375, -0.041149139404296875, -0.0325927734375, -0.024036407470703125, -0.01548004150390625, -0.006923675537109375, 0.0016326904296875, 0.010189056396484375, 0.01874542236328125, 0.027301788330078125, 0.035858154296875, 0.044414520263671875, 0.05297088623046875, 0.061527252197265625, 0.0700836181640625, 0.07863998413085938, 0.08719635009765625, 0.09575271606445312, 0.10430908203125, 0.11286544799804688, 0.12142181396484375, 0.12997817993164062, 0.1385345458984375, 0.14709091186523438, 0.15564727783203125, 0.16420364379882812, 0.172760009765625, 0.18131637573242188, 0.18987274169921875, 0.19842910766601562, 0.2069854736328125, 0.21554183959960938, 0.22409820556640625, 0.23265457153320312, 0.2412109375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 8.0, 3.0, 5.0, 9.0, 11.0, 21.0, 15.0, 27.0, 34.0, 50.0, 51.0, 66.0, 86.0, 94.0, 82.0, 87.0, 74.0, 66.0, 58.0, 33.0, 41.0, 17.0, 16.0, 17.0, 12.0, 6.0, 4.0, 2.0, 3.0, 5.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.251708984375, -0.24495697021484375, -0.2382049560546875, -0.23145294189453125, -0.224700927734375, -0.21794891357421875, -0.2111968994140625, -0.20444488525390625, -0.19769287109375, -0.19094085693359375, -0.1841888427734375, -0.17743682861328125, -0.170684814453125, -0.16393280029296875, -0.1571807861328125, -0.15042877197265625, -0.1436767578125, -0.13692474365234375, -0.1301727294921875, -0.12342071533203125, -0.116668701171875, -0.10991668701171875, -0.1031646728515625, -0.09641265869140625, -0.08966064453125, -0.08290863037109375, -0.0761566162109375, -0.06940460205078125, -0.062652587890625, -0.05590057373046875, -0.0491485595703125, -0.04239654541015625, -0.03564453125, -0.02889251708984375, -0.0221405029296875, -0.01538848876953125, -0.008636474609375, -0.00188446044921875, 0.0048675537109375, 0.01161956787109375, 0.01837158203125, 0.02512359619140625, 0.0318756103515625, 0.03862762451171875, 0.045379638671875, 0.05213165283203125, 0.0588836669921875, 0.06563568115234375, 0.0723876953125, 0.07913970947265625, 0.0858917236328125, 0.09264373779296875, 0.099395751953125, 0.10614776611328125, 0.1128997802734375, 0.11965179443359375, 0.12640380859375, 0.13315582275390625, 0.1399078369140625, 0.14665985107421875, 0.153411865234375, 0.16016387939453125, 0.1669158935546875, 0.17366790771484375, 0.180419921875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 4.0, 3.0, 3.0, 4.0, 4.0, 7.0, 5.0, 15.0, 21.0, 29.0, 49.0, 93.0, 120.0, 188.0, 310.0, 650.0, 1525.0, 6015.0, 56154.0, 879401.0, 92794.0, 7632.0, 1861.0, 732.0, 382.0, 218.0, 115.0, 76.0, 48.0, 31.0, 22.0, 19.0, 12.0, 2.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08245849609375, -0.07935523986816406, -0.07625198364257812, -0.07314872741699219, -0.07004547119140625, -0.06694221496582031, -0.06383895874023438, -0.06073570251464844, -0.0576324462890625, -0.05452919006347656, -0.051425933837890625, -0.04832267761230469, -0.04521942138671875, -0.04211616516113281, -0.039012908935546875, -0.03590965270996094, -0.032806396484375, -0.029703140258789062, -0.026599884033203125, -0.023496627807617188, -0.02039337158203125, -0.017290115356445312, -0.014186859130859375, -0.011083602905273438, -0.0079803466796875, -0.0048770904541015625, -0.001773834228515625, 0.0013294219970703125, 0.00443267822265625, 0.0075359344482421875, 0.010639190673828125, 0.013742446899414062, 0.016845703125, 0.019948959350585938, 0.023052215576171875, 0.026155471801757812, 0.02925872802734375, 0.03236198425292969, 0.035465240478515625, 0.03856849670410156, 0.0416717529296875, 0.04477500915527344, 0.047878265380859375, 0.05098152160644531, 0.05408477783203125, 0.05718803405761719, 0.060291290283203125, 0.06339454650878906, 0.066497802734375, 0.06960105895996094, 0.07270431518554688, 0.07580757141113281, 0.07891082763671875, 0.08201408386230469, 0.08511734008789062, 0.08822059631347656, 0.0913238525390625, 0.09442710876464844, 0.09753036499023438, 0.10063362121582031, 0.10373687744140625, 0.10684013366699219, 0.10994338989257812, 0.11304664611816406, 0.11614990234375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 9.0, 7.0, 10.0, 21.0, 19.0, 34.0, 38.0, 51.0, 57.0, 64.0, 55.0, 89.0, 57.0, 78.0, 58.0, 67.0, 61.0, 59.0, 42.0, 21.0, 28.0, 10.0, 15.0, 6.0, 13.0, 5.0, 4.0, 6.0, 1.0, 2.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.331371307373047e-06, -7.0659443736076355e-06, -6.800517439842224e-06, -6.535090506076813e-06, -6.269663572311401e-06, -6.00423663854599e-06, -5.738809704780579e-06, -5.473382771015167e-06, -5.207955837249756e-06, -4.9425289034843445e-06, -4.677101969718933e-06, -4.411675035953522e-06, -4.14624810218811e-06, -3.880821168422699e-06, -3.6153942346572876e-06, -3.3499673008918762e-06, -3.084540367126465e-06, -2.8191134333610535e-06, -2.553686499595642e-06, -2.2882595658302307e-06, -2.0228326320648193e-06, -1.757405698299408e-06, -1.4919787645339966e-06, -1.2265518307685852e-06, -9.611248970031738e-07, -6.956979632377625e-07, -4.302710294723511e-07, -1.648440957069397e-07, 1.0058283805847168e-07, 3.6600977182388306e-07, 6.314367055892944e-07, 8.968636393547058e-07, 1.1622905731201172e-06, 1.4277175068855286e-06, 1.69314444065094e-06, 1.9585713744163513e-06, 2.2239983081817627e-06, 2.489425241947174e-06, 2.7548521757125854e-06, 3.020279109477997e-06, 3.285706043243408e-06, 3.5511329770088196e-06, 3.816559910774231e-06, 4.081986844539642e-06, 4.347413778305054e-06, 4.612840712070465e-06, 4.8782676458358765e-06, 5.143694579601288e-06, 5.409121513366699e-06, 5.674548447132111e-06, 5.939975380897522e-06, 6.205402314662933e-06, 6.470829248428345e-06, 6.736256182193756e-06, 7.0016831159591675e-06, 7.267110049724579e-06, 7.53253698348999e-06, 7.797963917255402e-06, 8.063390851020813e-06, 8.328817784786224e-06, 8.594244718551636e-06, 8.859671652317047e-06, 9.125098586082458e-06, 9.39052551984787e-06, 9.655952453613281e-06]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 5.0, 5.0, 12.0, 19.0, 24.0, 43.0, 53.0, 123.0, 216.0, 524.0, 1663.0, 8056.0, 137016.0, 855237.0, 39176.0, 4431.0, 1132.0, 428.0, 166.0, 75.0, 52.0, 41.0, 14.0, 11.0, 10.0, 6.0, 9.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1058349609375, -0.1029214859008789, -0.10000801086425781, -0.09709453582763672, -0.09418106079101562, -0.09126758575439453, -0.08835411071777344, -0.08544063568115234, -0.08252716064453125, -0.07961368560791016, -0.07670021057128906, -0.07378673553466797, -0.07087326049804688, -0.06795978546142578, -0.06504631042480469, -0.062132835388183594, -0.0592193603515625, -0.056305885314941406, -0.05339241027832031, -0.05047893524169922, -0.047565460205078125, -0.04465198516845703, -0.04173851013183594, -0.038825035095214844, -0.03591156005859375, -0.032998085021972656, -0.030084609985351562, -0.02717113494873047, -0.024257659912109375, -0.02134418487548828, -0.018430709838867188, -0.015517234802246094, -0.012603759765625, -0.009690284729003906, -0.0067768096923828125, -0.0038633346557617188, -0.000949859619140625, 0.0019636154174804688, 0.0048770904541015625, 0.007790565490722656, 0.01070404052734375, 0.013617515563964844, 0.016530990600585938, 0.01944446563720703, 0.022357940673828125, 0.02527141571044922, 0.028184890747070312, 0.031098365783691406, 0.0340118408203125, 0.036925315856933594, 0.03983879089355469, 0.04275226593017578, 0.045665740966796875, 0.04857921600341797, 0.05149269104003906, 0.054406166076660156, 0.05731964111328125, 0.060233116149902344, 0.06314659118652344, 0.06606006622314453, 0.06897354125976562, 0.07188701629638672, 0.07480049133300781, 0.0777139663696289, 0.08062744140625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 8.0, 9.0, 11.0, 9.0, 14.0, 11.0, 30.0, 31.0, 78.0, 117.0, 118.0, 107.0, 116.0, 94.0, 83.0, 53.0, 28.0, 20.0, 17.0, 11.0, 4.0, 6.0, 8.0, 4.0, 6.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0374755859375, -0.035633087158203125, -0.03379058837890625, -0.031948089599609375, -0.0301055908203125, -0.028263092041015625, -0.02642059326171875, -0.024578094482421875, -0.022735595703125, -0.020893096923828125, -0.01905059814453125, -0.017208099365234375, -0.0153656005859375, -0.013523101806640625, -0.01168060302734375, -0.009838104248046875, -0.00799560546875, -0.006153106689453125, -0.00431060791015625, -0.002468109130859375, -0.0006256103515625, 0.001216888427734375, 0.00305938720703125, 0.004901885986328125, 0.006744384765625, 0.008586883544921875, 0.01042938232421875, 0.012271881103515625, 0.0141143798828125, 0.015956878662109375, 0.01779937744140625, 0.019641876220703125, 0.021484375, 0.023326873779296875, 0.02516937255859375, 0.027011871337890625, 0.0288543701171875, 0.030696868896484375, 0.03253936767578125, 0.034381866455078125, 0.036224365234375, 0.038066864013671875, 0.03990936279296875, 0.041751861572265625, 0.0435943603515625, 0.045436859130859375, 0.04727935791015625, 0.049121856689453125, 0.05096435546875, 0.052806854248046875, 0.05464935302734375, 0.056491851806640625, 0.0583343505859375, 0.060176849365234375, 0.06201934814453125, 0.06386184692382812, 0.065704345703125, 0.06754684448242188, 0.06938934326171875, 0.07123184204101562, 0.0730743408203125, 0.07491683959960938, 0.07675933837890625, 0.07860183715820312, 0.0804443359375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 6.0, 11.0, 36.0, 141.0, 443.0, 279.0, 64.0, 19.0, 5.0, 5.0, 3.0], "bins": [-4.339543342590332, -4.2644195556640625, -4.189296245574951, -4.114172458648682, -4.03904914855957, -3.963925361633301, -3.8888018131256104, -3.81367826461792, -3.7385544776916504, -3.66343092918396, -3.5883073806762695, -3.51318359375, -3.4380600452423096, -3.362936496734619, -3.2878129482269287, -3.2126893997192383, -3.137565851211548, -3.0624423027038574, -2.987318754196167, -2.9121949672698975, -2.837071418762207, -2.7619478702545166, -2.686824321746826, -2.6117007732391357, -2.5365772247314453, -2.461453676223755, -2.3863301277160645, -2.311206340789795, -2.2360827922821045, -2.160959243774414, -2.0858356952667236, -2.010712146759033, -1.9355883598327637, -1.8604648113250732, -1.7853411436080933, -1.7102175951004028, -1.6350939273834229, -1.5599703788757324, -1.484846830368042, -1.4097232818603516, -1.334599494934082, -1.2594759464263916, -1.1843522787094116, -1.1092287302017212, -1.0341050624847412, -0.9589815139770508, -0.8838579654693604, -0.8087343573570251, -0.7336108088493347, -0.6584872007369995, -0.5833636522293091, -0.5082400441169739, -0.43311643600463867, -0.35799282789230347, -0.28286924958229065, -0.20774567127227783, -0.13262206315994263, -0.057498469948768616, 0.017625123262405396, 0.0927487164735794, 0.16787230968475342, 0.24299591779708862, 0.31811949610710144, 0.39324307441711426, 0.46836668252944946]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 3.0, 4.0, 3.0, 4.0, 6.0, 6.0, 11.0, 10.0, 16.0, 25.0, 24.0, 30.0, 33.0, 37.0, 36.0, 35.0, 45.0, 40.0, 41.0, 49.0, 37.0, 51.0, 53.0, 46.0, 46.0, 33.0, 44.0, 41.0, 35.0, 18.0, 20.0, 20.0, 19.0, 15.0, 15.0, 7.0, 7.0, 6.0, 8.0, 9.0, 3.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6952948570251465, -0.6720430850982666, -0.6487912535667419, -0.6255394220352173, -0.6022876501083374, -0.5790358781814575, -0.5557840466499329, -0.5325322151184082, -0.5092804431915283, -0.48602864146232605, -0.4627768397331238, -0.4395250380039215, -0.41627323627471924, -0.39302143454551697, -0.3697696328163147, -0.3465178310871124, -0.32326602935791016, -0.3000142276287079, -0.2767624258995056, -0.25351062417030334, -0.23025882244110107, -0.2070070207118988, -0.18375521898269653, -0.16050341725349426, -0.137251615524292, -0.11399981379508972, -0.09074801206588745, -0.06749621033668518, -0.04424440860748291, -0.02099260687828064, 0.002259194850921631, 0.0255109965801239, 0.048762738704681396, 0.07201454043388367, 0.09526634216308594, 0.11851814389228821, 0.14176994562149048, 0.16502174735069275, 0.18827354907989502, 0.2115253508090973, 0.23477715253829956, 0.25802895426750183, 0.2812807559967041, 0.30453255772590637, 0.32778435945510864, 0.3510361611843109, 0.3742879629135132, 0.39753976464271545, 0.4207915663719177, 0.44404336810112, 0.46729516983032227, 0.49054697155952454, 0.5137987732887268, 0.5370506048202515, 0.5603023767471313, 0.5835541486740112, 0.6068059802055359, 0.6300578117370605, 0.6533095836639404, 0.6765613555908203, 0.699813187122345, 0.7230650186538696, 0.7463167905807495, 0.7695685625076294, 0.792820394039154]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 6.0, 3.0, 2.0, 3.0, 5.0, 8.0, 7.0, 6.0, 6.0, 11.0, 15.0, 29.0, 28.0, 41.0, 61.0, 101.0, 138.0, 197.0, 326.0, 587.0, 1137.0, 2607.0, 7304.0, 32015.0, 665233.0, 3406108.0, 62170.0, 10657.0, 3170.0, 1203.0, 572.0, 233.0, 129.0, 73.0, 39.0, 19.0, 13.0, 10.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.37060546875, -0.362396240234375, -0.35418701171875, -0.345977783203125, -0.3377685546875, -0.329559326171875, -0.32135009765625, -0.313140869140625, -0.304931640625, -0.296722412109375, -0.28851318359375, -0.280303955078125, -0.2720947265625, -0.263885498046875, -0.25567626953125, -0.247467041015625, -0.2392578125, -0.231048583984375, -0.22283935546875, -0.214630126953125, -0.2064208984375, -0.198211669921875, -0.19000244140625, -0.181793212890625, -0.173583984375, -0.165374755859375, -0.15716552734375, -0.148956298828125, -0.1407470703125, -0.132537841796875, -0.12432861328125, -0.116119384765625, -0.10791015625, -0.099700927734375, -0.09149169921875, -0.083282470703125, -0.0750732421875, -0.066864013671875, -0.05865478515625, -0.050445556640625, -0.042236328125, -0.034027099609375, -0.02581787109375, -0.017608642578125, -0.0093994140625, -0.001190185546875, 0.00701904296875, 0.015228271484375, 0.0234375, 0.031646728515625, 0.03985595703125, 0.048065185546875, 0.0562744140625, 0.064483642578125, 0.07269287109375, 0.080902099609375, 0.089111328125, 0.097320556640625, 0.10552978515625, 0.113739013671875, 0.1219482421875, 0.130157470703125, 0.13836669921875, 0.146575927734375, 0.15478515625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 8.0, 12.0, 26.0, 41.0, 59.0, 75.0, 119.0, 134.0, 121.0, 98.0, 107.0, 69.0, 55.0, 35.0, 21.0, 17.0, 4.0, 2.0, 4.0, 0.0, 1.0, 2.0], "bins": [-0.109619140625, -0.1074373722076416, -0.1052556037902832, -0.1030738353729248, -0.1008920669555664, -0.09871029853820801, -0.09652853012084961, -0.09434676170349121, -0.09216499328613281, -0.08998322486877441, -0.08780145645141602, -0.08561968803405762, -0.08343791961669922, -0.08125615119934082, -0.07907438278198242, -0.07689261436462402, -0.07471084594726562, -0.07252907752990723, -0.07034730911254883, -0.06816554069519043, -0.06598377227783203, -0.06380200386047363, -0.061620235443115234, -0.059438467025756836, -0.05725669860839844, -0.05507493019104004, -0.05289316177368164, -0.05071139335632324, -0.048529624938964844, -0.046347856521606445, -0.04416608810424805, -0.04198431968688965, -0.03980255126953125, -0.03762078285217285, -0.03543901443481445, -0.033257246017456055, -0.031075477600097656, -0.028893709182739258, -0.02671194076538086, -0.02453017234802246, -0.022348403930664062, -0.020166635513305664, -0.017984867095947266, -0.015803098678588867, -0.013621330261230469, -0.01143956184387207, -0.009257793426513672, -0.0070760250091552734, -0.004894256591796875, -0.0027124881744384766, -0.0005307197570800781, 0.0016510486602783203, 0.0038328170776367188, 0.006014585494995117, 0.008196353912353516, 0.010378122329711914, 0.012559890747070312, 0.014741659164428711, 0.01692342758178711, 0.019105195999145508, 0.021286964416503906, 0.023468732833862305, 0.025650501251220703, 0.0278322696685791, 0.0300140380859375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 10.0, 5.0, 13.0, 14.0, 23.0, 33.0, 53.0, 84.0, 134.0, 234.0, 644.0, 2991.0, 25627.0, 4097415.0, 61294.0, 4358.0, 815.0, 259.0, 99.0, 78.0, 39.0, 19.0, 21.0, 16.0, 11.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6953125, -0.6786079406738281, -0.6619033813476562, -0.6451988220214844, -0.6284942626953125, -0.6117897033691406, -0.5950851440429688, -0.5783805847167969, -0.561676025390625, -0.5449714660644531, -0.5282669067382812, -0.5115623474121094, -0.4948577880859375, -0.4781532287597656, -0.46144866943359375, -0.4447441101074219, -0.42803955078125, -0.4113349914550781, -0.39463043212890625, -0.3779258728027344, -0.3612213134765625, -0.3445167541503906, -0.32781219482421875, -0.3111076354980469, -0.294403076171875, -0.2776985168457031, -0.26099395751953125, -0.24428939819335938, -0.2275848388671875, -0.21088027954101562, -0.19417572021484375, -0.17747116088867188, -0.1607666015625, -0.14406204223632812, -0.12735748291015625, -0.11065292358398438, -0.0939483642578125, -0.07724380493164062, -0.06053924560546875, -0.043834686279296875, -0.027130126953125, -0.010425567626953125, 0.00627899169921875, 0.022983551025390625, 0.0396881103515625, 0.056392669677734375, 0.07309722900390625, 0.08980178833007812, 0.10650634765625, 0.12321090698242188, 0.13991546630859375, 0.15662002563476562, 0.1733245849609375, 0.19002914428710938, 0.20673370361328125, 0.22343826293945312, 0.240142822265625, 0.2568473815917969, 0.27355194091796875, 0.2902565002441406, 0.3069610595703125, 0.3236656188964844, 0.34037017822265625, 0.3570747375488281, 0.373779296875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 5.0, 8.0, 10.0, 19.0, 33.0, 49.0, 176.0, 1176.0, 2175.0, 278.0, 73.0, 27.0, 19.0, 8.0, 3.0, 12.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.278076171875, -0.27230072021484375, -0.2665252685546875, -0.26074981689453125, -0.254974365234375, -0.24919891357421875, -0.2434234619140625, -0.23764801025390625, -0.23187255859375, -0.22609710693359375, -0.2203216552734375, -0.21454620361328125, -0.208770751953125, -0.20299530029296875, -0.1972198486328125, -0.19144439697265625, -0.1856689453125, -0.17989349365234375, -0.1741180419921875, -0.16834259033203125, -0.162567138671875, -0.15679168701171875, -0.1510162353515625, -0.14524078369140625, -0.13946533203125, -0.13368988037109375, -0.1279144287109375, -0.12213897705078125, -0.116363525390625, -0.11058807373046875, -0.1048126220703125, -0.09903717041015625, -0.09326171875, -0.08748626708984375, -0.0817108154296875, -0.07593536376953125, -0.070159912109375, -0.06438446044921875, -0.0586090087890625, -0.05283355712890625, -0.04705810546875, -0.04128265380859375, -0.0355072021484375, -0.02973175048828125, -0.023956298828125, -0.01818084716796875, -0.0124053955078125, -0.00662994384765625, -0.0008544921875, 0.00492095947265625, 0.0106964111328125, 0.01647186279296875, 0.022247314453125, 0.02802276611328125, 0.0337982177734375, 0.03957366943359375, 0.04534912109375, 0.05112457275390625, 0.0569000244140625, 0.06267547607421875, 0.068450927734375, 0.07422637939453125, 0.0800018310546875, 0.08577728271484375, 0.091552734375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 31.0, 783.0, 187.0, 8.0, 3.0, 1.0, 1.0], "bins": [-6.561384201049805, -6.449646949768066, -6.337910175323486, -6.226172924041748, -6.11443567276001, -6.0026984214782715, -5.890961647033691, -5.779224395751953, -5.667487144470215, -5.555749893188477, -5.4440131187438965, -5.332275867462158, -5.22053861618042, -5.108801364898682, -4.997064590454102, -4.885327339172363, -4.773590087890625, -4.661852836608887, -4.550116062164307, -4.438378810882568, -4.32664155960083, -4.214904308319092, -4.103167533874512, -3.9914302825927734, -3.8796932697296143, -3.767956256866455, -3.656219005584717, -3.5444819927215576, -3.4327447414398193, -3.32100772857666, -3.209270477294922, -3.0975334644317627, -2.9857962131500244, -2.8740592002868652, -2.762321949005127, -2.6505849361419678, -2.5388476848602295, -2.4271106719970703, -2.315373420715332, -2.203636407852173, -2.0918991565704346, -1.9801620244979858, -1.868424892425537, -1.7566877603530884, -1.6449506282806396, -1.5332136154174805, -1.4214763641357422, -1.309739351272583, -1.1980022192001343, -1.0862650871276855, -0.9745279550552368, -0.8627908229827881, -0.7510536909103394, -0.6393166184425354, -0.5275794863700867, -0.41584235429763794, -0.3041052222251892, -0.19236809015274048, -0.08063097298145294, 0.031106144189834595, 0.14284327626228333, 0.25458037853240967, 0.3663175106048584, 0.47805464267730713, 0.5897917747497559]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 4.0, 4.0, 11.0, 32.0, 45.0, 69.0, 96.0, 109.0, 124.0, 136.0, 117.0, 88.0, 72.0, 47.0, 21.0, 18.0, 7.0, 7.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7585063576698303, -0.734368622303009, -0.7102308869361877, -0.6860931515693665, -0.6619554162025452, -0.6378176808357239, -0.6136798858642578, -0.5895421504974365, -0.5654044151306152, -0.541266679763794, -0.5171289443969727, -0.49299120903015137, -0.4688534736633301, -0.4447157382965088, -0.4205779731273651, -0.3964402377605438, -0.3723025321960449, -0.34816479682922363, -0.32402706146240234, -0.29988932609558105, -0.27575159072875977, -0.2516138553619385, -0.2274760901927948, -0.2033383548259735, -0.17920061945915222, -0.15506288409233093, -0.13092514872550964, -0.10678739845752716, -0.08264966309070587, -0.05851192772388458, -0.0343741774559021, -0.01023644208908081, 0.013901233673095703, 0.03803897276520729, 0.06217671185731888, 0.08631445467472076, 0.11045219004154205, 0.13458992540836334, 0.15872767567634583, 0.18286541104316711, 0.2070031464099884, 0.2311408817768097, 0.255278617143631, 0.27941638231277466, 0.30355411767959595, 0.32769185304641724, 0.3518295884132385, 0.3759673237800598, 0.4001050591468811, 0.4242427945137024, 0.4483805298805237, 0.47251826524734497, 0.49665600061416626, 0.5207937359809875, 0.5449315309524536, 0.5690692663192749, 0.5932070016860962, 0.6173447370529175, 0.6414824724197388, 0.6656202077865601, 0.6897579431533813, 0.7138956785202026, 0.7380334138870239, 0.7621711492538452, 0.7863088846206665]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 2.0, 2.0, 5.0, 9.0, 4.0, 13.0, 17.0, 17.0, 22.0, 36.0, 54.0, 67.0, 126.0, 202.0, 340.0, 635.0, 1590.0, 5880.0, 34097.0, 386200.0, 559608.0, 48405.0, 7584.0, 1894.0, 741.0, 384.0, 204.0, 121.0, 84.0, 54.0, 42.0, 28.0, 24.0, 18.0, 17.0, 12.0, 13.0, 3.0, 0.0, 1.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1746826171875, -0.1671161651611328, -0.15954971313476562, -0.15198326110839844, -0.14441680908203125, -0.13685035705566406, -0.12928390502929688, -0.12171745300292969, -0.1141510009765625, -0.10658454895019531, -0.09901809692382812, -0.09145164489746094, -0.08388519287109375, -0.07631874084472656, -0.06875228881835938, -0.06118583679199219, -0.053619384765625, -0.04605293273925781, -0.038486480712890625, -0.030920028686523438, -0.02335357666015625, -0.015787124633789062, -0.008220672607421875, -0.0006542205810546875, 0.0069122314453125, 0.014478683471679688, 0.022045135498046875, 0.029611587524414062, 0.03717803955078125, 0.04474449157714844, 0.052310943603515625, 0.05987739562988281, 0.06744384765625, 0.07501029968261719, 0.08257675170898438, 0.09014320373535156, 0.09770965576171875, 0.10527610778808594, 0.11284255981445312, 0.12040901184082031, 0.1279754638671875, 0.1355419158935547, 0.14310836791992188, 0.15067481994628906, 0.15824127197265625, 0.16580772399902344, 0.17337417602539062, 0.1809406280517578, 0.188507080078125, 0.1960735321044922, 0.20363998413085938, 0.21120643615722656, 0.21877288818359375, 0.22633934020996094, 0.23390579223632812, 0.2414722442626953, 0.2490386962890625, 0.2566051483154297, 0.2641716003417969, 0.27173805236816406, 0.27930450439453125, 0.28687095642089844, 0.2944374084472656, 0.3020038604736328, 0.3095703125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 7.0, 6.0, 21.0, 36.0, 46.0, 70.0, 87.0, 111.0, 123.0, 131.0, 94.0, 83.0, 63.0, 53.0, 28.0, 26.0, 14.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.088623046875, -0.08660411834716797, -0.08458518981933594, -0.0825662612915039, -0.08054733276367188, -0.07852840423583984, -0.07650947570800781, -0.07449054718017578, -0.07247161865234375, -0.07045269012451172, -0.06843376159667969, -0.06641483306884766, -0.06439590454101562, -0.062376976013183594, -0.06035804748535156, -0.05833911895751953, -0.0563201904296875, -0.05430126190185547, -0.05228233337402344, -0.050263404846191406, -0.048244476318359375, -0.046225547790527344, -0.04420661926269531, -0.04218769073486328, -0.04016876220703125, -0.03814983367919922, -0.03613090515136719, -0.034111976623535156, -0.032093048095703125, -0.030074119567871094, -0.028055191040039062, -0.02603626251220703, -0.024017333984375, -0.02199840545654297, -0.019979476928710938, -0.017960548400878906, -0.015941619873046875, -0.013922691345214844, -0.011903762817382812, -0.009884834289550781, -0.00786590576171875, -0.005846977233886719, -0.0038280487060546875, -0.0018091201782226562, 0.000209808349609375, 0.0022287368774414062, 0.0042476654052734375, 0.006266593933105469, 0.0082855224609375, 0.010304450988769531, 0.012323379516601562, 0.014342308044433594, 0.016361236572265625, 0.018380165100097656, 0.020399093627929688, 0.02241802215576172, 0.02443695068359375, 0.02645587921142578, 0.028474807739257812, 0.030493736267089844, 0.032512664794921875, 0.034531593322753906, 0.03655052185058594, 0.03856945037841797, 0.04058837890625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 10.0, 9.0, 9.0, 13.0, 19.0, 38.0, 47.0, 65.0, 109.0, 175.0, 293.0, 461.0, 940.0, 1765.0, 3718.0, 8007.0, 18518.0, 47170.0, 139429.0, 363570.0, 299943.0, 101821.0, 35615.0, 14364.0, 6294.0, 2933.0, 1409.0, 752.0, 392.0, 244.0, 159.0, 74.0, 52.0, 38.0, 33.0, 20.0, 16.0, 12.0, 7.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0772705078125, -0.0748453140258789, -0.07242012023925781, -0.06999492645263672, -0.06756973266601562, -0.06514453887939453, -0.06271934509277344, -0.060294151306152344, -0.05786895751953125, -0.055443763732910156, -0.05301856994628906, -0.05059337615966797, -0.048168182373046875, -0.04574298858642578, -0.04331779479980469, -0.040892601013183594, -0.0384674072265625, -0.036042213439941406, -0.03361701965332031, -0.03119182586669922, -0.028766632080078125, -0.02634143829345703, -0.023916244506835938, -0.021491050720214844, -0.01906585693359375, -0.016640663146972656, -0.014215469360351562, -0.011790275573730469, -0.009365081787109375, -0.006939888000488281, -0.0045146942138671875, -0.0020895004272460938, 0.000335693359375, 0.0027608871459960938, 0.0051860809326171875, 0.007611274719238281, 0.010036468505859375, 0.012461662292480469, 0.014886856079101562, 0.017312049865722656, 0.01973724365234375, 0.022162437438964844, 0.024587631225585938, 0.02701282501220703, 0.029438018798828125, 0.03186321258544922, 0.03428840637207031, 0.036713600158691406, 0.0391387939453125, 0.041563987731933594, 0.04398918151855469, 0.04641437530517578, 0.048839569091796875, 0.05126476287841797, 0.05368995666503906, 0.056115150451660156, 0.05854034423828125, 0.060965538024902344, 0.06339073181152344, 0.06581592559814453, 0.06824111938476562, 0.07066631317138672, 0.07309150695800781, 0.0755167007446289, 0.07794189453125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 7.0, 2.0, 6.0, 3.0, 7.0, 9.0, 12.0, 11.0, 12.0, 35.0, 28.0, 37.0, 33.0, 34.0, 50.0, 37.0, 43.0, 49.0, 48.0, 51.0, 55.0, 51.0, 39.0, 35.0, 38.0, 41.0, 35.0, 36.0, 27.0, 23.0, 17.0, 19.0, 12.0, 13.0, 13.0, 12.0, 7.0, 3.0, 6.0, 7.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1005859375, -0.09694671630859375, -0.0933074951171875, -0.08966827392578125, -0.086029052734375, -0.08238983154296875, -0.0787506103515625, -0.07511138916015625, -0.07147216796875, -0.06783294677734375, -0.0641937255859375, -0.06055450439453125, -0.056915283203125, -0.05327606201171875, -0.0496368408203125, -0.04599761962890625, -0.0423583984375, -0.03871917724609375, -0.0350799560546875, -0.03144073486328125, -0.027801513671875, -0.02416229248046875, -0.0205230712890625, -0.01688385009765625, -0.01324462890625, -0.00960540771484375, -0.0059661865234375, -0.00232696533203125, 0.001312255859375, 0.00495147705078125, 0.0085906982421875, 0.01222991943359375, 0.015869140625, 0.01950836181640625, 0.0231475830078125, 0.02678680419921875, 0.030426025390625, 0.03406524658203125, 0.0377044677734375, 0.04134368896484375, 0.04498291015625, 0.04862213134765625, 0.0522613525390625, 0.05590057373046875, 0.059539794921875, 0.06317901611328125, 0.0668182373046875, 0.07045745849609375, 0.0740966796875, 0.07773590087890625, 0.0813751220703125, 0.08501434326171875, 0.088653564453125, 0.09229278564453125, 0.0959320068359375, 0.09957122802734375, 0.10321044921875, 0.10684967041015625, 0.1104888916015625, 0.11412811279296875, 0.117767333984375, 0.12140655517578125, 0.1250457763671875, 0.12868499755859375, 0.13232421875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 9.0, 14.0, 13.0, 15.0, 22.0, 42.0, 47.0, 89.0, 151.0, 238.0, 483.0, 1040.0, 2611.0, 9882.0, 73669.0, 592352.0, 328567.0, 30239.0, 5666.0, 1796.0, 700.0, 362.0, 221.0, 98.0, 82.0, 48.0, 33.0, 23.0, 13.0, 10.0, 7.0, 3.0, 6.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0574951171875, -0.055843353271484375, -0.05419158935546875, -0.052539825439453125, -0.0508880615234375, -0.049236297607421875, -0.04758453369140625, -0.045932769775390625, -0.044281005859375, -0.042629241943359375, -0.04097747802734375, -0.039325714111328125, -0.0376739501953125, -0.036022186279296875, -0.03437042236328125, -0.032718658447265625, -0.03106689453125, -0.029415130615234375, -0.02776336669921875, -0.026111602783203125, -0.0244598388671875, -0.022808074951171875, -0.02115631103515625, -0.019504547119140625, -0.017852783203125, -0.016201019287109375, -0.01454925537109375, -0.012897491455078125, -0.0112457275390625, -0.009593963623046875, -0.00794219970703125, -0.006290435791015625, -0.004638671875, -0.002986907958984375, -0.00133514404296875, 0.000316619873046875, 0.0019683837890625, 0.003620147705078125, 0.00527191162109375, 0.006923675537109375, 0.008575439453125, 0.010227203369140625, 0.01187896728515625, 0.013530731201171875, 0.0151824951171875, 0.016834259033203125, 0.01848602294921875, 0.020137786865234375, 0.02178955078125, 0.023441314697265625, 0.02509307861328125, 0.026744842529296875, 0.0283966064453125, 0.030048370361328125, 0.03170013427734375, 0.033351898193359375, 0.035003662109375, 0.036655426025390625, 0.03830718994140625, 0.039958953857421875, 0.0416107177734375, 0.043262481689453125, 0.04491424560546875, 0.046566009521484375, 0.0482177734375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 13.0, 15.0, 21.0, 28.0, 39.0, 58.0, 63.0, 84.0, 80.0, 58.0, 88.0, 81.0, 75.0, 73.0, 66.0, 45.0, 41.0, 23.0, 15.0, 9.0, 8.0, 9.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.417533874511719e-06, -9.123235940933228e-06, -8.828938007354736e-06, -8.534640073776245e-06, -8.240342140197754e-06, -7.946044206619263e-06, -7.651746273040771e-06, -7.35744833946228e-06, -7.063150405883789e-06, -6.768852472305298e-06, -6.474554538726807e-06, -6.1802566051483154e-06, -5.885958671569824e-06, -5.591660737991333e-06, -5.297362804412842e-06, -5.003064870834351e-06, -4.708766937255859e-06, -4.414469003677368e-06, -4.120171070098877e-06, -3.825873136520386e-06, -3.5315752029418945e-06, -3.2372772693634033e-06, -2.942979335784912e-06, -2.648681402206421e-06, -2.3543834686279297e-06, -2.0600855350494385e-06, -1.7657876014709473e-06, -1.471489667892456e-06, -1.1771917343139648e-06, -8.828938007354736e-07, -5.885958671569824e-07, -2.942979335784912e-07, 0.0, 2.942979335784912e-07, 5.885958671569824e-07, 8.828938007354736e-07, 1.1771917343139648e-06, 1.471489667892456e-06, 1.7657876014709473e-06, 2.0600855350494385e-06, 2.3543834686279297e-06, 2.648681402206421e-06, 2.942979335784912e-06, 3.2372772693634033e-06, 3.5315752029418945e-06, 3.825873136520386e-06, 4.120171070098877e-06, 4.414469003677368e-06, 4.708766937255859e-06, 5.003064870834351e-06, 5.297362804412842e-06, 5.591660737991333e-06, 5.885958671569824e-06, 6.1802566051483154e-06, 6.474554538726807e-06, 6.768852472305298e-06, 7.063150405883789e-06, 7.35744833946228e-06, 7.651746273040771e-06, 7.946044206619263e-06, 8.240342140197754e-06, 8.534640073776245e-06, 8.828938007354736e-06, 9.123235940933228e-06, 9.417533874511719e-06]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 5.0, 10.0, 6.0, 15.0, 20.0, 35.0, 46.0, 79.0, 133.0, 240.0, 380.0, 740.0, 1671.0, 4108.0, 13248.0, 64650.0, 353493.0, 472087.0, 107608.0, 19953.0, 5762.0, 2097.0, 975.0, 482.0, 245.0, 168.0, 107.0, 63.0, 41.0, 26.0, 15.0, 15.0, 6.0, 6.0, 6.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0], "bins": [-0.0389404296875, -0.03783226013183594, -0.036724090576171875, -0.03561592102050781, -0.03450775146484375, -0.03339958190917969, -0.032291412353515625, -0.031183242797851562, -0.0300750732421875, -0.028966903686523438, -0.027858734130859375, -0.026750564575195312, -0.02564239501953125, -0.024534225463867188, -0.023426055908203125, -0.022317886352539062, -0.021209716796875, -0.020101547241210938, -0.018993377685546875, -0.017885208129882812, -0.01677703857421875, -0.015668869018554688, -0.014560699462890625, -0.013452529907226562, -0.0123443603515625, -0.011236190795898438, -0.010128021240234375, -0.009019851684570312, -0.00791168212890625, -0.0068035125732421875, -0.005695343017578125, -0.0045871734619140625, -0.00347900390625, -0.0023708343505859375, -0.001262664794921875, -0.0001544952392578125, 0.00095367431640625, 0.0020618438720703125, 0.003170013427734375, 0.0042781829833984375, 0.0053863525390625, 0.0064945220947265625, 0.007602691650390625, 0.008710861206054688, 0.00981903076171875, 0.010927200317382812, 0.012035369873046875, 0.013143539428710938, 0.014251708984375, 0.015359878540039062, 0.016468048095703125, 0.017576217651367188, 0.01868438720703125, 0.019792556762695312, 0.020900726318359375, 0.022008895874023438, 0.0231170654296875, 0.024225234985351562, 0.025333404541015625, 0.026441574096679688, 0.02754974365234375, 0.028657913208007812, 0.029766082763671875, 0.030874252319335938, 0.031982421875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 3.0, 3.0, 10.0, 9.0, 16.0, 13.0, 27.0, 36.0, 49.0, 95.0, 97.0, 127.0, 134.0, 103.0, 89.0, 62.0, 46.0, 26.0, 19.0, 13.0, 9.0, 7.0, 3.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.053192138671875, -0.051363468170166016, -0.04953479766845703, -0.04770612716674805, -0.04587745666503906, -0.04404878616333008, -0.042220115661621094, -0.04039144515991211, -0.038562774658203125, -0.03673410415649414, -0.034905433654785156, -0.03307676315307617, -0.031248092651367188, -0.029419422149658203, -0.02759075164794922, -0.025762081146240234, -0.02393341064453125, -0.022104740142822266, -0.02027606964111328, -0.018447399139404297, -0.016618728637695312, -0.014790058135986328, -0.012961387634277344, -0.01113271713256836, -0.009304046630859375, -0.007475376129150391, -0.005646705627441406, -0.003818035125732422, -0.0019893646240234375, -0.00016069412231445312, 0.0016679763793945312, 0.0034966468811035156, 0.0053253173828125, 0.007153987884521484, 0.008982658386230469, 0.010811328887939453, 0.012639999389648438, 0.014468669891357422, 0.016297340393066406, 0.01812601089477539, 0.019954681396484375, 0.02178335189819336, 0.023612022399902344, 0.025440692901611328, 0.027269363403320312, 0.029098033905029297, 0.03092670440673828, 0.032755374908447266, 0.03458404541015625, 0.036412715911865234, 0.03824138641357422, 0.0400700569152832, 0.04189872741699219, 0.04372739791870117, 0.045556068420410156, 0.04738473892211914, 0.049213409423828125, 0.05104207992553711, 0.052870750427246094, 0.05469942092895508, 0.05652809143066406, 0.05835676193237305, 0.06018543243408203, 0.062014102935791016, 0.0638427734375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 7.0, 7.0, 16.0, 24.0, 74.0, 134.0, 191.0, 223.0, 151.0, 93.0, 40.0, 18.0, 7.0, 7.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7173994779586792, -0.6877219080924988, -0.6580443382263184, -0.6283667683601379, -0.5986891984939575, -0.5690116882324219, -0.5393341183662415, -0.509656548500061, -0.4799789786338806, -0.4503014087677002, -0.4206238389015198, -0.39094629883766174, -0.3612687289714813, -0.3315911591053009, -0.30191361904144287, -0.27223604917526245, -0.24255847930908203, -0.2128809094429016, -0.18320335447788239, -0.15352579951286316, -0.12384822964668274, -0.09417065978050232, -0.0644931048154831, -0.03481554985046387, -0.005137979984283447, 0.024539582431316376, 0.0542171448469162, 0.08389470726251602, 0.11357226967811584, 0.14324983954429626, 0.1729273945093155, 0.20260494947433472, 0.23228251934051514, 0.26196008920669556, 0.291637659072876, 0.321315199136734, 0.35099276900291443, 0.38067033886909485, 0.4103478789329529, 0.4400254487991333, 0.4697030186653137, 0.49938058853149414, 0.5290581583976746, 0.558735728263855, 0.5884132385253906, 0.6180908679962158, 0.6477683782577515, 0.6774459481239319, 0.7071235179901123, 0.7368010878562927, 0.7664786577224731, 0.7961562275886536, 0.825833797454834, 0.8555113077163696, 0.88518887758255, 0.9148664474487305, 0.9445440173149109, 0.9742215871810913, 1.003899097442627, 1.0335767269134521, 1.0632542371749878, 1.092931866645813, 1.1226093769073486, 1.1522870063781738, 1.1819645166397095]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 16.0, 10.0, 4.0, 13.0, 16.0, 18.0, 20.0, 31.0, 34.0, 32.0, 50.0, 44.0, 44.0, 47.0, 49.0, 46.0, 68.0, 54.0, 60.0, 42.0, 46.0, 44.0, 31.0, 33.0, 31.0, 29.0, 19.0, 12.0, 14.0, 11.0, 10.0, 10.0, 5.0, 1.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.629010021686554, -0.6050156354904175, -0.5810211896896362, -0.557026743888855, -0.5330323576927185, -0.509037971496582, -0.4850435256958008, -0.4610491096973419, -0.43705469369888306, -0.4130602777004242, -0.38906586170196533, -0.36507144570350647, -0.3410770297050476, -0.31708261370658875, -0.2930881977081299, -0.269093781709671, -0.24509936571121216, -0.2211049497127533, -0.19711053371429443, -0.17311611771583557, -0.1491217017173767, -0.12512728571891785, -0.10113286972045898, -0.07713845372200012, -0.05314403772354126, -0.029149621725082397, -0.005155205726623535, 0.018839210271835327, 0.04283362627029419, 0.06682804226875305, 0.09082245826721191, 0.11481687426567078, 0.13881123065948486, 0.16280564665794373, 0.1868000626564026, 0.21079447865486145, 0.2347888946533203, 0.2587833106517792, 0.28277772665023804, 0.3067721426486969, 0.33076655864715576, 0.3547609746456146, 0.3787553906440735, 0.40274980664253235, 0.4267442226409912, 0.4507386386394501, 0.47473305463790894, 0.4987274706363678, 0.5227218866348267, 0.5467163324356079, 0.5707107186317444, 0.5947051048278809, 0.6186995506286621, 0.6426939964294434, 0.6666883826255798, 0.6906827688217163, 0.7146772146224976, 0.7386716604232788, 0.7626660466194153, 0.7866604328155518, 0.810654878616333, 0.8346493244171143, 0.8586437106132507, 0.8826380968093872, 0.9066325426101685]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 9.0, 4.0, 4.0, 9.0, 14.0, 14.0, 29.0, 36.0, 50.0, 83.0, 126.0, 248.0, 501.0, 1354.0, 4955.0, 34704.0, 3490197.0, 637461.0, 19809.0, 3273.0, 883.0, 298.0, 117.0, 53.0, 18.0, 17.0, 12.0, 4.0, 2.0, 2.0], "bins": [-0.322509765625, -0.31617069244384766, -0.3098316192626953, -0.30349254608154297, -0.2971534729003906, -0.2908143997192383, -0.28447532653808594, -0.2781362533569336, -0.27179718017578125, -0.2654581069946289, -0.25911903381347656, -0.2527799606323242, -0.24644088745117188, -0.24010181427001953, -0.2337627410888672, -0.22742366790771484, -0.2210845947265625, -0.21474552154541016, -0.2084064483642578, -0.20206737518310547, -0.19572830200195312, -0.18938922882080078, -0.18305015563964844, -0.1767110824584961, -0.17037200927734375, -0.1640329360961914, -0.15769386291503906, -0.15135478973388672, -0.14501571655273438, -0.13867664337158203, -0.1323375701904297, -0.12599849700927734, -0.119659423828125, -0.11332035064697266, -0.10698127746582031, -0.10064220428466797, -0.09430313110351562, -0.08796405792236328, -0.08162498474121094, -0.0752859115600586, -0.06894683837890625, -0.0626077651977539, -0.05626869201660156, -0.04992961883544922, -0.043590545654296875, -0.03725147247314453, -0.030912399291992188, -0.024573326110839844, -0.0182342529296875, -0.011895179748535156, -0.0055561065673828125, 0.0007829666137695312, 0.007122039794921875, 0.013461112976074219, 0.019800186157226562, 0.026139259338378906, 0.03247833251953125, 0.038817405700683594, 0.04515647888183594, 0.05149555206298828, 0.057834625244140625, 0.06417369842529297, 0.07051277160644531, 0.07685184478759766, 0.08319091796875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 12.0, 9.0, 25.0, 38.0, 54.0, 55.0, 90.0, 97.0, 92.0, 116.0, 108.0, 80.0, 79.0, 57.0, 32.0, 24.0, 14.0, 4.0, 10.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0831298828125, -0.08119583129882812, -0.07926177978515625, -0.07732772827148438, -0.0753936767578125, -0.07345962524414062, -0.07152557373046875, -0.06959152221679688, -0.067657470703125, -0.06572341918945312, -0.06378936767578125, -0.061855316162109375, -0.0599212646484375, -0.057987213134765625, -0.05605316162109375, -0.054119110107421875, -0.05218505859375, -0.050251007080078125, -0.04831695556640625, -0.046382904052734375, -0.0444488525390625, -0.042514801025390625, -0.04058074951171875, -0.038646697998046875, -0.036712646484375, -0.034778594970703125, -0.03284454345703125, -0.030910491943359375, -0.0289764404296875, -0.027042388916015625, -0.02510833740234375, -0.023174285888671875, -0.021240234375, -0.019306182861328125, -0.01737213134765625, -0.015438079833984375, -0.0135040283203125, -0.011569976806640625, -0.00963592529296875, -0.007701873779296875, -0.005767822265625, -0.003833770751953125, -0.00189971923828125, 3.4332275390625e-05, 0.0019683837890625, 0.003902435302734375, 0.00583648681640625, 0.007770538330078125, 0.00970458984375, 0.011638641357421875, 0.01357269287109375, 0.015506744384765625, 0.0174407958984375, 0.019374847412109375, 0.02130889892578125, 0.023242950439453125, 0.025177001953125, 0.027111053466796875, 0.02904510498046875, 0.030979156494140625, 0.0329132080078125, 0.034847259521484375, 0.03678131103515625, 0.038715362548828125, 0.0406494140625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 1.0, 4.0, 6.0, 5.0, 5.0, 18.0, 21.0, 37.0, 50.0, 89.0, 140.0, 331.0, 1241.0, 11421.0, 3831038.0, 342965.0, 5270.0, 855.0, 331.0, 166.0, 98.0, 58.0, 34.0, 29.0, 16.0, 22.0, 14.0, 5.0, 9.0, 2.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3798828125, -0.3703479766845703, -0.3608131408691406, -0.35127830505371094, -0.34174346923828125, -0.33220863342285156, -0.3226737976074219, -0.3131389617919922, -0.3036041259765625, -0.2940692901611328, -0.2845344543457031, -0.27499961853027344, -0.26546478271484375, -0.25592994689941406, -0.24639511108398438, -0.2368602752685547, -0.227325439453125, -0.2177906036376953, -0.20825576782226562, -0.19872093200683594, -0.18918609619140625, -0.17965126037597656, -0.17011642456054688, -0.1605815887451172, -0.1510467529296875, -0.1415119171142578, -0.13197708129882812, -0.12244224548339844, -0.11290740966796875, -0.10337257385253906, -0.09383773803710938, -0.08430290222167969, -0.07476806640625, -0.06523323059082031, -0.055698394775390625, -0.04616355895996094, -0.03662872314453125, -0.027093887329101562, -0.017559051513671875, -0.008024215698242188, 0.0015106201171875, 0.011045455932617188, 0.020580291748046875, 0.030115127563476562, 0.03964996337890625, 0.04918479919433594, 0.058719635009765625, 0.06825447082519531, 0.077789306640625, 0.08732414245605469, 0.09685897827148438, 0.10639381408691406, 0.11592864990234375, 0.12546348571777344, 0.13499832153320312, 0.1445331573486328, 0.1540679931640625, 0.1636028289794922, 0.17313766479492188, 0.18267250061035156, 0.19220733642578125, 0.20174217224121094, 0.21127700805664062, 0.2208118438720703, 0.2303466796875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 10.0, 32.0, 119.0, 978.0, 2522.0, 303.0, 67.0, 26.0, 10.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042755126953125, -0.03856801986694336, -0.03438091278076172, -0.030193805694580078, -0.026006698608398438, -0.021819591522216797, -0.017632484436035156, -0.013445377349853516, -0.009258270263671875, -0.005071163177490234, -0.0008840560913085938, 0.003303050994873047, 0.0074901580810546875, 0.011677265167236328, 0.01586437225341797, 0.02005147933959961, 0.02423858642578125, 0.02842569351196289, 0.03261280059814453, 0.03679990768432617, 0.04098701477050781, 0.04517412185668945, 0.049361228942871094, 0.053548336029052734, 0.057735443115234375, 0.061922550201416016, 0.06610965728759766, 0.0702967643737793, 0.07448387145996094, 0.07867097854614258, 0.08285808563232422, 0.08704519271850586, 0.0912322998046875, 0.09541940689086914, 0.09960651397705078, 0.10379362106323242, 0.10798072814941406, 0.1121678352355957, 0.11635494232177734, 0.12054204940795898, 0.12472915649414062, 0.12891626358032227, 0.1331033706665039, 0.13729047775268555, 0.1414775848388672, 0.14566469192504883, 0.14985179901123047, 0.1540389060974121, 0.15822601318359375, 0.1624131202697754, 0.16660022735595703, 0.17078733444213867, 0.1749744415283203, 0.17916154861450195, 0.1833486557006836, 0.18753576278686523, 0.19172286987304688, 0.19590997695922852, 0.20009708404541016, 0.2042841911315918, 0.20847129821777344, 0.21265840530395508, 0.21684551239013672, 0.22103261947631836, 0.2252197265625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 8.0, 152.0, 800.0, 39.0, 12.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9105702638626099, -1.849501609802246, -1.7884328365325928, -1.727364182472229, -1.6662955284118652, -1.605226755142212, -1.5441581010818481, -1.4830894470214844, -1.422020673751831, -1.3609520196914673, -1.299883246421814, -1.2388145923614502, -1.1777459383010864, -1.116677165031433, -1.0556085109710693, -0.9945397973060608, -0.933471143245697, -0.8724024295806885, -0.8113337755203247, -0.7502650618553162, -0.6891963481903076, -0.6281276941299438, -0.5670589804649353, -0.5059902667999268, -0.4449215829372406, -0.38385289907455444, -0.3227841854095459, -0.26171550154685974, -0.2006468027830124, -0.13957810401916504, -0.07850942015647888, -0.017440706491470337, 0.04362797737121582, 0.10469667613506317, 0.16576537489891052, 0.22683405876159668, 0.2879027724266052, 0.3489714562892914, 0.41004014015197754, 0.4711088538169861, 0.5321775674819946, 0.5932462811470032, 0.6543149352073669, 0.7153836488723755, 0.776452362537384, 0.8375210762023926, 0.8985897302627563, 0.9596584439277649, 1.0207271575927734, 1.0817958116531372, 1.1428645849227905, 1.2039332389831543, 1.265001893043518, 1.3260706663131714, 1.3871393203735352, 1.4482080936431885, 1.5092766284942627, 1.5703452825546265, 1.6314140558242798, 1.6924827098846436, 1.7535513639450073, 1.8146201372146606, 1.8756887912750244, 1.9367575645446777, 1.9978262186050415]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 8.0, 28.0, 41.0, 88.0, 126.0, 167.0, 168.0, 166.0, 89.0, 72.0, 29.0, 16.0, 8.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6750929355621338, -0.6541709303855896, -0.6332489252090454, -0.6123268604278564, -0.5914048552513123, -0.5704828500747681, -0.5495608448982239, -0.5286388397216797, -0.5077167749404907, -0.48679476976394653, -0.46587273478507996, -0.44495072960853577, -0.4240286946296692, -0.403106689453125, -0.3821846842765808, -0.3612626791000366, -0.34034067392349243, -0.31941866874694824, -0.29849663376808167, -0.2775746285915375, -0.2566525936126709, -0.2357305884361267, -0.21480858325958252, -0.19388656318187714, -0.17296454310417175, -0.15204252302646637, -0.131120502948761, -0.1101984977722168, -0.08927647769451141, -0.06835445761680603, -0.04743245244026184, -0.026510432362556458, -0.00558847188949585, 0.015333544462919235, 0.03625556081533432, 0.057177573442459106, 0.07809959352016449, 0.09902161359786987, 0.11994361877441406, 0.14086563885211945, 0.16178765892982483, 0.1827096790075302, 0.2036316990852356, 0.22455370426177979, 0.24547572433948517, 0.26639774441719055, 0.28731974959373474, 0.3082417845726013, 0.3291637897491455, 0.3500857949256897, 0.3710078299045563, 0.39192983508110046, 0.41285187005996704, 0.43377387523651123, 0.4546958804130554, 0.4756178855895996, 0.4965399205684662, 0.5174619555473328, 0.538383960723877, 0.5593059659004211, 0.5802279710769653, 0.6011500358581543, 0.6220719814300537, 0.6429940462112427, 0.6639160513877869]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 7.0, 8.0, 6.0, 5.0, 9.0, 15.0, 24.0, 29.0, 32.0, 47.0, 82.0, 103.0, 123.0, 242.0, 355.0, 669.0, 1348.0, 2952.0, 8601.0, 31620.0, 148403.0, 513347.0, 264232.0, 54548.0, 13527.0, 4243.0, 1798.0, 855.0, 493.0, 260.0, 158.0, 113.0, 86.0, 54.0, 45.0, 35.0, 24.0, 15.0, 10.0, 8.0, 8.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1392822265625, -0.1351470947265625, -0.131011962890625, -0.1268768310546875, -0.12274169921875, -0.1186065673828125, -0.114471435546875, -0.1103363037109375, -0.106201171875, -0.1020660400390625, -0.097930908203125, -0.0937957763671875, -0.08966064453125, -0.0855255126953125, -0.081390380859375, -0.0772552490234375, -0.0731201171875, -0.0689849853515625, -0.064849853515625, -0.0607147216796875, -0.05657958984375, -0.0524444580078125, -0.048309326171875, -0.0441741943359375, -0.0400390625, -0.0359039306640625, -0.031768798828125, -0.0276336669921875, -0.02349853515625, -0.0193634033203125, -0.015228271484375, -0.0110931396484375, -0.0069580078125, -0.0028228759765625, 0.001312255859375, 0.0054473876953125, 0.00958251953125, 0.0137176513671875, 0.017852783203125, 0.0219879150390625, 0.026123046875, 0.0302581787109375, 0.034393310546875, 0.0385284423828125, 0.04266357421875, 0.0467987060546875, 0.050933837890625, 0.0550689697265625, 0.0592041015625, 0.0633392333984375, 0.067474365234375, 0.0716094970703125, 0.07574462890625, 0.0798797607421875, 0.084014892578125, 0.0881500244140625, 0.09228515625, 0.0964202880859375, 0.100555419921875, 0.1046905517578125, 0.10882568359375, 0.1129608154296875, 0.117095947265625, 0.1212310791015625, 0.1253662109375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 0.0, 3.0, 0.0, 6.0, 7.0, 13.0, 13.0, 24.0, 36.0, 50.0, 60.0, 71.0, 85.0, 101.0, 94.0, 92.0, 84.0, 59.0, 75.0, 47.0, 28.0, 21.0, 16.0, 14.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06585693359375, -0.0641789436340332, -0.0625009536743164, -0.06082296371459961, -0.05914497375488281, -0.057466983795166016, -0.05578899383544922, -0.05411100387573242, -0.052433013916015625, -0.05075502395629883, -0.04907703399658203, -0.047399044036865234, -0.04572105407714844, -0.04404306411743164, -0.042365074157714844, -0.04068708419799805, -0.03900909423828125, -0.03733110427856445, -0.035653114318847656, -0.03397512435913086, -0.03229713439941406, -0.030619144439697266, -0.02894115447998047, -0.027263164520263672, -0.025585174560546875, -0.023907184600830078, -0.02222919464111328, -0.020551204681396484, -0.018873214721679688, -0.01719522476196289, -0.015517234802246094, -0.013839244842529297, -0.0121612548828125, -0.010483264923095703, -0.008805274963378906, -0.007127285003662109, -0.0054492950439453125, -0.0037713050842285156, -0.0020933151245117188, -0.0004153251647949219, 0.001262664794921875, 0.002940654754638672, 0.004618644714355469, 0.006296634674072266, 0.007974624633789062, 0.00965261459350586, 0.011330604553222656, 0.013008594512939453, 0.01468658447265625, 0.016364574432373047, 0.018042564392089844, 0.01972055435180664, 0.021398544311523438, 0.023076534271240234, 0.02475452423095703, 0.026432514190673828, 0.028110504150390625, 0.029788494110107422, 0.03146648406982422, 0.033144474029541016, 0.03482246398925781, 0.03650045394897461, 0.038178443908691406, 0.0398564338684082, 0.041534423828125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 12.0, 7.0, 18.0, 19.0, 18.0, 37.0, 50.0, 61.0, 119.0, 139.0, 268.0, 408.0, 703.0, 1337.0, 2589.0, 5446.0, 11695.0, 27457.0, 72203.0, 208172.0, 372300.0, 216106.0, 76640.0, 28659.0, 12236.0, 5720.0, 2750.0, 1408.0, 756.0, 436.0, 263.0, 173.0, 102.0, 67.0, 51.0, 32.0, 25.0, 17.0, 9.0, 11.0, 8.0, 7.0, 3.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.068359375, -0.06625747680664062, -0.06415557861328125, -0.062053680419921875, -0.0599517822265625, -0.057849884033203125, -0.05574798583984375, -0.053646087646484375, -0.051544189453125, -0.049442291259765625, -0.04734039306640625, -0.045238494873046875, -0.0431365966796875, -0.041034698486328125, -0.03893280029296875, -0.036830902099609375, -0.03472900390625, -0.032627105712890625, -0.03052520751953125, -0.028423309326171875, -0.0263214111328125, -0.024219512939453125, -0.02211761474609375, -0.020015716552734375, -0.017913818359375, -0.015811920166015625, -0.01371002197265625, -0.011608123779296875, -0.0095062255859375, -0.007404327392578125, -0.00530242919921875, -0.003200531005859375, -0.0010986328125, 0.001003265380859375, 0.00310516357421875, 0.005207061767578125, 0.0073089599609375, 0.009410858154296875, 0.01151275634765625, 0.013614654541015625, 0.015716552734375, 0.017818450927734375, 0.01992034912109375, 0.022022247314453125, 0.0241241455078125, 0.026226043701171875, 0.02832794189453125, 0.030429840087890625, 0.03253173828125, 0.034633636474609375, 0.03673553466796875, 0.038837432861328125, 0.0409393310546875, 0.043041229248046875, 0.04514312744140625, 0.047245025634765625, 0.049346923828125, 0.051448822021484375, 0.05355072021484375, 0.055652618408203125, 0.0577545166015625, 0.059856414794921875, 0.06195831298828125, 0.06406021118164062, 0.066162109375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 1.0, 4.0, 7.0, 4.0, 14.0, 17.0, 6.0, 13.0, 11.0, 16.0, 13.0, 16.0, 28.0, 32.0, 34.0, 39.0, 29.0, 42.0, 36.0, 37.0, 35.0, 43.0, 37.0, 35.0, 38.0, 38.0, 34.0, 42.0, 27.0, 28.0, 42.0, 31.0, 22.0, 18.0, 18.0, 18.0, 24.0, 13.0, 9.0, 8.0, 5.0, 9.0, 4.0, 4.0, 9.0, 5.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.10272216796875, -0.09973907470703125, -0.0967559814453125, -0.09377288818359375, -0.090789794921875, -0.08780670166015625, -0.0848236083984375, -0.08184051513671875, -0.078857421875, -0.07587432861328125, -0.0728912353515625, -0.06990814208984375, -0.066925048828125, -0.06394195556640625, -0.0609588623046875, -0.05797576904296875, -0.05499267578125, -0.05200958251953125, -0.0490264892578125, -0.04604339599609375, -0.043060302734375, -0.04007720947265625, -0.0370941162109375, -0.03411102294921875, -0.0311279296875, -0.02814483642578125, -0.0251617431640625, -0.02217864990234375, -0.019195556640625, -0.01621246337890625, -0.0132293701171875, -0.01024627685546875, -0.00726318359375, -0.00428009033203125, -0.0012969970703125, 0.00168609619140625, 0.004669189453125, 0.00765228271484375, 0.0106353759765625, 0.01361846923828125, 0.0166015625, 0.01958465576171875, 0.0225677490234375, 0.02555084228515625, 0.028533935546875, 0.03151702880859375, 0.0345001220703125, 0.03748321533203125, 0.04046630859375, 0.04344940185546875, 0.0464324951171875, 0.04941558837890625, 0.052398681640625, 0.05538177490234375, 0.0583648681640625, 0.06134796142578125, 0.0643310546875, 0.06731414794921875, 0.0702972412109375, 0.07328033447265625, 0.076263427734375, 0.07924652099609375, 0.0822296142578125, 0.08521270751953125, 0.08819580078125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 3.0, 10.0, 11.0, 18.0, 25.0, 35.0, 75.0, 107.0, 171.0, 344.0, 728.0, 1893.0, 7447.0, 62084.0, 610619.0, 332688.0, 25579.0, 4269.0, 1289.0, 510.0, 274.0, 124.0, 86.0, 49.0, 36.0, 20.0, 19.0, 12.0, 7.0, 7.0, 2.0, 2.0, 3.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.046051025390625, -0.04433393478393555, -0.042616844177246094, -0.04089975357055664, -0.03918266296386719, -0.037465572357177734, -0.03574848175048828, -0.03403139114379883, -0.032314300537109375, -0.030597209930419922, -0.02888011932373047, -0.027163028717041016, -0.025445938110351562, -0.02372884750366211, -0.022011756896972656, -0.020294666290283203, -0.01857757568359375, -0.016860485076904297, -0.015143394470214844, -0.01342630386352539, -0.011709213256835938, -0.009992122650146484, -0.008275032043457031, -0.006557941436767578, -0.004840850830078125, -0.003123760223388672, -0.0014066696166992188, 0.0003104209899902344, 0.0020275115966796875, 0.0037446022033691406, 0.005461692810058594, 0.007178783416748047, 0.0088958740234375, 0.010612964630126953, 0.012330055236816406, 0.01404714584350586, 0.015764236450195312, 0.017481327056884766, 0.01919841766357422, 0.020915508270263672, 0.022632598876953125, 0.024349689483642578, 0.02606678009033203, 0.027783870697021484, 0.029500961303710938, 0.03121805191040039, 0.032935142517089844, 0.0346522331237793, 0.03636932373046875, 0.0380864143371582, 0.039803504943847656, 0.04152059555053711, 0.04323768615722656, 0.044954776763916016, 0.04667186737060547, 0.04838895797729492, 0.050106048583984375, 0.05182313919067383, 0.05354022979736328, 0.055257320404052734, 0.05697441101074219, 0.05869150161743164, 0.060408592224121094, 0.06212568283081055, 0.0638427734375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 13.0, 13.0, 20.0, 24.0, 31.0, 37.0, 36.0, 49.0, 58.0, 65.0, 66.0, 65.0, 70.0, 79.0, 57.0, 52.0, 30.0, 41.0, 48.0, 33.0, 24.0, 21.0, 16.0, 14.0, 7.0, 5.0, 11.0, 4.0, 6.0, 1.0, 2.0, 1.0, 4.0], "bins": [-1.0371208190917969e-05, -1.013185828924179e-05, -9.892508387565613e-06, -9.653158485889435e-06, -9.413808584213257e-06, -9.174458682537079e-06, -8.935108780860901e-06, -8.695758879184723e-06, -8.456408977508545e-06, -8.217059075832367e-06, -7.977709174156189e-06, -7.738359272480011e-06, -7.499009370803833e-06, -7.259659469127655e-06, -7.020309567451477e-06, -6.780959665775299e-06, -6.541609764099121e-06, -6.302259862422943e-06, -6.062909960746765e-06, -5.823560059070587e-06, -5.584210157394409e-06, -5.344860255718231e-06, -5.105510354042053e-06, -4.866160452365875e-06, -4.626810550689697e-06, -4.387460649013519e-06, -4.148110747337341e-06, -3.908760845661163e-06, -3.6694109439849854e-06, -3.4300610423088074e-06, -3.1907111406326294e-06, -2.9513612389564514e-06, -2.7120113372802734e-06, -2.4726614356040955e-06, -2.2333115339279175e-06, -1.9939616322517395e-06, -1.7546117305755615e-06, -1.5152618288993835e-06, -1.2759119272232056e-06, -1.0365620255470276e-06, -7.972121238708496e-07, -5.578622221946716e-07, -3.1851232051849365e-07, -7.916241884231567e-08, 1.601874828338623e-07, 3.995373845100403e-07, 6.388872861862183e-07, 8.782371878623962e-07, 1.1175870895385742e-06, 1.3569369912147522e-06, 1.5962868928909302e-06, 1.8356367945671082e-06, 2.074986696243286e-06, 2.314336597919464e-06, 2.553686499595642e-06, 2.79303640127182e-06, 3.032386302947998e-06, 3.271736204624176e-06, 3.511086106300354e-06, 3.750436007976532e-06, 3.98978590965271e-06, 4.229135811328888e-06, 4.468485713005066e-06, 4.707835614681244e-06, 4.947185516357422e-06]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 7.0, 13.0, 16.0, 26.0, 33.0, 69.0, 136.0, 322.0, 1009.0, 4877.0, 76043.0, 833000.0, 124570.0, 6564.0, 1201.0, 371.0, 133.0, 78.0, 37.0, 18.0, 15.0, 13.0, 5.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0660400390625, -0.06380653381347656, -0.061573028564453125, -0.05933952331542969, -0.05710601806640625, -0.05487251281738281, -0.052639007568359375, -0.05040550231933594, -0.0481719970703125, -0.04593849182128906, -0.043704986572265625, -0.04147148132324219, -0.03923797607421875, -0.03700447082519531, -0.034770965576171875, -0.03253746032714844, -0.030303955078125, -0.028070449829101562, -0.025836944580078125, -0.023603439331054688, -0.02136993408203125, -0.019136428833007812, -0.016902923583984375, -0.014669418334960938, -0.0124359130859375, -0.010202407836914062, -0.007968902587890625, -0.0057353973388671875, -0.00350189208984375, -0.0012683868408203125, 0.000965118408203125, 0.0031986236572265625, 0.00543212890625, 0.0076656341552734375, 0.009899139404296875, 0.012132644653320312, 0.01436614990234375, 0.016599655151367188, 0.018833160400390625, 0.021066665649414062, 0.0233001708984375, 0.025533676147460938, 0.027767181396484375, 0.030000686645507812, 0.03223419189453125, 0.03446769714355469, 0.036701202392578125, 0.03893470764160156, 0.041168212890625, 0.04340171813964844, 0.045635223388671875, 0.04786872863769531, 0.05010223388671875, 0.05233573913574219, 0.054569244384765625, 0.05680274963378906, 0.0590362548828125, 0.06126976013183594, 0.06350326538085938, 0.06573677062988281, 0.06797027587890625, 0.07020378112792969, 0.07243728637695312, 0.07467079162597656, 0.076904296875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 13.0, 13.0, 18.0, 28.0, 20.0, 50.0, 53.0, 55.0, 73.0, 117.0, 81.0, 101.0, 70.0, 69.0, 54.0, 52.0, 38.0, 20.0, 27.0, 12.0, 6.0, 3.0, 7.0, 7.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.040069580078125, -0.03880500793457031, -0.037540435791015625, -0.03627586364746094, -0.03501129150390625, -0.03374671936035156, -0.032482147216796875, -0.031217575073242188, -0.0299530029296875, -0.028688430786132812, -0.027423858642578125, -0.026159286499023438, -0.02489471435546875, -0.023630142211914062, -0.022365570068359375, -0.021100997924804688, -0.01983642578125, -0.018571853637695312, -0.017307281494140625, -0.016042709350585938, -0.01477813720703125, -0.013513565063476562, -0.012248992919921875, -0.010984420776367188, -0.0097198486328125, -0.008455276489257812, -0.007190704345703125, -0.0059261322021484375, -0.00466156005859375, -0.0033969879150390625, -0.002132415771484375, -0.0008678436279296875, 0.000396728515625, 0.0016613006591796875, 0.002925872802734375, 0.0041904449462890625, 0.00545501708984375, 0.0067195892333984375, 0.007984161376953125, 0.009248733520507812, 0.0105133056640625, 0.011777877807617188, 0.013042449951171875, 0.014307022094726562, 0.01557159423828125, 0.016836166381835938, 0.018100738525390625, 0.019365310668945312, 0.0206298828125, 0.021894454956054688, 0.023159027099609375, 0.024423599243164062, 0.02568817138671875, 0.026952743530273438, 0.028217315673828125, 0.029481887817382812, 0.0307464599609375, 0.03201103210449219, 0.033275604248046875, 0.03454017639160156, 0.03580474853515625, 0.03706932067871094, 0.038333892822265625, 0.03959846496582031, 0.040863037109375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 14.0, 53.0, 181.0, 472.0, 215.0, 50.0, 15.0, 6.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.0180654525756836, -2.9595415592193604, -2.901017904281616, -2.842494010925293, -2.783970355987549, -2.7254464626312256, -2.6669225692749023, -2.608398914337158, -2.549875020980835, -2.4913511276245117, -2.4328274726867676, -2.3743035793304443, -2.315779685974121, -2.257256031036377, -2.1987321376800537, -2.1402084827423096, -2.0816845893859863, -2.023160696029663, -1.964637041091919, -1.9061131477355957, -1.847589373588562, -1.7890655994415283, -1.730541706085205, -1.6720179319381714, -1.6134941577911377, -1.554970383644104, -1.4964466094970703, -1.437922716140747, -1.3793989419937134, -1.3208751678466797, -1.2623512744903564, -1.2038275003433228, -1.1453038454055786, -1.086780071258545, -1.0282561779022217, -0.969732403755188, -0.9112086296081543, -0.8526848554611206, -0.7941610217094421, -0.7356371879577637, -0.67711341381073, -0.6185896396636963, -0.5600658059120178, -0.5015419721603394, -0.44301819801330566, -0.3844943940639496, -0.3259705901145935, -0.2674467861652374, -0.20892298221588135, -0.15039917826652527, -0.09187537431716919, -0.03335157036781311, 0.02517223358154297, 0.08369603753089905, 0.14221984148025513, 0.2007436454296112, 0.2592674493789673, 0.31779125332832336, 0.37631505727767944, 0.4348388612270355, 0.4933626651763916, 0.5518864393234253, 0.6104102730751038, 0.6689341068267822, 0.7274578809738159]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 7.0, 6.0, 4.0, 8.0, 8.0, 8.0, 10.0, 12.0, 19.0, 28.0, 22.0, 22.0, 29.0, 23.0, 43.0, 33.0, 21.0, 41.0, 43.0, 52.0, 48.0, 47.0, 49.0, 44.0, 37.0, 48.0, 43.0, 27.0, 29.0, 22.0, 25.0, 23.0, 17.0, 20.0, 21.0, 13.0, 11.0, 12.0, 10.0, 7.0, 3.0, 2.0, 1.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.547916829586029, -0.5298487544059753, -0.5117806196212769, -0.49371251463890076, -0.47564440965652466, -0.45757633447647095, -0.43950822949409485, -0.42144012451171875, -0.40337201952934265, -0.38530391454696655, -0.36723580956459045, -0.34916770458221436, -0.33109962940216064, -0.31303149461746216, -0.29496341943740845, -0.27689531445503235, -0.25882720947265625, -0.24075910449028015, -0.22269099950790405, -0.20462290942668915, -0.18655480444431305, -0.16848669946193695, -0.15041860938072205, -0.13235050439834595, -0.11428239941596985, -0.09621429443359375, -0.07814619690179825, -0.06007809564471245, -0.04200999438762665, -0.02394188940525055, -0.005873791873455048, 0.012194305658340454, 0.030262410640716553, 0.04833051189780235, 0.06639861315488815, 0.08446671068668365, 0.10253481566905975, 0.12060292065143585, 0.13867101073265076, 0.15673911571502686, 0.17480722069740295, 0.19287532567977905, 0.21094343066215515, 0.22901152074337006, 0.24707962572574615, 0.26514774560928345, 0.28321582078933716, 0.30128392577171326, 0.31935203075408936, 0.33742013573646545, 0.35548824071884155, 0.37355634570121765, 0.39162445068359375, 0.40969252586364746, 0.42776063084602356, 0.44582873582839966, 0.46389684081077576, 0.48196494579315186, 0.5000330209732056, 0.518101155757904, 0.5361692309379578, 0.5542373657226562, 0.57230544090271, 0.5903735160827637, 0.6084416508674622]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 10.0, 33.0, 103.0, 357.0, 7790.0, 4178542.0, 7106.0, 227.0, 59.0, 28.0, 20.0, 7.0, 1.0, 2.0, 0.0, 4.0], "bins": [-1.36328125, -1.337799072265625, -1.31231689453125, -1.286834716796875, -1.2613525390625, -1.235870361328125, -1.21038818359375, -1.184906005859375, -1.159423828125, -1.133941650390625, -1.10845947265625, -1.082977294921875, -1.0574951171875, -1.032012939453125, -1.00653076171875, -0.981048583984375, -0.95556640625, -0.930084228515625, -0.90460205078125, -0.879119873046875, -0.8536376953125, -0.828155517578125, -0.80267333984375, -0.777191162109375, -0.751708984375, -0.726226806640625, -0.70074462890625, -0.675262451171875, -0.6497802734375, -0.624298095703125, -0.59881591796875, -0.573333740234375, -0.5478515625, -0.522369384765625, -0.49688720703125, -0.471405029296875, -0.4459228515625, -0.420440673828125, -0.39495849609375, -0.369476318359375, -0.343994140625, -0.318511962890625, -0.29302978515625, -0.267547607421875, -0.2420654296875, -0.216583251953125, -0.19110107421875, -0.165618896484375, -0.14013671875, -0.114654541015625, -0.08917236328125, -0.063690185546875, -0.0382080078125, -0.012725830078125, 0.01275634765625, 0.038238525390625, 0.063720703125, 0.089202880859375, 0.11468505859375, 0.140167236328125, 0.1656494140625, 0.191131591796875, 0.21661376953125, 0.242095947265625, 0.267578125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 6.0, 5.0, 14.0, 16.0, 17.0, 22.0, 34.0, 49.0, 52.0, 65.0, 68.0, 70.0, 85.0, 84.0, 66.0, 88.0, 45.0, 52.0, 50.0, 43.0, 26.0, 14.0, 11.0, 12.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0596923828125, -0.058112144470214844, -0.05653190612792969, -0.05495166778564453, -0.053371429443359375, -0.05179119110107422, -0.05021095275878906, -0.048630714416503906, -0.04705047607421875, -0.045470237731933594, -0.04388999938964844, -0.04230976104736328, -0.040729522705078125, -0.03914928436279297, -0.03756904602050781, -0.035988807678222656, -0.0344085693359375, -0.032828330993652344, -0.031248092651367188, -0.02966785430908203, -0.028087615966796875, -0.02650737762451172, -0.024927139282226562, -0.023346900939941406, -0.02176666259765625, -0.020186424255371094, -0.018606185913085938, -0.01702594757080078, -0.015445709228515625, -0.013865470886230469, -0.012285232543945312, -0.010704994201660156, -0.009124755859375, -0.007544517517089844, -0.0059642791748046875, -0.004384040832519531, -0.002803802490234375, -0.0012235641479492188, 0.0003566741943359375, 0.0019369125366210938, 0.00351715087890625, 0.005097389221191406, 0.0066776275634765625, 0.008257865905761719, 0.009838104248046875, 0.011418342590332031, 0.012998580932617188, 0.014578819274902344, 0.0161590576171875, 0.017739295959472656, 0.019319534301757812, 0.02089977264404297, 0.022480010986328125, 0.02406024932861328, 0.025640487670898438, 0.027220726013183594, 0.02880096435546875, 0.030381202697753906, 0.03196144104003906, 0.03354167938232422, 0.035121917724609375, 0.03670215606689453, 0.03828239440917969, 0.039862632751464844, 0.04144287109375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 9.0, 14.0, 29.0, 46.0, 100.0, 192.0, 465.0, 1102.0, 3859.0, 26734.0, 1225386.0, 2891012.0, 38092.0, 4954.0, 1330.0, 502.0, 227.0, 115.0, 53.0, 20.0, 16.0, 6.0, 5.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.20068359375, -0.19541168212890625, -0.1901397705078125, -0.18486785888671875, -0.179595947265625, -0.17432403564453125, -0.1690521240234375, -0.16378021240234375, -0.15850830078125, -0.15323638916015625, -0.1479644775390625, -0.14269256591796875, -0.137420654296875, -0.13214874267578125, -0.1268768310546875, -0.12160491943359375, -0.1163330078125, -0.11106109619140625, -0.1057891845703125, -0.10051727294921875, -0.095245361328125, -0.08997344970703125, -0.0847015380859375, -0.07942962646484375, -0.07415771484375, -0.06888580322265625, -0.0636138916015625, -0.05834197998046875, -0.053070068359375, -0.04779815673828125, -0.0425262451171875, -0.03725433349609375, -0.031982421875, -0.02671051025390625, -0.0214385986328125, -0.01616668701171875, -0.010894775390625, -0.00562286376953125, -0.0003509521484375, 0.00492095947265625, 0.01019287109375, 0.01546478271484375, 0.0207366943359375, 0.02600860595703125, 0.031280517578125, 0.03655242919921875, 0.0418243408203125, 0.04709625244140625, 0.0523681640625, 0.05764007568359375, 0.0629119873046875, 0.06818389892578125, 0.073455810546875, 0.07872772216796875, 0.0839996337890625, 0.08927154541015625, 0.09454345703125, 0.09981536865234375, 0.1050872802734375, 0.11035919189453125, 0.115631103515625, 0.12090301513671875, 0.1261749267578125, 0.13144683837890625, 0.13671875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 8.0, 2.0, 7.0, 5.0, 9.0, 20.0, 41.0, 61.0, 145.0, 376.0, 1191.0, 1450.0, 424.0, 146.0, 92.0, 34.0, 31.0, 8.0, 6.0, 8.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07098388671875, -0.0687713623046875, -0.066558837890625, -0.0643463134765625, -0.0621337890625, -0.0599212646484375, -0.057708740234375, -0.0554962158203125, -0.05328369140625, -0.0510711669921875, -0.048858642578125, -0.0466461181640625, -0.04443359375, -0.0422210693359375, -0.040008544921875, -0.0377960205078125, -0.03558349609375, -0.0333709716796875, -0.031158447265625, -0.0289459228515625, -0.0267333984375, -0.0245208740234375, -0.022308349609375, -0.0200958251953125, -0.01788330078125, -0.0156707763671875, -0.013458251953125, -0.0112457275390625, -0.009033203125, -0.0068206787109375, -0.004608154296875, -0.0023956298828125, -0.00018310546875, 0.0020294189453125, 0.004241943359375, 0.0064544677734375, 0.0086669921875, 0.0108795166015625, 0.013092041015625, 0.0153045654296875, 0.01751708984375, 0.0197296142578125, 0.021942138671875, 0.0241546630859375, 0.0263671875, 0.0285797119140625, 0.030792236328125, 0.0330047607421875, 0.03521728515625, 0.0374298095703125, 0.039642333984375, 0.0418548583984375, 0.0440673828125, 0.0462799072265625, 0.048492431640625, 0.0507049560546875, 0.05291748046875, 0.0551300048828125, 0.057342529296875, 0.0595550537109375, 0.061767578125, 0.0639801025390625, 0.066192626953125, 0.0684051513671875, 0.07061767578125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 3.0, 17.0, 268.0, 607.0, 102.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18572044372558594, -0.1427316665649414, -0.09974290430545807, -0.05675414204597473, -0.0137653648853302, 0.02922341227531433, 0.07221215963363647, 0.115200936794281, 0.15818971395492554, 0.20117849111557007, 0.2441672533750534, 0.28715601563453674, 0.3301447927951813, 0.3731335699558258, 0.41612231731414795, 0.4591110944747925, 0.502099871635437, 0.5450886487960815, 0.5880774259567261, 0.6310662031173706, 0.6740549802780151, 0.7170437574386597, 0.7600324749946594, 0.803021252155304, 0.8460100293159485, 0.888998806476593, 0.9319875836372375, 0.9749763011932373, 1.0179650783538818, 1.0609538555145264, 1.103942632675171, 1.1469314098358154, 1.18992018699646, 1.2329089641571045, 1.275897741317749, 1.3188865184783936, 1.361875295639038, 1.4048640727996826, 1.4478528499603271, 1.4908416271209717, 1.5338304042816162, 1.5768191814422607, 1.6198079586029053, 1.6627967357635498, 1.7057855129241943, 1.7487742900848389, 1.7917630672454834, 1.834751844406128, 1.877740502357483, 1.9207292795181274, 1.963718056678772, 2.006706714630127, 2.0496954917907715, 2.092684268951416, 2.1356730461120605, 2.178661823272705, 2.2216506004333496, 2.264639377593994, 2.3076281547546387, 2.350616931915283, 2.3936057090759277, 2.4365944862365723, 2.479583263397217, 2.5225720405578613, 2.565560817718506]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 3.0, 12.0, 18.0, 19.0, 16.0, 25.0, 33.0, 38.0, 40.0, 65.0, 49.0, 69.0, 59.0, 68.0, 67.0, 56.0, 57.0, 57.0, 53.0, 54.0, 32.0, 29.0, 20.0, 18.0, 16.0, 6.0, 7.0, 9.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.21653926372528076, -0.2096126228570938, -0.20268598198890686, -0.1957593560218811, -0.18883271515369415, -0.1819060742855072, -0.17497943341732025, -0.1680527925491333, -0.16112616658210754, -0.1541995257139206, -0.14727288484573364, -0.14034625887870789, -0.13341961801052094, -0.12649297714233398, -0.11956633627414703, -0.11263969540596008, -0.10571305453777313, -0.09878641366958618, -0.09185978025197983, -0.08493313938379288, -0.07800650596618652, -0.07107986509799957, -0.06415322422981262, -0.05722658708691597, -0.05029994994401932, -0.043373312801122665, -0.03644667565822601, -0.029520034790039062, -0.02259339764714241, -0.015666760504245758, -0.008740119636058807, -0.0018134824931621552, 0.005113154649734497, 0.012039792723953724, 0.01896643079817295, 0.025893069803714752, 0.032819706946611404, 0.03974634408950806, 0.04667298495769501, 0.05359962210059166, 0.06052625924348831, 0.06745290011167526, 0.07437953352928162, 0.08130617439746857, 0.08823281526565552, 0.09515944868326187, 0.10208608955144882, 0.10901272296905518, 0.11593936383724213, 0.12286600470542908, 0.12979264557361603, 0.13671928644180298, 0.14364591240882874, 0.15057255327701569, 0.15749919414520264, 0.1644258350133896, 0.17135247588157654, 0.1782791167497635, 0.18520575761795044, 0.1921323835849762, 0.19905902445316315, 0.2059856653213501, 0.21291230618953705, 0.219838947057724, 0.22676557302474976]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 9.0, 17.0, 20.0, 27.0, 52.0, 59.0, 121.0, 177.0, 361.0, 813.0, 1840.0, 5013.0, 17110.0, 79323.0, 514153.0, 356635.0, 53451.0, 12459.0, 3965.0, 1462.0, 711.0, 301.0, 172.0, 94.0, 63.0, 43.0, 27.0, 26.0, 15.0, 10.0, 6.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1800537109375, -0.17489242553710938, -0.16973114013671875, -0.16456985473632812, -0.1594085693359375, -0.15424728393554688, -0.14908599853515625, -0.14392471313476562, -0.138763427734375, -0.13360214233398438, -0.12844085693359375, -0.12327957153320312, -0.1181182861328125, -0.11295700073242188, -0.10779571533203125, -0.10263442993164062, -0.09747314453125, -0.09231185913085938, -0.08715057373046875, -0.08198928833007812, -0.0768280029296875, -0.07166671752929688, -0.06650543212890625, -0.061344146728515625, -0.056182861328125, -0.051021575927734375, -0.04586029052734375, -0.040699005126953125, -0.0355377197265625, -0.030376434326171875, -0.02521514892578125, -0.020053863525390625, -0.014892578125, -0.009731292724609375, -0.00457000732421875, 0.000591278076171875, 0.0057525634765625, 0.010913848876953125, 0.01607513427734375, 0.021236419677734375, 0.026397705078125, 0.031558990478515625, 0.03672027587890625, 0.041881561279296875, 0.0470428466796875, 0.052204132080078125, 0.05736541748046875, 0.06252670288085938, 0.06768798828125, 0.07284927368164062, 0.07801055908203125, 0.08317184448242188, 0.0883331298828125, 0.09349441528320312, 0.09865570068359375, 0.10381698608398438, 0.108978271484375, 0.11413955688476562, 0.11930084228515625, 0.12446212768554688, 0.1296234130859375, 0.13478469848632812, 0.13994598388671875, 0.14510726928710938, 0.1502685546875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 3.0, 4.0, 5.0, 10.0, 13.0, 20.0, 19.0, 28.0, 34.0, 45.0, 52.0, 60.0, 73.0, 80.0, 77.0, 64.0, 66.0, 66.0, 57.0, 53.0, 53.0, 34.0, 19.0, 23.0, 18.0, 8.0, 7.0, 5.0, 7.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.051361083984375, -0.049920082092285156, -0.04847908020019531, -0.04703807830810547, -0.045597076416015625, -0.04415607452392578, -0.04271507263183594, -0.041274070739746094, -0.03983306884765625, -0.038392066955566406, -0.03695106506347656, -0.03551006317138672, -0.034069061279296875, -0.03262805938720703, -0.031187057495117188, -0.029746055603027344, -0.0283050537109375, -0.026864051818847656, -0.025423049926757812, -0.02398204803466797, -0.022541046142578125, -0.02110004425048828, -0.019659042358398438, -0.018218040466308594, -0.01677703857421875, -0.015336036682128906, -0.013895034790039062, -0.012454032897949219, -0.011013031005859375, -0.009572029113769531, -0.008131027221679688, -0.006690025329589844, -0.0052490234375, -0.0038080215454101562, -0.0023670196533203125, -0.0009260177612304688, 0.000514984130859375, 0.0019559860229492188, 0.0033969879150390625, 0.004837989807128906, 0.00627899169921875, 0.007719993591308594, 0.009160995483398438, 0.010601997375488281, 0.012042999267578125, 0.013484001159667969, 0.014925003051757812, 0.016366004943847656, 0.0178070068359375, 0.019248008728027344, 0.020689010620117188, 0.02213001251220703, 0.023571014404296875, 0.02501201629638672, 0.026453018188476562, 0.027894020080566406, 0.02933502197265625, 0.030776023864746094, 0.03221702575683594, 0.03365802764892578, 0.035099029541015625, 0.03654003143310547, 0.03798103332519531, 0.039422035217285156, 0.040863037109375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 6.0, 7.0, 7.0, 15.0, 30.0, 32.0, 49.0, 58.0, 85.0, 176.0, 334.0, 683.0, 1783.0, 4713.0, 15611.0, 64506.0, 373388.0, 472397.0, 85698.0, 19307.0, 5886.0, 2076.0, 838.0, 354.0, 181.0, 113.0, 60.0, 40.0, 30.0, 22.0, 14.0, 12.0, 10.0, 8.0, 13.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.125244140625, -0.12156963348388672, -0.11789512634277344, -0.11422061920166016, -0.11054611206054688, -0.1068716049194336, -0.10319709777832031, -0.09952259063720703, -0.09584808349609375, -0.09217357635498047, -0.08849906921386719, -0.0848245620727539, -0.08115005493164062, -0.07747554779052734, -0.07380104064941406, -0.07012653350830078, -0.0664520263671875, -0.06277751922607422, -0.05910301208496094, -0.055428504943847656, -0.051753997802734375, -0.048079490661621094, -0.04440498352050781, -0.04073047637939453, -0.03705596923828125, -0.03338146209716797, -0.029706954956054688, -0.026032447814941406, -0.022357940673828125, -0.018683433532714844, -0.015008926391601562, -0.011334419250488281, -0.007659912109375, -0.003985404968261719, -0.0003108978271484375, 0.0033636093139648438, 0.007038116455078125, 0.010712623596191406, 0.014387130737304688, 0.01806163787841797, 0.02173614501953125, 0.02541065216064453, 0.029085159301757812, 0.032759666442871094, 0.036434173583984375, 0.040108680725097656, 0.04378318786621094, 0.04745769500732422, 0.0511322021484375, 0.05480670928955078, 0.05848121643066406, 0.062155723571777344, 0.06583023071289062, 0.0695047378540039, 0.07317924499511719, 0.07685375213623047, 0.08052825927734375, 0.08420276641845703, 0.08787727355957031, 0.0915517807006836, 0.09522628784179688, 0.09890079498291016, 0.10257530212402344, 0.10624980926513672, 0.10992431640625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 2.0, 3.0, 6.0, 6.0, 9.0, 9.0, 16.0, 18.0, 23.0, 18.0, 28.0, 33.0, 37.0, 40.0, 43.0, 48.0, 53.0, 66.0, 55.0, 65.0, 48.0, 51.0, 41.0, 42.0, 51.0, 30.0, 31.0, 23.0, 25.0, 14.0, 14.0, 14.0, 11.0, 6.0, 5.0, 7.0, 6.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1348876953125, -0.13059616088867188, -0.12630462646484375, -0.12201309204101562, -0.1177215576171875, -0.11343002319335938, -0.10913848876953125, -0.10484695434570312, -0.100555419921875, -0.09626388549804688, -0.09197235107421875, -0.08768081665039062, -0.0833892822265625, -0.07909774780273438, -0.07480621337890625, -0.07051467895507812, -0.06622314453125, -0.061931610107421875, -0.05764007568359375, -0.053348541259765625, -0.0490570068359375, -0.044765472412109375, -0.04047393798828125, -0.036182403564453125, -0.031890869140625, -0.027599334716796875, -0.02330780029296875, -0.019016265869140625, -0.0147247314453125, -0.010433197021484375, -0.00614166259765625, -0.001850128173828125, 0.00244140625, 0.006732940673828125, 0.01102447509765625, 0.015316009521484375, 0.0196075439453125, 0.023899078369140625, 0.02819061279296875, 0.032482147216796875, 0.036773681640625, 0.041065216064453125, 0.04535675048828125, 0.049648284912109375, 0.0539398193359375, 0.058231353759765625, 0.06252288818359375, 0.06681442260742188, 0.07110595703125, 0.07539749145507812, 0.07968902587890625, 0.08398056030273438, 0.0882720947265625, 0.09256362915039062, 0.09685516357421875, 0.10114669799804688, 0.105438232421875, 0.10972976684570312, 0.11402130126953125, 0.11831283569335938, 0.1226043701171875, 0.12689590454101562, 0.13118743896484375, 0.13547897338867188, 0.1397705078125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 3.0, 6.0, 4.0, 6.0, 13.0, 23.0, 38.0, 61.0, 92.0, 136.0, 249.0, 503.0, 1332.0, 6128.0, 130373.0, 888887.0, 16459.0, 2609.0, 762.0, 351.0, 197.0, 125.0, 79.0, 42.0, 33.0, 15.0, 11.0, 9.0, 3.0, 5.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1107177734375, -0.10665321350097656, -0.10258865356445312, -0.09852409362792969, -0.09445953369140625, -0.09039497375488281, -0.08633041381835938, -0.08226585388183594, -0.0782012939453125, -0.07413673400878906, -0.07007217407226562, -0.06600761413574219, -0.06194305419921875, -0.05787849426269531, -0.053813934326171875, -0.04974937438964844, -0.045684814453125, -0.04162025451660156, -0.037555694580078125, -0.03349113464355469, -0.02942657470703125, -0.025362014770507812, -0.021297454833984375, -0.017232894897460938, -0.0131683349609375, -0.009103775024414062, -0.005039215087890625, -0.0009746551513671875, 0.00308990478515625, 0.0071544647216796875, 0.011219024658203125, 0.015283584594726562, 0.01934814453125, 0.023412704467773438, 0.027477264404296875, 0.03154182434082031, 0.03560638427734375, 0.03967094421386719, 0.043735504150390625, 0.04780006408691406, 0.0518646240234375, 0.05592918395996094, 0.059993743896484375, 0.06405830383300781, 0.06812286376953125, 0.07218742370605469, 0.07625198364257812, 0.08031654357910156, 0.084381103515625, 0.08844566345214844, 0.09251022338867188, 0.09657478332519531, 0.10063934326171875, 0.10470390319824219, 0.10876846313476562, 0.11283302307128906, 0.1168975830078125, 0.12096214294433594, 0.12502670288085938, 0.1290912628173828, 0.13315582275390625, 0.1372203826904297, 0.14128494262695312, 0.14534950256347656, 0.1494140625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 4.0, 11.0, 25.0, 58.0, 78.0, 102.0, 147.0, 154.0, 134.0, 127.0, 58.0, 39.0, 21.0, 10.0, 12.0, 5.0, 3.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8835067749023438e-05, -1.8318183720111847e-05, -1.7801299691200256e-05, -1.7284415662288666e-05, -1.6767531633377075e-05, -1.6250647604465485e-05, -1.5733763575553894e-05, -1.5216879546642303e-05, -1.4699995517730713e-05, -1.4183111488819122e-05, -1.3666227459907532e-05, -1.3149343430995941e-05, -1.263245940208435e-05, -1.211557537317276e-05, -1.159869134426117e-05, -1.1081807315349579e-05, -1.0564923286437988e-05, -1.0048039257526398e-05, -9.531155228614807e-06, -9.014271199703217e-06, -8.497387170791626e-06, -7.980503141880035e-06, -7.463619112968445e-06, -6.946735084056854e-06, -6.429851055145264e-06, -5.912967026233673e-06, -5.3960829973220825e-06, -4.879198968410492e-06, -4.362314939498901e-06, -3.845430910587311e-06, -3.3285468816757202e-06, -2.8116628527641296e-06, -2.294778823852539e-06, -1.7778947949409485e-06, -1.261010766029358e-06, -7.441267371177673e-07, -2.2724270820617676e-07, 2.896413207054138e-07, 8.065253496170044e-07, 1.323409378528595e-06, 1.8402934074401855e-06, 2.357177436351776e-06, 2.8740614652633667e-06, 3.3909454941749573e-06, 3.907829523086548e-06, 4.4247135519981384e-06, 4.941597580909729e-06, 5.45848160982132e-06, 5.97536563873291e-06, 6.492249667644501e-06, 7.009133696556091e-06, 7.526017725467682e-06, 8.042901754379272e-06, 8.559785783290863e-06, 9.076669812202454e-06, 9.593553841114044e-06, 1.0110437870025635e-05, 1.0627321898937225e-05, 1.1144205927848816e-05, 1.1661089956760406e-05, 1.2177973985671997e-05, 1.2694858014583588e-05, 1.3211742043495178e-05, 1.3728626072406769e-05, 1.424551010131836e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 5.0, 3.0, 7.0, 9.0, 15.0, 21.0, 41.0, 62.0, 66.0, 68.0, 122.0, 205.0, 340.0, 1168.0, 6491.0, 267039.0, 760007.0, 10154.0, 1601.0, 438.0, 229.0, 130.0, 90.0, 78.0, 44.0, 26.0, 32.0, 28.0, 7.0, 12.0, 8.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11041259765625, -0.10618305206298828, -0.10195350646972656, -0.09772396087646484, -0.09349441528320312, -0.0892648696899414, -0.08503532409667969, -0.08080577850341797, -0.07657623291015625, -0.07234668731689453, -0.06811714172363281, -0.0638875961303711, -0.059658050537109375, -0.055428504943847656, -0.05119895935058594, -0.04696941375732422, -0.0427398681640625, -0.03851032257080078, -0.03428077697753906, -0.030051231384277344, -0.025821685791015625, -0.021592140197753906, -0.017362594604492188, -0.013133049011230469, -0.00890350341796875, -0.004673957824707031, -0.0004444122314453125, 0.0037851333618164062, 0.008014678955078125, 0.012244224548339844, 0.016473770141601562, 0.02070331573486328, 0.024932861328125, 0.02916240692138672, 0.03339195251464844, 0.037621498107910156, 0.041851043701171875, 0.046080589294433594, 0.05031013488769531, 0.05453968048095703, 0.05876922607421875, 0.06299877166748047, 0.06722831726074219, 0.0714578628540039, 0.07568740844726562, 0.07991695404052734, 0.08414649963378906, 0.08837604522705078, 0.0926055908203125, 0.09683513641357422, 0.10106468200683594, 0.10529422760009766, 0.10952377319335938, 0.1137533187866211, 0.11798286437988281, 0.12221240997314453, 0.12644195556640625, 0.13067150115966797, 0.1349010467529297, 0.1391305923461914, 0.14336013793945312, 0.14758968353271484, 0.15181922912597656, 0.15604877471923828, 0.1602783203125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 8.0, 5.0, 9.0, 43.0, 114.0, 253.0, 293.0, 181.0, 64.0, 26.0, 4.0, 5.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.168212890625, -0.16343116760253906, -0.15864944458007812, -0.1538677215576172, -0.14908599853515625, -0.1443042755126953, -0.13952255249023438, -0.13474082946777344, -0.1299591064453125, -0.12517738342285156, -0.12039566040039062, -0.11561393737792969, -0.11083221435546875, -0.10605049133300781, -0.10126876831054688, -0.09648704528808594, -0.091705322265625, -0.08692359924316406, -0.08214187622070312, -0.07736015319824219, -0.07257843017578125, -0.06779670715332031, -0.06301498413085938, -0.05823326110839844, -0.0534515380859375, -0.04866981506347656, -0.043888092041015625, -0.03910636901855469, -0.03432464599609375, -0.029542922973632812, -0.024761199951171875, -0.019979476928710938, -0.01519775390625, -0.010416030883789062, -0.005634307861328125, -0.0008525848388671875, 0.00392913818359375, 0.008710861206054688, 0.013492584228515625, 0.018274307250976562, 0.0230560302734375, 0.027837753295898438, 0.032619476318359375, 0.03740119934082031, 0.04218292236328125, 0.04696464538574219, 0.051746368408203125, 0.05652809143066406, 0.061309814453125, 0.06609153747558594, 0.07087326049804688, 0.07565498352050781, 0.08043670654296875, 0.08521842956542969, 0.09000015258789062, 0.09478187561035156, 0.0995635986328125, 0.10434532165527344, 0.10912704467773438, 0.11390876770019531, 0.11869049072265625, 0.12347221374511719, 0.12825393676757812, 0.13303565979003906, 0.1378173828125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 5.0, 3.0, 8.0, 19.0, 25.0, 65.0, 89.0, 138.0, 163.0, 171.0, 115.0, 80.0, 54.0, 26.0, 17.0, 11.0, 7.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7870216369628906, -0.7613250613212585, -0.7356284856796265, -0.7099319100379944, -0.6842353343963623, -0.658538818359375, -0.6328422427177429, -0.6071456670761108, -0.5814490914344788, -0.5557525157928467, -0.5300559401512146, -0.5043593645095825, -0.4786628186702728, -0.45296624302864075, -0.42726969718933105, -0.401573121547699, -0.3758765459060669, -0.3501799702644348, -0.32448339462280273, -0.29878684878349304, -0.27309027314186096, -0.24739369750022888, -0.221697136759758, -0.1960005760192871, -0.17030400037765503, -0.14460742473602295, -0.11891086399555206, -0.09321429580450058, -0.0675177276134491, -0.04182115197181702, -0.01612459123134613, 0.009571969509124756, 0.035268545150756836, 0.06096511334180832, 0.0866616815328598, 0.11235824972391129, 0.13805481791496277, 0.16375139355659485, 0.18944795429706573, 0.21514451503753662, 0.2408410906791687, 0.2665376663208008, 0.29223424196243286, 0.31793078780174255, 0.34362736344337463, 0.3693239390850067, 0.3950204849243164, 0.4207170605659485, 0.44641363620758057, 0.47211021184921265, 0.4978067874908447, 0.5235033631324768, 0.5491999387741089, 0.5748964548110962, 0.6005930304527283, 0.6262896060943604, 0.6519861817359924, 0.6776827573776245, 0.7033793330192566, 0.7290759086608887, 0.754772424697876, 0.7804690599441528, 0.8061655759811401, 0.8318621516227722, 0.8575587272644043]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 2.0, 4.0, 3.0, 5.0, 4.0, 6.0, 12.0, 15.0, 19.0, 20.0, 18.0, 30.0, 17.0, 39.0, 31.0, 26.0, 32.0, 39.0, 35.0, 41.0, 26.0, 42.0, 56.0, 41.0, 40.0, 44.0, 42.0, 38.0, 39.0, 25.0, 37.0, 20.0, 25.0, 19.0, 23.0, 12.0, 11.0, 10.0, 7.0, 11.0, 12.0, 7.0, 7.0, 4.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.6096944212913513, -0.5926258563995361, -0.575557291507721, -0.5584887862205505, -0.5414202213287354, -0.5243516564369202, -0.507283091545105, -0.4902145266532898, -0.473145991563797, -0.4560774266719818, -0.439008891582489, -0.42194032669067383, -0.40487176179885864, -0.38780322670936584, -0.37073466181755066, -0.35366612672805786, -0.3365975618362427, -0.3195289969444275, -0.3024604618549347, -0.2853918969631195, -0.2683233618736267, -0.2512547969818115, -0.23418623208999634, -0.21711768209934235, -0.20004913210868835, -0.18298058211803436, -0.16591203212738037, -0.14884346723556519, -0.1317749172449112, -0.1147063672542572, -0.09763780981302261, -0.08056925237178802, -0.06350076198577881, -0.04643220826983452, -0.02936365455389023, -0.012295100837945938, 0.004773452877998352, 0.021842002868652344, 0.03891056030988693, 0.05597911775112152, 0.07304766774177551, 0.0901162177324295, 0.10718477517366409, 0.12425333261489868, 0.14132188260555267, 0.15839043259620667, 0.17545899748802185, 0.19252754747867584, 0.20959609746932983, 0.22666464745998383, 0.24373319745063782, 0.260801762342453, 0.2778702974319458, 0.294938862323761, 0.31200742721557617, 0.32907599210739136, 0.34614452719688416, 0.36321309208869934, 0.38028162717819214, 0.3973501920700073, 0.4144187569618225, 0.4314872920513153, 0.4485558569431305, 0.4656243920326233, 0.4826929569244385]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 6.0, 1.0, 8.0, 5.0, 7.0, 8.0, 9.0, 11.0, 23.0, 37.0, 44.0, 68.0, 109.0, 167.0, 287.0, 461.0, 805.0, 1737.0, 3643.0, 9301.0, 31465.0, 193326.0, 3546354.0, 341621.0, 44091.0, 12277.0, 4329.0, 1919.0, 927.0, 490.0, 258.0, 199.0, 98.0, 71.0, 43.0, 32.0, 21.0, 13.0, 6.0, 7.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12066650390625, -0.11754131317138672, -0.11441612243652344, -0.11129093170166016, -0.10816574096679688, -0.1050405502319336, -0.10191535949707031, -0.09879016876220703, -0.09566497802734375, -0.09253978729248047, -0.08941459655761719, -0.0862894058227539, -0.08316421508789062, -0.08003902435302734, -0.07691383361816406, -0.07378864288330078, -0.0706634521484375, -0.06753826141357422, -0.06441307067871094, -0.061287879943847656, -0.058162689208984375, -0.055037498474121094, -0.05191230773925781, -0.04878711700439453, -0.04566192626953125, -0.04253673553466797, -0.03941154479980469, -0.036286354064941406, -0.033161163330078125, -0.030035972595214844, -0.026910781860351562, -0.02378559112548828, -0.020660400390625, -0.01753520965576172, -0.014410018920898438, -0.011284828186035156, -0.008159637451171875, -0.005034446716308594, -0.0019092559814453125, 0.0012159347534179688, 0.00434112548828125, 0.007466316223144531, 0.010591506958007812, 0.013716697692871094, 0.016841888427734375, 0.019967079162597656, 0.023092269897460938, 0.02621746063232422, 0.0293426513671875, 0.03246784210205078, 0.03559303283691406, 0.038718223571777344, 0.041843414306640625, 0.044968605041503906, 0.04809379577636719, 0.05121898651123047, 0.05434417724609375, 0.05746936798095703, 0.06059455871582031, 0.0637197494506836, 0.06684494018554688, 0.06997013092041016, 0.07309532165527344, 0.07622051239013672, 0.079345703125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 3.0, 6.0, 8.0, 8.0, 15.0, 32.0, 31.0, 29.0, 48.0, 47.0, 60.0, 61.0, 64.0, 78.0, 79.0, 87.0, 57.0, 62.0, 50.0, 43.0, 47.0, 20.0, 23.0, 20.0, 6.0, 9.0, 3.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.059814453125, -0.05823373794555664, -0.05665302276611328, -0.05507230758666992, -0.05349159240722656, -0.0519108772277832, -0.050330162048339844, -0.048749446868896484, -0.047168731689453125, -0.045588016510009766, -0.044007301330566406, -0.04242658615112305, -0.04084587097167969, -0.03926515579223633, -0.03768444061279297, -0.03610372543334961, -0.03452301025390625, -0.03294229507446289, -0.03136157989501953, -0.029780864715576172, -0.028200149536132812, -0.026619434356689453, -0.025038719177246094, -0.023458003997802734, -0.021877288818359375, -0.020296573638916016, -0.018715858459472656, -0.017135143280029297, -0.015554428100585938, -0.013973712921142578, -0.012392997741699219, -0.01081228256225586, -0.0092315673828125, -0.007650852203369141, -0.006070137023925781, -0.004489421844482422, -0.0029087066650390625, -0.0013279914855957031, 0.00025272369384765625, 0.0018334388732910156, 0.003414154052734375, 0.004994869232177734, 0.006575584411621094, 0.008156299591064453, 0.009737014770507812, 0.011317729949951172, 0.012898445129394531, 0.01447916030883789, 0.01605987548828125, 0.01764059066772461, 0.01922130584716797, 0.020802021026611328, 0.022382736206054688, 0.023963451385498047, 0.025544166564941406, 0.027124881744384766, 0.028705596923828125, 0.030286312103271484, 0.031867027282714844, 0.0334477424621582, 0.03502845764160156, 0.03660917282104492, 0.03818988800048828, 0.03977060317993164, 0.041351318359375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 6.0, 7.0, 6.0, 16.0, 21.0, 37.0, 71.0, 127.0, 188.0, 384.0, 716.0, 1652.0, 4958.0, 24122.0, 443918.0, 3633772.0, 69567.0, 9764.0, 2643.0, 1102.0, 531.0, 295.0, 152.0, 88.0, 53.0, 43.0, 17.0, 7.0, 10.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1605224609375, -0.15554237365722656, -0.15056228637695312, -0.1455821990966797, -0.14060211181640625, -0.1356220245361328, -0.13064193725585938, -0.12566184997558594, -0.1206817626953125, -0.11570167541503906, -0.11072158813476562, -0.10574150085449219, -0.10076141357421875, -0.09578132629394531, -0.09080123901367188, -0.08582115173339844, -0.080841064453125, -0.07586097717285156, -0.07088088989257812, -0.06590080261230469, -0.06092071533203125, -0.05594062805175781, -0.050960540771484375, -0.04598045349121094, -0.0410003662109375, -0.03602027893066406, -0.031040191650390625, -0.026060104370117188, -0.02108001708984375, -0.016099929809570312, -0.011119842529296875, -0.0061397552490234375, -0.00115966796875, 0.0038204193115234375, 0.008800506591796875, 0.013780593872070312, 0.01876068115234375, 0.023740768432617188, 0.028720855712890625, 0.03370094299316406, 0.0386810302734375, 0.04366111755371094, 0.048641204833984375, 0.05362129211425781, 0.05860137939453125, 0.06358146667480469, 0.06856155395507812, 0.07354164123535156, 0.078521728515625, 0.08350181579589844, 0.08848190307617188, 0.09346199035644531, 0.09844207763671875, 0.10342216491699219, 0.10840225219726562, 0.11338233947753906, 0.1183624267578125, 0.12334251403808594, 0.12832260131835938, 0.1333026885986328, 0.13828277587890625, 0.1432628631591797, 0.14824295043945312, 0.15322303771972656, 0.158203125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 3.0, 9.0, 11.0, 27.0, 46.0, 102.0, 331.0, 1731.0, 1307.0, 290.0, 95.0, 48.0, 28.0, 20.0, 8.0, 6.0, 4.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0936279296875, -0.09116077423095703, -0.08869361877441406, -0.0862264633178711, -0.08375930786132812, -0.08129215240478516, -0.07882499694824219, -0.07635784149169922, -0.07389068603515625, -0.07142353057861328, -0.06895637512207031, -0.06648921966552734, -0.06402206420898438, -0.061554908752441406, -0.05908775329589844, -0.05662059783935547, -0.0541534423828125, -0.05168628692626953, -0.04921913146972656, -0.046751976013183594, -0.044284820556640625, -0.041817665100097656, -0.03935050964355469, -0.03688335418701172, -0.03441619873046875, -0.03194904327392578, -0.029481887817382812, -0.027014732360839844, -0.024547576904296875, -0.022080421447753906, -0.019613265991210938, -0.01714611053466797, -0.014678955078125, -0.012211799621582031, -0.009744644165039062, -0.007277488708496094, -0.004810333251953125, -0.0023431777954101562, 0.0001239776611328125, 0.0025911331176757812, 0.00505828857421875, 0.007525444030761719, 0.009992599487304688, 0.012459754943847656, 0.014926910400390625, 0.017394065856933594, 0.019861221313476562, 0.02232837677001953, 0.0247955322265625, 0.02726268768310547, 0.029729843139648438, 0.032196998596191406, 0.034664154052734375, 0.037131309509277344, 0.03959846496582031, 0.04206562042236328, 0.04453277587890625, 0.04699993133544922, 0.04946708679199219, 0.051934242248535156, 0.054401397705078125, 0.056868553161621094, 0.05933570861816406, 0.06180286407470703, 0.06427001953125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 7.0, 41.0, 269.0, 527.0, 141.0, 16.0, 8.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19364482164382935, -0.1627691090106964, -0.13189339637756348, -0.10101768374443054, -0.07014197111129761, -0.03926625847816467, -0.008390545845031738, 0.022485166788101196, 0.05336087942123413, 0.08423659205436707, 0.1151123046875, 0.14598801732063293, 0.17686372995376587, 0.2077394425868988, 0.23861515522003174, 0.2694908678531647, 0.3003665804862976, 0.33124229311943054, 0.3621180057525635, 0.3929937183856964, 0.42386943101882935, 0.4547451436519623, 0.4856208562850952, 0.5164965391159058, 0.5473722815513611, 0.5782480239868164, 0.609123706817627, 0.6399993896484375, 0.6708751320838928, 0.7017508745193481, 0.7326265573501587, 0.7635022401809692, 0.7943780422210693, 0.8252537250518799, 0.8561294674873352, 0.8870052099227905, 0.9178808927536011, 0.9487565755844116, 0.9796323180198669, 1.0105080604553223, 1.0413837432861328, 1.0722594261169434, 1.103135108947754, 1.134010910987854, 1.1648865938186646, 1.195762276649475, 1.2266380786895752, 1.2575137615203857, 1.2883894443511963, 1.3192651271820068, 1.3501408100128174, 1.3810166120529175, 1.411892294883728, 1.4427679777145386, 1.4736437797546387, 1.5045194625854492, 1.5353951454162598, 1.5662708282470703, 1.5971465110778809, 1.628022313117981, 1.6588979959487915, 1.689773678779602, 1.7206494808197021, 1.7515251636505127, 1.7824008464813232]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 7.0, 2.0, 12.0, 14.0, 17.0, 26.0, 32.0, 34.0, 43.0, 42.0, 49.0, 61.0, 59.0, 74.0, 81.0, 67.0, 63.0, 50.0, 46.0, 53.0, 34.0, 27.0, 34.0, 21.0, 18.0, 5.0, 9.0, 8.0, 4.0, 6.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20667880773544312, -0.20049025118350983, -0.19430169463157654, -0.18811312317848206, -0.18192456662654877, -0.17573601007461548, -0.169547438621521, -0.1633588820695877, -0.15717032551765442, -0.15098176896572113, -0.14479321241378784, -0.13860464096069336, -0.13241608440876007, -0.12622752785682678, -0.1200389638543129, -0.11385039985179901, -0.10766184329986572, -0.10147328674793243, -0.09528472274541855, -0.08909615874290466, -0.08290760219097137, -0.07671904563903809, -0.0705304816365242, -0.06434191763401031, -0.058153361082077026, -0.05196480080485344, -0.04577624052762985, -0.039587680250406265, -0.03339911997318268, -0.02721055969595909, -0.021021999418735504, -0.014833439141511917, -0.00864487886428833, -0.002456318587064743, 0.003732241690158844, 0.009920801967382431, 0.016109362244606018, 0.022297922521829605, 0.028486482799053192, 0.03467504307627678, 0.040863603353500366, 0.04705216363072395, 0.05324072390794754, 0.05942928418517113, 0.06561784446239471, 0.071806401014328, 0.07799496501684189, 0.08418352901935577, 0.09037208557128906, 0.09656064212322235, 0.10274920612573624, 0.10893777012825012, 0.11512632668018341, 0.1213148832321167, 0.12750345468521118, 0.13369201123714447, 0.13988056778907776, 0.14606912434101105, 0.15225768089294434, 0.15844625234603882, 0.1646348088979721, 0.1708233654499054, 0.17701193690299988, 0.18320049345493317, 0.18938905000686646]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 6.0, 8.0, 13.0, 14.0, 23.0, 39.0, 53.0, 99.0, 182.0, 312.0, 680.0, 1608.0, 4727.0, 17973.0, 100660.0, 581158.0, 285694.0, 41387.0, 8984.0, 2796.0, 1013.0, 539.0, 249.0, 125.0, 69.0, 52.0, 33.0, 19.0, 9.0, 9.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1881103515625, -0.18299293518066406, -0.17787551879882812, -0.1727581024169922, -0.16764068603515625, -0.1625232696533203, -0.15740585327148438, -0.15228843688964844, -0.1471710205078125, -0.14205360412597656, -0.13693618774414062, -0.1318187713623047, -0.12670135498046875, -0.12158393859863281, -0.11646652221679688, -0.11134910583496094, -0.106231689453125, -0.10111427307128906, -0.09599685668945312, -0.09087944030761719, -0.08576202392578125, -0.08064460754394531, -0.07552719116210938, -0.07040977478027344, -0.0652923583984375, -0.06017494201660156, -0.055057525634765625, -0.04994010925292969, -0.04482269287109375, -0.03970527648925781, -0.034587860107421875, -0.029470443725585938, -0.02435302734375, -0.019235610961914062, -0.014118194580078125, -0.009000778198242188, -0.00388336181640625, 0.0012340545654296875, 0.006351470947265625, 0.011468887329101562, 0.0165863037109375, 0.021703720092773438, 0.026821136474609375, 0.03193855285644531, 0.03705596923828125, 0.04217338562011719, 0.047290802001953125, 0.05240821838378906, 0.057525634765625, 0.06264305114746094, 0.06776046752929688, 0.07287788391113281, 0.07799530029296875, 0.08311271667480469, 0.08823013305664062, 0.09334754943847656, 0.0984649658203125, 0.10358238220214844, 0.10869979858398438, 0.11381721496582031, 0.11893463134765625, 0.12405204772949219, 0.12916946411132812, 0.13428688049316406, 0.139404296875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 10.0, 5.0, 16.0, 24.0, 27.0, 20.0, 39.0, 45.0, 51.0, 48.0, 70.0, 64.0, 62.0, 71.0, 75.0, 62.0, 59.0, 55.0, 41.0, 40.0, 27.0, 29.0, 17.0, 12.0, 10.0, 5.0, 6.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0511474609375, -0.049681663513183594, -0.04821586608886719, -0.04675006866455078, -0.045284271240234375, -0.04381847381591797, -0.04235267639160156, -0.040886878967285156, -0.03942108154296875, -0.037955284118652344, -0.03648948669433594, -0.03502368927001953, -0.033557891845703125, -0.03209209442138672, -0.030626296997070312, -0.029160499572753906, -0.0276947021484375, -0.026228904724121094, -0.024763107299804688, -0.02329730987548828, -0.021831512451171875, -0.02036571502685547, -0.018899917602539062, -0.017434120178222656, -0.01596832275390625, -0.014502525329589844, -0.013036727905273438, -0.011570930480957031, -0.010105133056640625, -0.008639335632324219, -0.0071735382080078125, -0.005707740783691406, -0.004241943359375, -0.0027761459350585938, -0.0013103485107421875, 0.00015544891357421875, 0.001621246337890625, 0.0030870437622070312, 0.0045528411865234375, 0.006018638610839844, 0.00748443603515625, 0.008950233459472656, 0.010416030883789062, 0.011881828308105469, 0.013347625732421875, 0.014813423156738281, 0.016279220581054688, 0.017745018005371094, 0.0192108154296875, 0.020676612854003906, 0.022142410278320312, 0.02360820770263672, 0.025074005126953125, 0.02653980255126953, 0.028005599975585938, 0.029471397399902344, 0.03093719482421875, 0.032402992248535156, 0.03386878967285156, 0.03533458709716797, 0.036800384521484375, 0.03826618194580078, 0.03973197937011719, 0.041197776794433594, 0.04266357421875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 6.0, 1.0, 2.0, 3.0, 8.0, 9.0, 7.0, 15.0, 18.0, 33.0, 36.0, 46.0, 93.0, 205.0, 368.0, 931.0, 2628.0, 8212.0, 29753.0, 142085.0, 545885.0, 251175.0, 48720.0, 12212.0, 3732.0, 1266.0, 515.0, 240.0, 123.0, 76.0, 43.0, 35.0, 24.0, 13.0, 16.0, 8.0, 5.0, 6.0, 3.0, 2.0, 0.0, 3.0, 2.0, 2.0], "bins": [-0.1456298828125, -0.14204883575439453, -0.13846778869628906, -0.1348867416381836, -0.13130569458007812, -0.12772464752197266, -0.12414360046386719, -0.12056255340576172, -0.11698150634765625, -0.11340045928955078, -0.10981941223144531, -0.10623836517333984, -0.10265731811523438, -0.0990762710571289, -0.09549522399902344, -0.09191417694091797, -0.0883331298828125, -0.08475208282470703, -0.08117103576660156, -0.0775899887084961, -0.07400894165039062, -0.07042789459228516, -0.06684684753417969, -0.06326580047607422, -0.05968475341796875, -0.05610370635986328, -0.05252265930175781, -0.048941612243652344, -0.045360565185546875, -0.041779518127441406, -0.03819847106933594, -0.03461742401123047, -0.031036376953125, -0.02745532989501953, -0.023874282836914062, -0.020293235778808594, -0.016712188720703125, -0.013131141662597656, -0.009550094604492188, -0.005969047546386719, -0.00238800048828125, 0.0011930465698242188, 0.0047740936279296875, 0.008355140686035156, 0.011936187744140625, 0.015517234802246094, 0.019098281860351562, 0.02267932891845703, 0.0262603759765625, 0.02984142303466797, 0.03342247009277344, 0.037003517150878906, 0.040584564208984375, 0.044165611267089844, 0.04774665832519531, 0.05132770538330078, 0.05490875244140625, 0.05848979949951172, 0.06207084655761719, 0.06565189361572266, 0.06923294067382812, 0.0728139877319336, 0.07639503479003906, 0.07997608184814453, 0.08355712890625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 1.0, 1.0, 5.0, 6.0, 3.0, 11.0, 15.0, 13.0, 16.0, 13.0, 23.0, 31.0, 21.0, 31.0, 47.0, 43.0, 36.0, 40.0, 38.0, 50.0, 44.0, 56.0, 42.0, 51.0, 44.0, 32.0, 38.0, 29.0, 36.0, 20.0, 27.0, 25.0, 22.0, 23.0, 14.0, 16.0, 7.0, 10.0, 4.0, 5.0, 3.0, 6.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.137451171875, -0.1336221694946289, -0.1297931671142578, -0.12596416473388672, -0.12213516235351562, -0.11830615997314453, -0.11447715759277344, -0.11064815521240234, -0.10681915283203125, -0.10299015045166016, -0.09916114807128906, -0.09533214569091797, -0.09150314331054688, -0.08767414093017578, -0.08384513854980469, -0.0800161361694336, -0.0761871337890625, -0.0723581314086914, -0.06852912902832031, -0.06470012664794922, -0.060871124267578125, -0.05704212188720703, -0.05321311950683594, -0.049384117126464844, -0.04555511474609375, -0.041726112365722656, -0.03789710998535156, -0.03406810760498047, -0.030239105224609375, -0.02641010284423828, -0.022581100463867188, -0.018752098083496094, -0.014923095703125, -0.011094093322753906, -0.0072650909423828125, -0.0034360885620117188, 0.000392913818359375, 0.004221916198730469, 0.008050918579101562, 0.011879920959472656, 0.01570892333984375, 0.019537925720214844, 0.023366928100585938, 0.02719593048095703, 0.031024932861328125, 0.03485393524169922, 0.03868293762207031, 0.042511940002441406, 0.0463409423828125, 0.050169944763183594, 0.05399894714355469, 0.05782794952392578, 0.061656951904296875, 0.06548595428466797, 0.06931495666503906, 0.07314395904541016, 0.07697296142578125, 0.08080196380615234, 0.08463096618652344, 0.08845996856689453, 0.09228897094726562, 0.09611797332763672, 0.09994697570800781, 0.1037759780883789, 0.10760498046875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 5.0, 4.0, 2.0, 4.0, 8.0, 7.0, 9.0, 12.0, 20.0, 19.0, 27.0, 27.0, 34.0, 44.0, 57.0, 83.0, 108.0, 173.0, 269.0, 515.0, 1304.0, 4194.0, 22569.0, 201435.0, 649966.0, 144789.0, 17060.0, 3426.0, 1096.0, 483.0, 254.0, 134.0, 89.0, 72.0, 48.0, 42.0, 28.0, 19.0, 23.0, 19.0, 13.0, 11.0, 11.0, 7.0, 11.0, 7.0, 10.0, 7.0, 3.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.053497314453125, -0.051795005798339844, -0.05009269714355469, -0.04839038848876953, -0.046688079833984375, -0.04498577117919922, -0.04328346252441406, -0.041581153869628906, -0.03987884521484375, -0.038176536560058594, -0.03647422790527344, -0.03477191925048828, -0.033069610595703125, -0.03136730194091797, -0.029664993286132812, -0.027962684631347656, -0.0262603759765625, -0.024558067321777344, -0.022855758666992188, -0.02115345001220703, -0.019451141357421875, -0.01774883270263672, -0.016046524047851562, -0.014344215393066406, -0.01264190673828125, -0.010939598083496094, -0.009237289428710938, -0.007534980773925781, -0.005832672119140625, -0.004130363464355469, -0.0024280548095703125, -0.0007257461547851562, 0.0009765625, 0.0026788711547851562, 0.0043811798095703125, 0.006083488464355469, 0.007785797119140625, 0.009488105773925781, 0.011190414428710938, 0.012892723083496094, 0.01459503173828125, 0.016297340393066406, 0.017999649047851562, 0.01970195770263672, 0.021404266357421875, 0.02310657501220703, 0.024808883666992188, 0.026511192321777344, 0.0282135009765625, 0.029915809631347656, 0.03161811828613281, 0.03332042694091797, 0.035022735595703125, 0.03672504425048828, 0.03842735290527344, 0.040129661560058594, 0.04183197021484375, 0.043534278869628906, 0.04523658752441406, 0.04693889617919922, 0.048641204833984375, 0.05034351348876953, 0.05204582214355469, 0.053748130798339844, 0.055450439453125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 4.0, 7.0, 8.0, 14.0, 21.0, 24.0, 40.0, 58.0, 63.0, 96.0, 96.0, 103.0, 106.0, 94.0, 67.0, 72.0, 30.0, 28.0, 23.0, 21.0, 11.0, 5.0, 5.0, 1.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.68899917602539e-06, -7.316470146179199e-06, -6.943941116333008e-06, -6.571412086486816e-06, -6.198883056640625e-06, -5.826354026794434e-06, -5.453824996948242e-06, -5.081295967102051e-06, -4.708766937255859e-06, -4.336237907409668e-06, -3.9637088775634766e-06, -3.591179847717285e-06, -3.2186508178710938e-06, -2.8461217880249023e-06, -2.473592758178711e-06, -2.1010637283325195e-06, -1.7285346984863281e-06, -1.3560056686401367e-06, -9.834766387939453e-07, -6.109476089477539e-07, -2.384185791015625e-07, 1.341104507446289e-07, 5.066394805908203e-07, 8.791685104370117e-07, 1.2516975402832031e-06, 1.6242265701293945e-06, 1.996755599975586e-06, 2.3692846298217773e-06, 2.7418136596679688e-06, 3.11434268951416e-06, 3.4868717193603516e-06, 3.859400749206543e-06, 4.231929779052734e-06, 4.604458808898926e-06, 4.976987838745117e-06, 5.349516868591309e-06, 5.7220458984375e-06, 6.094574928283691e-06, 6.467103958129883e-06, 6.839632987976074e-06, 7.212162017822266e-06, 7.584691047668457e-06, 7.957220077514648e-06, 8.32974910736084e-06, 8.702278137207031e-06, 9.074807167053223e-06, 9.447336196899414e-06, 9.819865226745605e-06, 1.0192394256591797e-05, 1.0564923286437988e-05, 1.093745231628418e-05, 1.1309981346130371e-05, 1.1682510375976562e-05, 1.2055039405822754e-05, 1.2427568435668945e-05, 1.2800097465515137e-05, 1.3172626495361328e-05, 1.354515552520752e-05, 1.3917684555053711e-05, 1.4290213584899902e-05, 1.4662742614746094e-05, 1.5035271644592285e-05, 1.5407800674438477e-05, 1.5780329704284668e-05, 1.615285873413086e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 7.0, 3.0, 7.0, 14.0, 13.0, 25.0, 37.0, 53.0, 108.0, 144.0, 358.0, 865.0, 2914.0, 18325.0, 235882.0, 694955.0, 83489.0, 8322.0, 1932.0, 577.0, 224.0, 110.0, 75.0, 43.0, 31.0, 15.0, 10.0, 12.0, 3.0, 5.0, 4.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037811279296875, -0.035852909088134766, -0.03389453887939453, -0.0319361686706543, -0.029977798461914062, -0.028019428253173828, -0.026061058044433594, -0.02410268783569336, -0.022144317626953125, -0.02018594741821289, -0.018227577209472656, -0.016269207000732422, -0.014310836791992188, -0.012352466583251953, -0.010394096374511719, -0.008435726165771484, -0.00647735595703125, -0.004518985748291016, -0.0025606155395507812, -0.0006022453308105469, 0.0013561248779296875, 0.003314495086669922, 0.005272865295410156, 0.007231235504150391, 0.009189605712890625, 0.01114797592163086, 0.013106346130371094, 0.015064716339111328, 0.017023086547851562, 0.018981456756591797, 0.02093982696533203, 0.022898197174072266, 0.0248565673828125, 0.026814937591552734, 0.02877330780029297, 0.030731678009033203, 0.03269004821777344, 0.03464841842651367, 0.036606788635253906, 0.03856515884399414, 0.040523529052734375, 0.04248189926147461, 0.044440269470214844, 0.04639863967895508, 0.04835700988769531, 0.05031538009643555, 0.05227375030517578, 0.054232120513916016, 0.05619049072265625, 0.058148860931396484, 0.06010723114013672, 0.06206560134887695, 0.06402397155761719, 0.06598234176635742, 0.06794071197509766, 0.06989908218383789, 0.07185745239257812, 0.07381582260131836, 0.0757741928100586, 0.07773256301879883, 0.07969093322753906, 0.0816493034362793, 0.08360767364501953, 0.08556604385375977, 0.0875244140625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 4.0, 7.0, 5.0, 10.0, 13.0, 22.0, 29.0, 38.0, 62.0, 58.0, 70.0, 87.0, 112.0, 107.0, 75.0, 91.0, 57.0, 41.0, 27.0, 23.0, 17.0, 17.0, 5.0, 9.0, 9.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04644775390625, -0.04481649398803711, -0.04318523406982422, -0.04155397415161133, -0.03992271423339844, -0.03829145431518555, -0.036660194396972656, -0.035028934478759766, -0.033397674560546875, -0.031766414642333984, -0.030135154724121094, -0.028503894805908203, -0.026872634887695312, -0.025241374969482422, -0.02361011505126953, -0.02197885513305664, -0.02034759521484375, -0.01871633529663086, -0.01708507537841797, -0.015453815460205078, -0.013822555541992188, -0.012191295623779297, -0.010560035705566406, -0.008928775787353516, -0.007297515869140625, -0.005666255950927734, -0.004034996032714844, -0.002403736114501953, -0.0007724761962890625, 0.0008587837219238281, 0.0024900436401367188, 0.004121303558349609, 0.0057525634765625, 0.007383823394775391, 0.009015083312988281, 0.010646343231201172, 0.012277603149414062, 0.013908863067626953, 0.015540122985839844, 0.017171382904052734, 0.018802642822265625, 0.020433902740478516, 0.022065162658691406, 0.023696422576904297, 0.025327682495117188, 0.026958942413330078, 0.02859020233154297, 0.03022146224975586, 0.03185272216796875, 0.03348398208618164, 0.03511524200439453, 0.03674650192260742, 0.03837776184082031, 0.0400090217590332, 0.041640281677246094, 0.043271541595458984, 0.044902801513671875, 0.046534061431884766, 0.048165321350097656, 0.04979658126831055, 0.05142784118652344, 0.05305910110473633, 0.05469036102294922, 0.05632162094116211, 0.057952880859375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 19.0, 39.0, 86.0, 177.0, 247.0, 206.0, 142.0, 56.0, 14.0, 7.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4605227708816528, -1.4209555387496948, -1.3813883066177368, -1.3418210744857788, -1.3022538423538208, -1.2626866102218628, -1.2231193780899048, -1.1835520267486572, -1.1439847946166992, -1.1044175624847412, -1.0648503303527832, -1.0252830982208252, -0.9857158660888672, -0.9461486339569092, -0.9065813422203064, -0.8670141100883484, -0.8274469375610352, -0.7878797054290771, -0.7483124732971191, -0.7087452411651611, -0.6691780090332031, -0.6296107769012451, -0.5900434851646423, -0.5504762530326843, -0.5109090209007263, -0.4713417887687683, -0.4317745566368103, -0.3922072947025299, -0.3526400625705719, -0.3130728304386139, -0.2735055685043335, -0.2339383363723755, -0.19437110424041748, -0.15480387210845947, -0.11523662507534027, -0.07566938549280167, -0.03610214591026306, 0.0034650862216949463, 0.04303233325481415, 0.08259958028793335, 0.12216681241989136, 0.16173404455184937, 0.20130129158496857, 0.24086853861808777, 0.2804357707500458, 0.3200030028820038, 0.3595702648162842, 0.3991374969482422, 0.4387047290802002, 0.4782719612121582, 0.5178391933441162, 0.5574064254760742, 0.5969736576080322, 0.6365408897399902, 0.676108181476593, 0.715675413608551, 0.755242645740509, 0.794809877872467, 0.834377110004425, 0.8739443421363831, 0.9135116338729858, 0.9530788660049438, 0.9926460981369019, 1.0322133302688599, 1.0717805624008179]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 4.0, 3.0, 5.0, 5.0, 8.0, 6.0, 13.0, 12.0, 12.0, 19.0, 23.0, 25.0, 30.0, 31.0, 24.0, 30.0, 39.0, 34.0, 54.0, 46.0, 47.0, 41.0, 30.0, 42.0, 44.0, 42.0, 27.0, 27.0, 28.0, 30.0, 26.0, 25.0, 31.0, 19.0, 12.0, 17.0, 18.0, 14.0, 18.0, 2.0, 9.0, 5.0, 2.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.5184855461120605, -0.5015771389007568, -0.4846687614917755, -0.4677603840827942, -0.4508519768714905, -0.43394356966018677, -0.41703519225120544, -0.4001268148422241, -0.3832184076309204, -0.3663100004196167, -0.3494016230106354, -0.33249324560165405, -0.31558483839035034, -0.29867643117904663, -0.2817680537700653, -0.264859676361084, -0.24795126914978027, -0.23104287683963776, -0.21413448452949524, -0.19722609221935272, -0.1803176999092102, -0.1634093075990677, -0.14650091528892517, -0.12959252297878265, -0.11268413066864014, -0.09577573835849762, -0.0788673460483551, -0.061958953738212585, -0.04505056142807007, -0.02814216911792755, -0.011233776807785034, 0.005674615502357483, 0.0225830078125, 0.03949140012264252, 0.056399792432785034, 0.07330818474292755, 0.09021657705307007, 0.10712496936321259, 0.1240333616733551, 0.14094175398349762, 0.15785014629364014, 0.17475853860378265, 0.19166693091392517, 0.2085753232240677, 0.2254837155342102, 0.24239210784435272, 0.25930050015449524, 0.27620887756347656, 0.2931172847747803, 0.310025691986084, 0.3269340693950653, 0.34384244680404663, 0.36075085401535034, 0.37765926122665405, 0.3945676386356354, 0.4114760160446167, 0.4283844232559204, 0.4452928304672241, 0.46220120787620544, 0.47910958528518677, 0.4960179924964905, 0.5129263997077942, 0.5298347473144531, 0.5467431545257568, 0.5636515617370605]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 3.0, 7.0, 4.0, 9.0, 19.0, 17.0, 23.0, 38.0, 54.0, 89.0, 141.0, 225.0, 390.0, 697.0, 1259.0, 2725.0, 6587.0, 21285.0, 111286.0, 3640697.0, 349812.0, 41098.0, 10461.0, 3757.0, 1614.0, 835.0, 467.0, 264.0, 155.0, 93.0, 57.0, 40.0, 29.0, 18.0, 10.0, 6.0, 8.0, 5.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.169921875, -0.1658487319946289, -0.1617755889892578, -0.15770244598388672, -0.15362930297851562, -0.14955615997314453, -0.14548301696777344, -0.14140987396240234, -0.13733673095703125, -0.13326358795166016, -0.12919044494628906, -0.12511730194091797, -0.12104415893554688, -0.11697101593017578, -0.11289787292480469, -0.1088247299194336, -0.1047515869140625, -0.1006784439086914, -0.09660530090332031, -0.09253215789794922, -0.08845901489257812, -0.08438587188720703, -0.08031272888183594, -0.07623958587646484, -0.07216644287109375, -0.06809329986572266, -0.06402015686035156, -0.05994701385498047, -0.055873870849609375, -0.05180072784423828, -0.04772758483886719, -0.043654441833496094, -0.039581298828125, -0.035508155822753906, -0.03143501281738281, -0.02736186981201172, -0.023288726806640625, -0.01921558380126953, -0.015142440795898438, -0.011069297790527344, -0.00699615478515625, -0.0029230117797851562, 0.0011501312255859375, 0.005223274230957031, 0.009296417236328125, 0.013369560241699219, 0.017442703247070312, 0.021515846252441406, 0.0255889892578125, 0.029662132263183594, 0.03373527526855469, 0.03780841827392578, 0.041881561279296875, 0.04595470428466797, 0.05002784729003906, 0.054100990295410156, 0.05817413330078125, 0.062247276306152344, 0.06632041931152344, 0.07039356231689453, 0.07446670532226562, 0.07853984832763672, 0.08261299133300781, 0.0866861343383789, 0.09075927734375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 9.0, 10.0, 8.0, 19.0, 19.0, 19.0, 24.0, 26.0, 31.0, 35.0, 47.0, 49.0, 36.0, 68.0, 63.0, 57.0, 72.0, 62.0, 58.0, 50.0, 37.0, 36.0, 31.0, 26.0, 32.0, 20.0, 11.0, 18.0, 10.0, 9.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0439453125, -0.0425877571105957, -0.041230201721191406, -0.03987264633178711, -0.03851509094238281, -0.037157535552978516, -0.03579998016357422, -0.03444242477416992, -0.033084869384765625, -0.03172731399536133, -0.03036975860595703, -0.029012203216552734, -0.027654647827148438, -0.02629709243774414, -0.024939537048339844, -0.023581981658935547, -0.02222442626953125, -0.020866870880126953, -0.019509315490722656, -0.01815176010131836, -0.016794204711914062, -0.015436649322509766, -0.014079093933105469, -0.012721538543701172, -0.011363983154296875, -0.010006427764892578, -0.008648872375488281, -0.007291316986083984, -0.0059337615966796875, -0.004576206207275391, -0.0032186508178710938, -0.0018610954284667969, -0.0005035400390625, 0.0008540153503417969, 0.0022115707397460938, 0.0035691261291503906, 0.0049266815185546875, 0.006284236907958984, 0.007641792297363281, 0.008999347686767578, 0.010356903076171875, 0.011714458465576172, 0.013072013854980469, 0.014429569244384766, 0.015787124633789062, 0.01714468002319336, 0.018502235412597656, 0.019859790802001953, 0.02121734619140625, 0.022574901580810547, 0.023932456970214844, 0.02529001235961914, 0.026647567749023438, 0.028005123138427734, 0.02936267852783203, 0.030720233917236328, 0.032077789306640625, 0.03343534469604492, 0.03479290008544922, 0.036150455474853516, 0.03750801086425781, 0.03886556625366211, 0.040223121643066406, 0.0415806770324707, 0.042938232421875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 3.0, 2.0, 5.0, 7.0, 9.0, 11.0, 15.0, 21.0, 34.0, 43.0, 59.0, 80.0, 113.0, 150.0, 280.0, 538.0, 1040.0, 2399.0, 6221.0, 20939.0, 109562.0, 3380573.0, 598367.0, 53082.0, 12702.0, 4274.0, 1678.0, 832.0, 451.0, 266.0, 165.0, 99.0, 62.0, 51.0, 37.0, 34.0, 21.0, 13.0, 15.0, 12.0, 8.0, 3.0, 5.0, 1.0, 3.0, 5.0, 1.0, 0.0, 1.0], "bins": [-0.1416015625, -0.1377544403076172, -0.13390731811523438, -0.13006019592285156, -0.12621307373046875, -0.12236595153808594, -0.11851882934570312, -0.11467170715332031, -0.1108245849609375, -0.10697746276855469, -0.10313034057617188, -0.09928321838378906, -0.09543609619140625, -0.09158897399902344, -0.08774185180664062, -0.08389472961425781, -0.080047607421875, -0.07620048522949219, -0.07235336303710938, -0.06850624084472656, -0.06465911865234375, -0.06081199645996094, -0.056964874267578125, -0.05311775207519531, -0.0492706298828125, -0.04542350769042969, -0.041576385498046875, -0.03772926330566406, -0.03388214111328125, -0.030035018920898438, -0.026187896728515625, -0.022340774536132812, -0.01849365234375, -0.014646530151367188, -0.010799407958984375, -0.0069522857666015625, -0.00310516357421875, 0.0007419586181640625, 0.004589080810546875, 0.008436203002929688, 0.0122833251953125, 0.016130447387695312, 0.019977569580078125, 0.023824691772460938, 0.02767181396484375, 0.03151893615722656, 0.035366058349609375, 0.03921318054199219, 0.043060302734375, 0.04690742492675781, 0.050754547119140625, 0.05460166931152344, 0.05844879150390625, 0.06229591369628906, 0.06614303588867188, 0.06999015808105469, 0.0738372802734375, 0.07768440246582031, 0.08153152465820312, 0.08537864685058594, 0.08922576904296875, 0.09307289123535156, 0.09692001342773438, 0.10076713562011719, 0.1046142578125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 6.0, 7.0, 12.0, 12.0, 22.0, 42.0, 72.0, 170.0, 454.0, 2258.0, 611.0, 210.0, 71.0, 51.0, 25.0, 18.0, 12.0, 8.0, 9.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.035369873046875, -0.03324174880981445, -0.031113624572753906, -0.02898550033569336, -0.026857376098632812, -0.024729251861572266, -0.02260112762451172, -0.020473003387451172, -0.018344879150390625, -0.016216754913330078, -0.014088630676269531, -0.011960506439208984, -0.009832382202148438, -0.007704257965087891, -0.005576133728027344, -0.003448009490966797, -0.00131988525390625, 0.0008082389831542969, 0.0029363632202148438, 0.005064487457275391, 0.0071926116943359375, 0.009320735931396484, 0.011448860168457031, 0.013576984405517578, 0.015705108642578125, 0.017833232879638672, 0.01996135711669922, 0.022089481353759766, 0.024217605590820312, 0.02634572982788086, 0.028473854064941406, 0.030601978302001953, 0.0327301025390625, 0.03485822677612305, 0.036986351013183594, 0.03911447525024414, 0.04124259948730469, 0.043370723724365234, 0.04549884796142578, 0.04762697219848633, 0.049755096435546875, 0.05188322067260742, 0.05401134490966797, 0.056139469146728516, 0.05826759338378906, 0.06039571762084961, 0.06252384185791016, 0.0646519660949707, 0.06678009033203125, 0.0689082145690918, 0.07103633880615234, 0.07316446304321289, 0.07529258728027344, 0.07742071151733398, 0.07954883575439453, 0.08167695999145508, 0.08380508422851562, 0.08593320846557617, 0.08806133270263672, 0.09018945693969727, 0.09231758117675781, 0.09444570541381836, 0.0965738296508789, 0.09870195388793945, 0.100830078125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 12.0, 13.0, 55.0, 185.0, 299.0, 278.0, 105.0, 32.0, 12.0, 6.0, 5.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.30576616525650024, -0.28858163952827454, -0.27139711380004883, -0.25421255826950073, -0.23702803254127502, -0.21984350681304932, -0.2026589810848236, -0.1854744553565979, -0.168289914727211, -0.1511053889989853, -0.1339208483695984, -0.11673632264137268, -0.09955178946256638, -0.08236725628376007, -0.06518273055553436, -0.04799819737672806, -0.030813664197921753, -0.013629132881760597, 0.0035553984344005585, 0.020739927887916565, 0.03792446106672287, 0.055108994245529175, 0.07229351997375488, 0.08947805315256119, 0.10666258633136749, 0.1238471195101738, 0.1410316526889801, 0.1582161784172058, 0.17540070414543152, 0.19258524477481842, 0.20976977050304413, 0.22695431113243103, 0.24413883686065674, 0.26132336258888245, 0.27850788831710815, 0.29569244384765625, 0.31287696957588196, 0.33006149530410767, 0.3472460210323334, 0.3644305467605591, 0.3816151022911072, 0.3987996280193329, 0.4159841537475586, 0.4331687092781067, 0.4503532350063324, 0.4675377607345581, 0.4847222864627838, 0.5019068121910095, 0.5190913677215576, 0.5362759232521057, 0.553460419178009, 0.5706449747085571, 0.5878294706344604, 0.6050140261650085, 0.6221985816955566, 0.63938307762146, 0.6565675735473633, 0.6737521290779114, 0.6909366250038147, 0.7081211805343628, 0.7253056764602661, 0.7424902319908142, 0.7596747875213623, 0.7768592834472656, 0.7940438389778137]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 12.0, 14.0, 12.0, 14.0, 31.0, 32.0, 48.0, 43.0, 61.0, 77.0, 71.0, 75.0, 74.0, 64.0, 76.0, 67.0, 45.0, 45.0, 34.0, 23.0, 21.0, 15.0, 11.0, 9.0, 6.0, 5.0, 3.0, 5.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14164412021636963, -0.13525022566318512, -0.1288563311100006, -0.1224624440073967, -0.11606855690479279, -0.10967466235160828, -0.10328076779842377, -0.09688687324523926, -0.09049298614263535, -0.08409909158945084, -0.07770520448684692, -0.07131130993366241, -0.0649174153804779, -0.05852352827787399, -0.052129633724689484, -0.04573574289679527, -0.03934185206890106, -0.03294796124100685, -0.02655406855046749, -0.02016017585992813, -0.01376628503203392, -0.0073723942041397095, -0.0009784996509552002, 0.005415391176939011, 0.011809282004833221, 0.018203172832727432, 0.024597065523266792, 0.030990958213806152, 0.03738484904170036, 0.043778739869594574, 0.05017263442277908, 0.056566525250673294, 0.0629604160785675, 0.06935431063175201, 0.07574819773435593, 0.08214209228754044, 0.08853597939014435, 0.09492987394332886, 0.10132376849651337, 0.10771766304969788, 0.11411155015230179, 0.1205054447054863, 0.1268993318080902, 0.13329322636127472, 0.13968712091445923, 0.14608100056648254, 0.15247491002082825, 0.15886878967285156, 0.16526268422603607, 0.17165657877922058, 0.1780504733324051, 0.1844443678855896, 0.19083824753761292, 0.19723214209079742, 0.20362603664398193, 0.21001993119716644, 0.21641382575035095, 0.22280772030353546, 0.22920161485671997, 0.2355954945087433, 0.2419893890619278, 0.2483832836151123, 0.254777193069458, 0.2611710727214813, 0.26756495237350464]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 4.0, 5.0, 1.0, 3.0, 5.0, 9.0, 14.0, 21.0, 27.0, 21.0, 42.0, 64.0, 97.0, 146.0, 223.0, 324.0, 627.0, 1051.0, 1698.0, 3394.0, 6955.0, 14253.0, 32782.0, 79218.0, 192550.0, 328268.0, 222510.0, 93354.0, 37824.0, 16584.0, 7739.0, 3851.0, 2023.0, 1155.0, 598.0, 391.0, 229.0, 151.0, 118.0, 53.0, 54.0, 30.0, 18.0, 18.0, 17.0, 13.0, 8.0, 8.0, 6.0, 3.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08447265625, -0.08188056945800781, -0.07928848266601562, -0.07669639587402344, -0.07410430908203125, -0.07151222229003906, -0.06892013549804688, -0.06632804870605469, -0.0637359619140625, -0.06114387512207031, -0.058551788330078125, -0.05595970153808594, -0.05336761474609375, -0.05077552795410156, -0.048183441162109375, -0.04559135437011719, -0.042999267578125, -0.04040718078613281, -0.037815093994140625, -0.03522300720214844, -0.03263092041015625, -0.030038833618164062, -0.027446746826171875, -0.024854660034179688, -0.0222625732421875, -0.019670486450195312, -0.017078399658203125, -0.014486312866210938, -0.01189422607421875, -0.009302139282226562, -0.006710052490234375, -0.0041179656982421875, -0.00152587890625, 0.0010662078857421875, 0.003658294677734375, 0.0062503814697265625, 0.00884246826171875, 0.011434555053710938, 0.014026641845703125, 0.016618728637695312, 0.0192108154296875, 0.021802902221679688, 0.024394989013671875, 0.026987075805664062, 0.02957916259765625, 0.03217124938964844, 0.034763336181640625, 0.03735542297363281, 0.039947509765625, 0.04253959655761719, 0.045131683349609375, 0.04772377014160156, 0.05031585693359375, 0.05290794372558594, 0.055500030517578125, 0.05809211730957031, 0.0606842041015625, 0.06327629089355469, 0.06586837768554688, 0.06846046447753906, 0.07105255126953125, 0.07364463806152344, 0.07623672485351562, 0.07882881164550781, 0.0814208984375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 6.0, 4.0, 10.0, 14.0, 19.0, 15.0, 20.0, 37.0, 23.0, 23.0, 37.0, 36.0, 51.0, 48.0, 58.0, 53.0, 62.0, 64.0, 57.0, 53.0, 52.0, 46.0, 37.0, 27.0, 32.0, 29.0, 18.0, 20.0, 11.0, 14.0, 6.0, 7.0, 9.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039215087890625, -0.0378880500793457, -0.036561012268066406, -0.03523397445678711, -0.03390693664550781, -0.032579898834228516, -0.03125286102294922, -0.029925823211669922, -0.028598785400390625, -0.027271747589111328, -0.02594470977783203, -0.024617671966552734, -0.023290634155273438, -0.02196359634399414, -0.020636558532714844, -0.019309520721435547, -0.01798248291015625, -0.016655445098876953, -0.015328407287597656, -0.01400136947631836, -0.012674331665039062, -0.011347293853759766, -0.010020256042480469, -0.008693218231201172, -0.007366180419921875, -0.006039142608642578, -0.004712104797363281, -0.0033850669860839844, -0.0020580291748046875, -0.0007309913635253906, 0.0005960464477539062, 0.0019230842590332031, 0.0032501220703125, 0.004577159881591797, 0.005904197692871094, 0.007231235504150391, 0.008558273315429688, 0.009885311126708984, 0.011212348937988281, 0.012539386749267578, 0.013866424560546875, 0.015193462371826172, 0.01652050018310547, 0.017847537994384766, 0.019174575805664062, 0.02050161361694336, 0.021828651428222656, 0.023155689239501953, 0.02448272705078125, 0.025809764862060547, 0.027136802673339844, 0.02846384048461914, 0.029790878295898438, 0.031117916107177734, 0.03244495391845703, 0.03377199172973633, 0.035099029541015625, 0.03642606735229492, 0.03775310516357422, 0.039080142974853516, 0.04040718078613281, 0.04173421859741211, 0.043061256408691406, 0.0443882942199707, 0.04571533203125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 9.0, 6.0, 6.0, 9.0, 10.0, 19.0, 19.0, 22.0, 29.0, 45.0, 52.0, 77.0, 103.0, 142.0, 208.0, 311.0, 552.0, 943.0, 1711.0, 3428.0, 7146.0, 16532.0, 40406.0, 104731.0, 253904.0, 331815.0, 171669.0, 66313.0, 26231.0, 11225.0, 5067.0, 2565.0, 1249.0, 733.0, 379.0, 280.0, 180.0, 118.0, 87.0, 70.0, 38.0, 23.0, 24.0, 21.0, 10.0, 9.0, 8.0, 10.0, 6.0, 2.0, 4.0, 0.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.06866455078125, -0.0664682388305664, -0.06427192687988281, -0.06207561492919922, -0.059879302978515625, -0.05768299102783203, -0.05548667907714844, -0.053290367126464844, -0.05109405517578125, -0.048897743225097656, -0.04670143127441406, -0.04450511932373047, -0.042308807373046875, -0.04011249542236328, -0.03791618347167969, -0.035719871520996094, -0.0335235595703125, -0.031327247619628906, -0.029130935668945312, -0.02693462371826172, -0.024738311767578125, -0.02254199981689453, -0.020345687866210938, -0.018149375915527344, -0.01595306396484375, -0.013756752014160156, -0.011560440063476562, -0.009364128112792969, -0.007167816162109375, -0.004971504211425781, -0.0027751922607421875, -0.0005788803100585938, 0.001617431640625, 0.0038137435913085938, 0.0060100555419921875, 0.008206367492675781, 0.010402679443359375, 0.012598991394042969, 0.014795303344726562, 0.016991615295410156, 0.01918792724609375, 0.021384239196777344, 0.023580551147460938, 0.02577686309814453, 0.027973175048828125, 0.03016948699951172, 0.03236579895019531, 0.034562110900878906, 0.0367584228515625, 0.038954734802246094, 0.04115104675292969, 0.04334735870361328, 0.045543670654296875, 0.04773998260498047, 0.04993629455566406, 0.052132606506347656, 0.05432891845703125, 0.056525230407714844, 0.05872154235839844, 0.06091785430908203, 0.06311416625976562, 0.06531047821044922, 0.06750679016113281, 0.0697031021118164, 0.0718994140625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 5.0, 3.0, 3.0, 7.0, 3.0, 9.0, 11.0, 11.0, 11.0, 19.0, 27.0, 24.0, 34.0, 25.0, 20.0, 30.0, 31.0, 30.0, 41.0, 43.0, 29.0, 33.0, 35.0, 48.0, 47.0, 45.0, 39.0, 39.0, 31.0, 33.0, 32.0, 28.0, 34.0, 20.0, 20.0, 17.0, 15.0, 12.0, 19.0, 8.0, 8.0, 5.0, 7.0, 3.0, 9.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.12408447265625, -0.1199960708618164, -0.11590766906738281, -0.11181926727294922, -0.10773086547851562, -0.10364246368408203, -0.09955406188964844, -0.09546566009521484, -0.09137725830078125, -0.08728885650634766, -0.08320045471191406, -0.07911205291748047, -0.07502365112304688, -0.07093524932861328, -0.06684684753417969, -0.0627584457397461, -0.0586700439453125, -0.054581642150878906, -0.05049324035644531, -0.04640483856201172, -0.042316436767578125, -0.03822803497314453, -0.03413963317871094, -0.030051231384277344, -0.02596282958984375, -0.021874427795410156, -0.017786026000976562, -0.013697624206542969, -0.009609222412109375, -0.005520820617675781, -0.0014324188232421875, 0.0026559829711914062, 0.006744384765625, 0.010832786560058594, 0.014921188354492188, 0.01900959014892578, 0.023097991943359375, 0.02718639373779297, 0.03127479553222656, 0.035363197326660156, 0.03945159912109375, 0.043540000915527344, 0.04762840270996094, 0.05171680450439453, 0.055805206298828125, 0.05989360809326172, 0.06398200988769531, 0.0680704116821289, 0.0721588134765625, 0.0762472152709961, 0.08033561706542969, 0.08442401885986328, 0.08851242065429688, 0.09260082244873047, 0.09668922424316406, 0.10077762603759766, 0.10486602783203125, 0.10895442962646484, 0.11304283142089844, 0.11713123321533203, 0.12121963500976562, 0.12530803680419922, 0.1293964385986328, 0.1334848403930664, 0.1375732421875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 7.0, 0.0, 4.0, 13.0, 8.0, 21.0, 24.0, 44.0, 71.0, 166.0, 319.0, 632.0, 1594.0, 5893.0, 36629.0, 472527.0, 483758.0, 38123.0, 5751.0, 1634.0, 662.0, 309.0, 167.0, 86.0, 48.0, 37.0, 16.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.064208984375, -0.06183147430419922, -0.05945396423339844, -0.057076454162597656, -0.054698944091796875, -0.052321434020996094, -0.04994392395019531, -0.04756641387939453, -0.04518890380859375, -0.04281139373779297, -0.04043388366699219, -0.038056373596191406, -0.035678863525390625, -0.033301353454589844, -0.030923843383789062, -0.02854633331298828, -0.0261688232421875, -0.02379131317138672, -0.021413803100585938, -0.019036293029785156, -0.016658782958984375, -0.014281272888183594, -0.011903762817382812, -0.009526252746582031, -0.00714874267578125, -0.004771232604980469, -0.0023937225341796875, -1.621246337890625e-05, 0.002361297607421875, 0.004738807678222656, 0.0071163177490234375, 0.009493827819824219, 0.011871337890625, 0.014248847961425781, 0.016626358032226562, 0.019003868103027344, 0.021381378173828125, 0.023758888244628906, 0.026136398315429688, 0.02851390838623047, 0.03089141845703125, 0.03326892852783203, 0.03564643859863281, 0.038023948669433594, 0.040401458740234375, 0.042778968811035156, 0.04515647888183594, 0.04753398895263672, 0.0499114990234375, 0.05228900909423828, 0.05466651916503906, 0.057044029235839844, 0.059421539306640625, 0.061799049377441406, 0.06417655944824219, 0.06655406951904297, 0.06893157958984375, 0.07130908966064453, 0.07368659973144531, 0.0760641098022461, 0.07844161987304688, 0.08081912994384766, 0.08319664001464844, 0.08557415008544922, 0.08795166015625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 7.0, 10.0, 25.0, 29.0, 40.0, 61.0, 67.0, 86.0, 115.0, 132.0, 103.0, 76.0, 67.0, 54.0, 35.0, 26.0, 21.0, 17.0, 10.0, 7.0, 4.0, 6.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.329183578491211e-05, -1.2893229722976685e-05, -1.249462366104126e-05, -1.2096017599105835e-05, -1.169741153717041e-05, -1.1298805475234985e-05, -1.090019941329956e-05, -1.0501593351364136e-05, -1.0102987289428711e-05, -9.704381227493286e-06, -9.305775165557861e-06, -8.907169103622437e-06, -8.508563041687012e-06, -8.109956979751587e-06, -7.711350917816162e-06, -7.312744855880737e-06, -6.9141387939453125e-06, -6.515532732009888e-06, -6.116926670074463e-06, -5.718320608139038e-06, -5.319714546203613e-06, -4.9211084842681885e-06, -4.522502422332764e-06, -4.123896360397339e-06, -3.725290298461914e-06, -3.3266842365264893e-06, -2.9280781745910645e-06, -2.5294721126556396e-06, -2.130866050720215e-06, -1.73225998878479e-06, -1.3336539268493652e-06, -9.350478649139404e-07, -5.364418029785156e-07, -1.3783574104309082e-07, 2.60770320892334e-07, 6.593763828277588e-07, 1.0579824447631836e-06, 1.4565885066986084e-06, 1.8551945686340332e-06, 2.253800630569458e-06, 2.652406692504883e-06, 3.0510127544403076e-06, 3.4496188163757324e-06, 3.848224878311157e-06, 4.246830940246582e-06, 4.645437002182007e-06, 5.044043064117432e-06, 5.4426491260528564e-06, 5.841255187988281e-06, 6.239861249923706e-06, 6.638467311859131e-06, 7.037073373794556e-06, 7.4356794357299805e-06, 7.834285497665405e-06, 8.23289155960083e-06, 8.631497621536255e-06, 9.03010368347168e-06, 9.428709745407104e-06, 9.82731580734253e-06, 1.0225921869277954e-05, 1.0624527931213379e-05, 1.1023133993148804e-05, 1.1421740055084229e-05, 1.1820346117019653e-05, 1.2218952178955078e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 6.0, 11.0, 7.0, 23.0, 64.0, 96.0, 212.0, 539.0, 1862.0, 12027.0, 209089.0, 749240.0, 68029.0, 5556.0, 1125.0, 374.0, 135.0, 69.0, 49.0, 18.0, 17.0, 7.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10675048828125, -0.10381126403808594, -0.10087203979492188, -0.09793281555175781, -0.09499359130859375, -0.09205436706542969, -0.08911514282226562, -0.08617591857910156, -0.0832366943359375, -0.08029747009277344, -0.07735824584960938, -0.07441902160644531, -0.07147979736328125, -0.06854057312011719, -0.06560134887695312, -0.06266212463378906, -0.059722900390625, -0.05678367614746094, -0.053844451904296875, -0.05090522766113281, -0.04796600341796875, -0.04502677917480469, -0.042087554931640625, -0.03914833068847656, -0.0362091064453125, -0.03326988220214844, -0.030330657958984375, -0.027391433715820312, -0.02445220947265625, -0.021512985229492188, -0.018573760986328125, -0.015634536743164062, -0.0126953125, -0.009756088256835938, -0.006816864013671875, -0.0038776397705078125, -0.00093841552734375, 0.0020008087158203125, 0.004940032958984375, 0.007879257202148438, 0.0108184814453125, 0.013757705688476562, 0.016696929931640625, 0.019636154174804688, 0.02257537841796875, 0.025514602661132812, 0.028453826904296875, 0.03139305114746094, 0.034332275390625, 0.03727149963378906, 0.040210723876953125, 0.04314994812011719, 0.04608917236328125, 0.04902839660644531, 0.051967620849609375, 0.05490684509277344, 0.0578460693359375, 0.06078529357910156, 0.06372451782226562, 0.06666374206542969, 0.06960296630859375, 0.07254219055175781, 0.07548141479492188, 0.07842063903808594, 0.08135986328125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 8.0, 11.0, 17.0, 20.0, 38.0, 55.0, 52.0, 99.0, 114.0, 125.0, 101.0, 94.0, 95.0, 69.0, 28.0, 26.0, 21.0, 7.0, 6.0, 5.0, 8.0, 4.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09869384765625, -0.09633779525756836, -0.09398174285888672, -0.09162569046020508, -0.08926963806152344, -0.0869135856628418, -0.08455753326416016, -0.08220148086547852, -0.07984542846679688, -0.07748937606811523, -0.0751333236694336, -0.07277727127075195, -0.07042121887207031, -0.06806516647338867, -0.06570911407470703, -0.06335306167602539, -0.06099700927734375, -0.05864095687866211, -0.05628490447998047, -0.05392885208129883, -0.05157279968261719, -0.04921674728393555, -0.046860694885253906, -0.044504642486572266, -0.042148590087890625, -0.039792537689208984, -0.037436485290527344, -0.0350804328918457, -0.03272438049316406, -0.030368328094482422, -0.02801227569580078, -0.02565622329711914, -0.0233001708984375, -0.02094411849975586, -0.01858806610107422, -0.016232013702392578, -0.013875961303710938, -0.011519908905029297, -0.009163856506347656, -0.006807804107666016, -0.004451751708984375, -0.0020956993103027344, 0.00026035308837890625, 0.002616405487060547, 0.0049724578857421875, 0.007328510284423828, 0.009684562683105469, 0.01204061508178711, 0.01439666748046875, 0.01675271987915039, 0.01910877227783203, 0.021464824676513672, 0.023820877075195312, 0.026176929473876953, 0.028532981872558594, 0.030889034271240234, 0.033245086669921875, 0.035601139068603516, 0.037957191467285156, 0.0403132438659668, 0.04266929626464844, 0.04502534866333008, 0.04738140106201172, 0.04973745346069336, 0.052093505859375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 9.0, 23.0, 77.0, 170.0, 303.0, 263.0, 112.0, 32.0, 17.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4553911685943604, -2.396761178970337, -2.3381314277648926, -2.279501438140869, -2.2208714485168457, -2.1622414588928223, -2.103611707687378, -2.0449817180633545, -1.986351728439331, -1.9277218580245972, -1.8690918684005737, -1.8104619979858398, -1.7518320083618164, -1.6932021379470825, -1.634572148323059, -1.5759422779083252, -1.5173122882843018, -1.4586824178695679, -1.4000524282455444, -1.3414225578308105, -1.282792568206787, -1.2241626977920532, -1.1655327081680298, -1.106902837753296, -1.048272967338562, -0.9896430373191833, -0.9310131072998047, -0.872383177280426, -0.8137532472610474, -0.7551233768463135, -0.69649338722229, -0.6378635168075562, -0.5792335271835327, -0.520603597164154, -0.4619736671447754, -0.40334373712539673, -0.34471380710601807, -0.2860839068889618, -0.22745397686958313, -0.16882404685020447, -0.1101941168308258, -0.05156419053673744, 0.007065735757350922, 0.06569565832614899, 0.12432558834552765, 0.18295550346374512, 0.24158543348312378, 0.30021536350250244, 0.3588452935218811, 0.41747522354125977, 0.4761051535606384, 0.5347350835800171, 0.5933650135993958, 0.6519949436187744, 0.7106248140335083, 0.7692548036575317, 0.8278846740722656, 0.8865146040916443, 0.945144534111023, 1.0037744045257568, 1.0624043941497803, 1.1210342645645142, 1.1796642541885376, 1.2382941246032715, 1.296924114227295]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 6.0, 9.0, 4.0, 5.0, 10.0, 15.0, 14.0, 12.0, 18.0, 20.0, 30.0, 33.0, 23.0, 30.0, 32.0, 48.0, 41.0, 50.0, 48.0, 40.0, 52.0, 40.0, 50.0, 34.0, 41.0, 38.0, 31.0, 37.0, 21.0, 21.0, 25.0, 29.0, 19.0, 18.0, 13.0, 9.0, 11.0, 10.0, 7.0, 3.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6759023070335388, -0.6527527570724487, -0.6296032071113586, -0.6064536571502686, -0.5833041071891785, -0.5601545572280884, -0.5370050668716431, -0.513855516910553, -0.4907059669494629, -0.4675564169883728, -0.4444068670272827, -0.4212573170661926, -0.3981077969074249, -0.37495824694633484, -0.35180869698524475, -0.32865917682647705, -0.3055095970630646, -0.2823600471019745, -0.2592104971408844, -0.2360609620809555, -0.2129114270210266, -0.18976187705993652, -0.16661232709884644, -0.14346279203891754, -0.12031324207782745, -0.09716369956731796, -0.07401415705680847, -0.050864607095718384, -0.027715064585208893, -0.004565522074699402, 0.018584027886390686, 0.04173356294631958, 0.06488311290740967, 0.08803265541791916, 0.11118219792842865, 0.13433174788951874, 0.15748128294944763, 0.18063083291053772, 0.2037803828716278, 0.2269299179315567, 0.2500794529914856, 0.2732290029525757, 0.29637855291366577, 0.31952810287475586, 0.34267762303352356, 0.36582717299461365, 0.38897672295570374, 0.41212624311447144, 0.4352758228778839, 0.458425372838974, 0.4815749228000641, 0.5047244429588318, 0.5278739929199219, 0.551023542881012, 0.574173092842102, 0.5973226428031921, 0.6204721927642822, 0.6436217427253723, 0.6667712926864624, 0.6899208426475525, 0.7130703926086426, 0.7362198829650879, 0.7593694925308228, 0.7825189828872681, 0.8056685328483582]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 6.0, 9.0, 11.0, 14.0, 26.0, 22.0, 37.0, 46.0, 67.0, 140.0, 207.0, 326.0, 451.0, 813.0, 1184.0, 2143.0, 3814.0, 7355.0, 16671.0, 50743.0, 314833.0, 3563877.0, 168659.0, 36184.0, 13121.0, 5993.0, 3084.0, 1665.0, 1016.0, 595.0, 400.0, 273.0, 137.0, 99.0, 74.0, 66.0, 41.0, 31.0, 15.0, 12.0, 8.0, 4.0, 9.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08233642578125, -0.07943344116210938, -0.07653045654296875, -0.07362747192382812, -0.0707244873046875, -0.06782150268554688, -0.06491851806640625, -0.062015533447265625, -0.059112548828125, -0.056209564208984375, -0.05330657958984375, -0.050403594970703125, -0.0475006103515625, -0.044597625732421875, -0.04169464111328125, -0.038791656494140625, -0.035888671875, -0.032985687255859375, -0.03008270263671875, -0.027179718017578125, -0.0242767333984375, -0.021373748779296875, -0.01847076416015625, -0.015567779541015625, -0.012664794921875, -0.009761810302734375, -0.00685882568359375, -0.003955841064453125, -0.0010528564453125, 0.001850128173828125, 0.00475311279296875, 0.007656097412109375, 0.01055908203125, 0.013462066650390625, 0.01636505126953125, 0.019268035888671875, 0.0221710205078125, 0.025074005126953125, 0.02797698974609375, 0.030879974365234375, 0.033782958984375, 0.036685943603515625, 0.03958892822265625, 0.042491912841796875, 0.0453948974609375, 0.048297882080078125, 0.05120086669921875, 0.054103851318359375, 0.0570068359375, 0.059909820556640625, 0.06281280517578125, 0.06571578979492188, 0.0686187744140625, 0.07152175903320312, 0.07442474365234375, 0.07732772827148438, 0.080230712890625, 0.08313369750976562, 0.08603668212890625, 0.08893966674804688, 0.0918426513671875, 0.09474563598632812, 0.09764862060546875, 0.10055160522460938, 0.10345458984375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 4.0, 9.0, 9.0, 17.0, 16.0, 22.0, 22.0, 25.0, 36.0, 28.0, 27.0, 51.0, 48.0, 54.0, 53.0, 53.0, 48.0, 45.0, 43.0, 58.0, 53.0, 49.0, 31.0, 35.0, 30.0, 28.0, 28.0, 13.0, 16.0, 18.0, 7.0, 10.0, 7.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042022705078125, -0.040644168853759766, -0.03926563262939453, -0.0378870964050293, -0.03650856018066406, -0.03513002395629883, -0.033751487731933594, -0.03237295150756836, -0.030994415283203125, -0.02961587905883789, -0.028237342834472656, -0.026858806610107422, -0.025480270385742188, -0.024101734161376953, -0.02272319793701172, -0.021344661712646484, -0.01996612548828125, -0.018587589263916016, -0.01720905303955078, -0.015830516815185547, -0.014451980590820312, -0.013073444366455078, -0.011694908142089844, -0.01031637191772461, -0.008937835693359375, -0.007559299468994141, -0.006180763244628906, -0.004802227020263672, -0.0034236907958984375, -0.002045154571533203, -0.0006666183471679688, 0.0007119178771972656, 0.0020904541015625, 0.0034689903259277344, 0.004847526550292969, 0.006226062774658203, 0.0076045989990234375, 0.008983135223388672, 0.010361671447753906, 0.01174020767211914, 0.013118743896484375, 0.01449728012084961, 0.015875816345214844, 0.017254352569580078, 0.018632888793945312, 0.020011425018310547, 0.02138996124267578, 0.022768497467041016, 0.02414703369140625, 0.025525569915771484, 0.02690410614013672, 0.028282642364501953, 0.029661178588867188, 0.031039714813232422, 0.032418251037597656, 0.03379678726196289, 0.035175323486328125, 0.03655385971069336, 0.037932395935058594, 0.03931093215942383, 0.04068946838378906, 0.0420680046081543, 0.04344654083251953, 0.044825077056884766, 0.04620361328125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 12.0, 14.0, 8.0, 19.0, 34.0, 51.0, 62.0, 103.0, 140.0, 234.0, 369.0, 722.0, 1326.0, 2808.0, 6956.0, 21564.0, 108525.0, 3564499.0, 422728.0, 43932.0, 11835.0, 4214.0, 1764.0, 954.0, 511.0, 306.0, 215.0, 143.0, 74.0, 50.0, 38.0, 19.0, 12.0, 14.0, 13.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.126953125, -0.1230764389038086, -0.11919975280761719, -0.11532306671142578, -0.11144638061523438, -0.10756969451904297, -0.10369300842285156, -0.09981632232666016, -0.09593963623046875, -0.09206295013427734, -0.08818626403808594, -0.08430957794189453, -0.08043289184570312, -0.07655620574951172, -0.07267951965332031, -0.0688028335571289, -0.0649261474609375, -0.061049461364746094, -0.05717277526855469, -0.05329608917236328, -0.049419403076171875, -0.04554271697998047, -0.04166603088378906, -0.037789344787597656, -0.03391265869140625, -0.030035972595214844, -0.026159286499023438, -0.02228260040283203, -0.018405914306640625, -0.014529228210449219, -0.010652542114257812, -0.006775856018066406, -0.002899169921875, 0.0009775161743164062, 0.0048542022705078125, 0.008730888366699219, 0.012607574462890625, 0.01648426055908203, 0.020360946655273438, 0.024237632751464844, 0.02811431884765625, 0.031991004943847656, 0.03586769104003906, 0.03974437713623047, 0.043621063232421875, 0.04749774932861328, 0.05137443542480469, 0.055251121520996094, 0.0591278076171875, 0.0630044937133789, 0.06688117980957031, 0.07075786590576172, 0.07463455200195312, 0.07851123809814453, 0.08238792419433594, 0.08626461029052734, 0.09014129638671875, 0.09401798248291016, 0.09789466857910156, 0.10177135467529297, 0.10564804077148438, 0.10952472686767578, 0.11340141296386719, 0.1172780990600586, 0.12115478515625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 13.0, 16.0, 38.0, 52.0, 121.0, 512.0, 2728.0, 355.0, 112.0, 47.0, 34.0, 14.0, 7.0, 5.0, 7.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.107421875, -0.10389041900634766, -0.10035896301269531, -0.09682750701904297, -0.09329605102539062, -0.08976459503173828, -0.08623313903808594, -0.0827016830444336, -0.07917022705078125, -0.0756387710571289, -0.07210731506347656, -0.06857585906982422, -0.06504440307617188, -0.06151294708251953, -0.05798149108886719, -0.054450035095214844, -0.0509185791015625, -0.047387123107910156, -0.04385566711425781, -0.04032421112060547, -0.036792755126953125, -0.03326129913330078, -0.029729843139648438, -0.026198387145996094, -0.02266693115234375, -0.019135475158691406, -0.015604019165039062, -0.012072563171386719, -0.008541107177734375, -0.005009651184082031, -0.0014781951904296875, 0.0020532608032226562, 0.005584716796875, 0.009116172790527344, 0.012647628784179688, 0.01617908477783203, 0.019710540771484375, 0.02324199676513672, 0.026773452758789062, 0.030304908752441406, 0.03383636474609375, 0.037367820739746094, 0.04089927673339844, 0.04443073272705078, 0.047962188720703125, 0.05149364471435547, 0.05502510070800781, 0.058556556701660156, 0.0620880126953125, 0.06561946868896484, 0.06915092468261719, 0.07268238067626953, 0.07621383666992188, 0.07974529266357422, 0.08327674865722656, 0.0868082046508789, 0.09033966064453125, 0.0938711166381836, 0.09740257263183594, 0.10093402862548828, 0.10446548461914062, 0.10799694061279297, 0.11152839660644531, 0.11505985260009766, 0.11859130859375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 5.0, 3.0, 8.0, 17.0, 29.0, 67.0, 111.0, 162.0, 177.0, 162.0, 116.0, 57.0, 36.0, 17.0, 11.0, 13.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42981791496276855, -0.41735705733299255, -0.40489619970321655, -0.39243531227111816, -0.37997445464134216, -0.36751359701156616, -0.3550527095794678, -0.3425918519496918, -0.33013099431991577, -0.31767013669013977, -0.30520927906036377, -0.2927483916282654, -0.2802875339984894, -0.2678266763687134, -0.255365788936615, -0.242904931306839, -0.230444073677063, -0.217983216047287, -0.2055223435163498, -0.1930614709854126, -0.1806006133556366, -0.1681397557258606, -0.1556788831949234, -0.1432180106639862, -0.1307571530342102, -0.11829628795385361, -0.10583542287349701, -0.09337455779314041, -0.08091369271278381, -0.06845282763242722, -0.05599196255207062, -0.04353109747171402, -0.031070202589035034, -0.018609337508678436, -0.006148472428321838, 0.0063123926520347595, 0.018773257732391357, 0.031234122812747955, 0.04369498789310455, 0.05615585297346115, 0.06861671805381775, 0.08107758313417435, 0.09353844821453094, 0.10599931329488754, 0.11846017837524414, 0.13092103600502014, 0.14338190853595734, 0.15584278106689453, 0.16830363869667053, 0.18076449632644653, 0.19322536885738373, 0.20568624138832092, 0.21814709901809692, 0.23060795664787292, 0.24306882917881012, 0.2555297017097473, 0.2679905593395233, 0.2804514169692993, 0.2929123044013977, 0.3053731620311737, 0.3178340196609497, 0.3302948772907257, 0.3427557349205017, 0.3552166223526001, 0.3676774799823761]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 8.0, 5.0, 5.0, 11.0, 9.0, 13.0, 19.0, 15.0, 17.0, 26.0, 31.0, 34.0, 38.0, 48.0, 45.0, 36.0, 41.0, 50.0, 64.0, 53.0, 49.0, 37.0, 46.0, 47.0, 42.0, 38.0, 28.0, 33.0, 22.0, 20.0, 8.0, 11.0, 8.0, 11.0, 11.0, 4.0, 7.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.2289496660232544, -0.2222941517829895, -0.21563862264156342, -0.20898310840129852, -0.20232759416103363, -0.19567206501960754, -0.18901655077934265, -0.18236103653907776, -0.17570552229881287, -0.16905000805854797, -0.1623944789171219, -0.155738964676857, -0.1490834504365921, -0.14242792129516602, -0.13577240705490112, -0.12911689281463623, -0.12246136367321014, -0.11580584198236465, -0.10915032774209976, -0.10249480605125427, -0.09583929181098938, -0.08918377012014389, -0.0825282484292984, -0.07587273418903351, -0.06921721249818802, -0.06256169080734253, -0.05590617656707764, -0.04925065487623215, -0.042595136910676956, -0.035939618945121765, -0.029284097254276276, -0.022628579288721085, -0.015973061323165894, -0.009317542426288128, -0.0026620235294103622, 0.003993496298789978, 0.010649014264345169, 0.01730453222990036, 0.02396005392074585, 0.03061557188630104, 0.03727108985185623, 0.04392660781741142, 0.050582125782966614, 0.0572376474738121, 0.06389316916465759, 0.07054868340492249, 0.07720420509576797, 0.08385972678661346, 0.09051524102687836, 0.09717076271772385, 0.10382627695798874, 0.11048179864883423, 0.11713731288909912, 0.12379283457994461, 0.1304483562707901, 0.137103870511055, 0.14375939965248108, 0.15041491389274597, 0.15707044303417206, 0.16372595727443695, 0.17038147151470184, 0.17703700065612793, 0.18369251489639282, 0.19034802913665771, 0.1970035433769226]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 5.0, 6.0, 5.0, 10.0, 17.0, 19.0, 26.0, 50.0, 66.0, 118.0, 179.0, 345.0, 551.0, 1007.0, 1917.0, 4240.0, 9851.0, 26781.0, 78724.0, 227940.0, 383288.0, 203399.0, 69364.0, 23825.0, 9137.0, 3772.0, 1710.0, 925.0, 489.0, 289.0, 186.0, 109.0, 71.0, 55.0, 22.0, 17.0, 14.0, 11.0, 8.0, 4.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.10760498046875, -0.10428810119628906, -0.10097122192382812, -0.09765434265136719, -0.09433746337890625, -0.09102058410644531, -0.08770370483398438, -0.08438682556152344, -0.0810699462890625, -0.07775306701660156, -0.07443618774414062, -0.07111930847167969, -0.06780242919921875, -0.06448554992675781, -0.061168670654296875, -0.05785179138183594, -0.054534912109375, -0.05121803283691406, -0.047901153564453125, -0.04458427429199219, -0.04126739501953125, -0.03795051574707031, -0.034633636474609375, -0.03131675720214844, -0.0279998779296875, -0.024682998657226562, -0.021366119384765625, -0.018049240112304688, -0.01473236083984375, -0.011415481567382812, -0.008098602294921875, -0.0047817230224609375, -0.00146484375, 0.0018520355224609375, 0.005168914794921875, 0.008485794067382812, 0.01180267333984375, 0.015119552612304688, 0.018436431884765625, 0.021753311157226562, 0.0250701904296875, 0.028387069702148438, 0.031703948974609375, 0.03502082824707031, 0.03833770751953125, 0.04165458679199219, 0.044971466064453125, 0.04828834533691406, 0.051605224609375, 0.05492210388183594, 0.058238983154296875, 0.06155586242675781, 0.06487274169921875, 0.06818962097167969, 0.07150650024414062, 0.07482337951660156, 0.0781402587890625, 0.08145713806152344, 0.08477401733398438, 0.08809089660644531, 0.09140777587890625, 0.09472465515136719, 0.09804153442382812, 0.10135841369628906, 0.10467529296875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 7.0, 8.0, 8.0, 13.0, 20.0, 18.0, 21.0, 15.0, 26.0, 28.0, 39.0, 42.0, 37.0, 44.0, 48.0, 50.0, 41.0, 54.0, 53.0, 46.0, 55.0, 40.0, 37.0, 28.0, 33.0, 25.0, 33.0, 33.0, 24.0, 14.0, 17.0, 8.0, 9.0, 9.0, 8.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0416259765625, -0.040255069732666016, -0.03888416290283203, -0.03751325607299805, -0.03614234924316406, -0.03477144241333008, -0.033400535583496094, -0.03202962875366211, -0.030658721923828125, -0.02928781509399414, -0.027916908264160156, -0.026546001434326172, -0.025175094604492188, -0.023804187774658203, -0.02243328094482422, -0.021062374114990234, -0.01969146728515625, -0.018320560455322266, -0.01694965362548828, -0.015578746795654297, -0.014207839965820312, -0.012836933135986328, -0.011466026306152344, -0.01009511947631836, -0.008724212646484375, -0.007353305816650391, -0.005982398986816406, -0.004611492156982422, -0.0032405853271484375, -0.0018696784973144531, -0.0004987716674804688, 0.0008721351623535156, 0.0022430419921875, 0.0036139488220214844, 0.004984855651855469, 0.006355762481689453, 0.0077266693115234375, 0.009097576141357422, 0.010468482971191406, 0.01183938980102539, 0.013210296630859375, 0.01458120346069336, 0.015952110290527344, 0.017323017120361328, 0.018693923950195312, 0.020064830780029297, 0.02143573760986328, 0.022806644439697266, 0.02417755126953125, 0.025548458099365234, 0.02691936492919922, 0.028290271759033203, 0.029661178588867188, 0.031032085418701172, 0.032402992248535156, 0.03377389907836914, 0.035144805908203125, 0.03651571273803711, 0.037886619567871094, 0.03925752639770508, 0.04062843322753906, 0.04199934005737305, 0.04337024688720703, 0.044741153717041016, 0.046112060546875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 7.0, 15.0, 14.0, 20.0, 25.0, 68.0, 65.0, 149.0, 238.0, 456.0, 1015.0, 2611.0, 8212.0, 32104.0, 167909.0, 583485.0, 200343.0, 37401.0, 9186.0, 2925.0, 1122.0, 500.0, 283.0, 145.0, 85.0, 53.0, 39.0, 26.0, 18.0, 11.0, 5.0, 3.0, 5.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.135009765625, -0.13059043884277344, -0.12617111206054688, -0.12175178527832031, -0.11733245849609375, -0.11291313171386719, -0.10849380493164062, -0.10407447814941406, -0.0996551513671875, -0.09523582458496094, -0.09081649780273438, -0.08639717102050781, -0.08197784423828125, -0.07755851745605469, -0.07313919067382812, -0.06871986389160156, -0.064300537109375, -0.05988121032714844, -0.055461883544921875, -0.05104255676269531, -0.04662322998046875, -0.04220390319824219, -0.037784576416015625, -0.03336524963378906, -0.0289459228515625, -0.024526596069335938, -0.020107269287109375, -0.015687942504882812, -0.01126861572265625, -0.0068492889404296875, -0.002429962158203125, 0.0019893646240234375, 0.00640869140625, 0.010828018188476562, 0.015247344970703125, 0.019666671752929688, 0.02408599853515625, 0.028505325317382812, 0.032924652099609375, 0.03734397888183594, 0.0417633056640625, 0.04618263244628906, 0.050601959228515625, 0.05502128601074219, 0.05944061279296875, 0.06385993957519531, 0.06827926635742188, 0.07269859313964844, 0.077117919921875, 0.08153724670410156, 0.08595657348632812, 0.09037590026855469, 0.09479522705078125, 0.09921455383300781, 0.10363388061523438, 0.10805320739746094, 0.1124725341796875, 0.11689186096191406, 0.12131118774414062, 0.1257305145263672, 0.13014984130859375, 0.1345691680908203, 0.13898849487304688, 0.14340782165527344, 0.1478271484375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 3.0, 8.0, 1.0, 8.0, 2.0, 3.0, 7.0, 11.0, 7.0, 22.0, 14.0, 16.0, 23.0, 25.0, 31.0, 26.0, 27.0, 43.0, 28.0, 38.0, 53.0, 52.0, 54.0, 38.0, 52.0, 30.0, 33.0, 39.0, 34.0, 37.0, 26.0, 16.0, 33.0, 23.0, 23.0, 15.0, 20.0, 10.0, 16.0, 9.0, 12.0, 8.0, 8.0, 9.0, 5.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.15673828125, -0.15172958374023438, -0.14672088623046875, -0.14171218872070312, -0.1367034912109375, -0.13169479370117188, -0.12668609619140625, -0.12167739868164062, -0.116668701171875, -0.11166000366210938, -0.10665130615234375, -0.10164260864257812, -0.0966339111328125, -0.09162521362304688, -0.08661651611328125, -0.08160781860351562, -0.07659912109375, -0.07159042358398438, -0.06658172607421875, -0.061573028564453125, -0.0565643310546875, -0.051555633544921875, -0.04654693603515625, -0.041538238525390625, -0.036529541015625, -0.031520843505859375, -0.02651214599609375, -0.021503448486328125, -0.0164947509765625, -0.011486053466796875, -0.00647735595703125, -0.001468658447265625, 0.0035400390625, 0.008548736572265625, 0.01355743408203125, 0.018566131591796875, 0.0235748291015625, 0.028583526611328125, 0.03359222412109375, 0.038600921630859375, 0.043609619140625, 0.048618316650390625, 0.05362701416015625, 0.058635711669921875, 0.0636444091796875, 0.06865310668945312, 0.07366180419921875, 0.07867050170898438, 0.08367919921875, 0.08868789672851562, 0.09369659423828125, 0.09870529174804688, 0.1037139892578125, 0.10872268676757812, 0.11373138427734375, 0.11874008178710938, 0.123748779296875, 0.12875747680664062, 0.13376617431640625, 0.13877487182617188, 0.1437835693359375, 0.14879226684570312, 0.15380096435546875, 0.15880966186523438, 0.163818359375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 6.0, 5.0, 11.0, 23.0, 35.0, 20.0, 54.0, 45.0, 86.0, 120.0, 144.0, 238.0, 346.0, 562.0, 927.0, 1721.0, 3266.0, 8756.0, 31248.0, 191031.0, 648093.0, 124477.0, 23689.0, 6927.0, 2847.0, 1389.0, 869.0, 505.0, 335.0, 249.0, 158.0, 105.0, 74.0, 56.0, 45.0, 26.0, 13.0, 15.0, 11.0, 8.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.057464599609375, -0.05551004409790039, -0.05355548858642578, -0.05160093307495117, -0.04964637756347656, -0.04769182205200195, -0.045737266540527344, -0.043782711029052734, -0.041828155517578125, -0.039873600006103516, -0.037919044494628906, -0.0359644889831543, -0.03400993347167969, -0.03205537796020508, -0.03010082244873047, -0.02814626693725586, -0.02619171142578125, -0.02423715591430664, -0.02228260040283203, -0.020328044891357422, -0.018373489379882812, -0.016418933868408203, -0.014464378356933594, -0.012509822845458984, -0.010555267333984375, -0.008600711822509766, -0.006646156311035156, -0.004691600799560547, -0.0027370452880859375, -0.0007824897766113281, 0.0011720657348632812, 0.0031266212463378906, 0.0050811767578125, 0.007035732269287109, 0.008990287780761719, 0.010944843292236328, 0.012899398803710938, 0.014853954315185547, 0.016808509826660156, 0.018763065338134766, 0.020717620849609375, 0.022672176361083984, 0.024626731872558594, 0.026581287384033203, 0.028535842895507812, 0.030490398406982422, 0.03244495391845703, 0.03439950942993164, 0.03635406494140625, 0.03830862045288086, 0.04026317596435547, 0.04221773147583008, 0.04417228698730469, 0.0461268424987793, 0.048081398010253906, 0.050035953521728516, 0.051990509033203125, 0.053945064544677734, 0.055899620056152344, 0.05785417556762695, 0.05980873107910156, 0.06176328659057617, 0.06371784210205078, 0.06567239761352539, 0.067626953125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 12.0, 7.0, 18.0, 26.0, 45.0, 81.0, 90.0, 135.0, 154.0, 116.0, 114.0, 69.0, 45.0, 39.0, 23.0, 5.0, 13.0, 0.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2232532501220703e-05, -2.1656043827533722e-05, -2.107955515384674e-05, -2.050306648015976e-05, -1.992657780647278e-05, -1.9350089132785797e-05, -1.8773600459098816e-05, -1.8197111785411835e-05, -1.7620623111724854e-05, -1.7044134438037872e-05, -1.646764576435089e-05, -1.589115709066391e-05, -1.531466841697693e-05, -1.4738179743289948e-05, -1.4161691069602966e-05, -1.3585202395915985e-05, -1.3008713722229004e-05, -1.2432225048542023e-05, -1.1855736374855042e-05, -1.127924770116806e-05, -1.0702759027481079e-05, -1.0126270353794098e-05, -9.549781680107117e-06, -8.973293006420135e-06, -8.396804332733154e-06, -7.820315659046173e-06, -7.243826985359192e-06, -6.667338311672211e-06, -6.0908496379852295e-06, -5.514360964298248e-06, -4.937872290611267e-06, -4.361383616924286e-06, -3.7848949432373047e-06, -3.2084062695503235e-06, -2.6319175958633423e-06, -2.055428922176361e-06, -1.4789402484893799e-06, -9.024515748023987e-07, -3.259629011154175e-07, 2.505257725715637e-07, 8.270144462585449e-07, 1.4035031199455261e-06, 1.9799917936325073e-06, 2.5564804673194885e-06, 3.1329691410064697e-06, 3.709457814693451e-06, 4.285946488380432e-06, 4.862435162067413e-06, 5.4389238357543945e-06, 6.015412509441376e-06, 6.591901183128357e-06, 7.168389856815338e-06, 7.74487853050232e-06, 8.3213672041893e-06, 8.897855877876282e-06, 9.474344551563263e-06, 1.0050833225250244e-05, 1.0627321898937225e-05, 1.1203810572624207e-05, 1.1780299246311188e-05, 1.2356787919998169e-05, 1.293327659368515e-05, 1.3509765267372131e-05, 1.4086253941059113e-05, 1.4662742614746094e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 6.0, 8.0, 6.0, 9.0, 11.0, 17.0, 25.0, 34.0, 67.0, 66.0, 76.0, 115.0, 169.0, 261.0, 439.0, 758.0, 1377.0, 3322.0, 10840.0, 64494.0, 640610.0, 286015.0, 28732.0, 6095.0, 2235.0, 1082.0, 557.0, 376.0, 229.0, 130.0, 102.0, 78.0, 61.0, 41.0, 35.0, 24.0, 17.0, 9.0, 11.0, 8.0, 3.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.078125, -0.07558822631835938, -0.07305145263671875, -0.07051467895507812, -0.0679779052734375, -0.06544113159179688, -0.06290435791015625, -0.060367584228515625, -0.057830810546875, -0.055294036865234375, -0.05275726318359375, -0.050220489501953125, -0.0476837158203125, -0.045146942138671875, -0.04261016845703125, -0.040073394775390625, -0.03753662109375, -0.034999847412109375, -0.03246307373046875, -0.029926300048828125, -0.0273895263671875, -0.024852752685546875, -0.02231597900390625, -0.019779205322265625, -0.017242431640625, -0.014705657958984375, -0.01216888427734375, -0.009632110595703125, -0.0070953369140625, -0.004558563232421875, -0.00202178955078125, 0.000514984130859375, 0.0030517578125, 0.005588531494140625, 0.00812530517578125, 0.010662078857421875, 0.0131988525390625, 0.015735626220703125, 0.01827239990234375, 0.020809173583984375, 0.023345947265625, 0.025882720947265625, 0.02841949462890625, 0.030956268310546875, 0.0334930419921875, 0.036029815673828125, 0.03856658935546875, 0.041103363037109375, 0.04364013671875, 0.046176910400390625, 0.04871368408203125, 0.051250457763671875, 0.0537872314453125, 0.056324005126953125, 0.05886077880859375, 0.061397552490234375, 0.063934326171875, 0.06647109985351562, 0.06900787353515625, 0.07154464721679688, 0.0740814208984375, 0.07661819458007812, 0.07915496826171875, 0.08169174194335938, 0.084228515625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 13.0, 25.0, 41.0, 74.0, 109.0, 197.0, 188.0, 149.0, 85.0, 47.0, 24.0, 21.0, 9.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1624755859375, -0.15820980072021484, -0.1539440155029297, -0.14967823028564453, -0.14541244506835938, -0.14114665985107422, -0.13688087463378906, -0.1326150894165039, -0.12834930419921875, -0.1240835189819336, -0.11981773376464844, -0.11555194854736328, -0.11128616333007812, -0.10702037811279297, -0.10275459289550781, -0.09848880767822266, -0.0942230224609375, -0.08995723724365234, -0.08569145202636719, -0.08142566680908203, -0.07715988159179688, -0.07289409637451172, -0.06862831115722656, -0.0643625259399414, -0.06009674072265625, -0.055830955505371094, -0.05156517028808594, -0.04729938507080078, -0.043033599853515625, -0.03876781463623047, -0.03450202941894531, -0.030236244201660156, -0.025970458984375, -0.021704673767089844, -0.017438888549804688, -0.013173103332519531, -0.008907318115234375, -0.004641532897949219, -0.0003757476806640625, 0.0038900375366210938, 0.00815582275390625, 0.012421607971191406, 0.016687393188476562, 0.02095317840576172, 0.025218963623046875, 0.02948474884033203, 0.03375053405761719, 0.038016319274902344, 0.0422821044921875, 0.046547889709472656, 0.05081367492675781, 0.05507946014404297, 0.059345245361328125, 0.06361103057861328, 0.06787681579589844, 0.0721426010131836, 0.07640838623046875, 0.0806741714477539, 0.08493995666503906, 0.08920574188232422, 0.09347152709960938, 0.09773731231689453, 0.10200309753417969, 0.10626888275146484, 0.11053466796875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 12.0, 36.0, 92.0, 220.0, 282.0, 214.0, 89.0, 34.0, 13.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6445916891098022, -1.580265998840332, -1.5159403085708618, -1.4516146183013916, -1.3872889280319214, -1.3229632377624512, -1.2586374282836914, -1.1943118572235107, -1.129986047744751, -1.0656603574752808, -1.0013346672058105, -0.9370089769363403, -0.8726832866668701, -0.8083575963973999, -0.7440318465232849, -0.6797061562538147, -0.6153805255889893, -0.551054835319519, -0.48672914505004883, -0.4224034249782562, -0.358077734708786, -0.2937520444393158, -0.2294263243675232, -0.16510063409805298, -0.10077494382858276, -0.03644924610853195, 0.02787645161151886, 0.09220215678215027, 0.15652784705162048, 0.2208535373210907, 0.2851792573928833, 0.3495049476623535, 0.4138305187225342, 0.4781562089920044, 0.5424818992614746, 0.6068075895309448, 0.671133279800415, 0.7354589700698853, 0.7997847199440002, 0.8641104102134705, 0.9284361004829407, 0.9927617907524109, 1.0570875406265259, 1.121413230895996, 1.1857389211654663, 1.2500646114349365, 1.3143903017044067, 1.378715991973877, 1.4430416822433472, 1.5073673725128174, 1.5716930627822876, 1.6360187530517578, 1.700344443321228, 1.7646701335906982, 1.828995943069458, 1.8933215141296387, 1.9576473236083984, 2.021973133087158, 2.086298704147339, 2.1506245136260986, 2.2149500846862793, 2.279275894165039, 2.3436014652252197, 2.4079272747039795, 2.47225284576416]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 5.0, 6.0, 13.0, 8.0, 7.0, 17.0, 17.0, 15.0, 13.0, 28.0, 32.0, 34.0, 35.0, 27.0, 36.0, 37.0, 48.0, 46.0, 41.0, 39.0, 44.0, 49.0, 41.0, 57.0, 30.0, 32.0, 36.0, 21.0, 22.0, 22.0, 23.0, 26.0, 12.0, 15.0, 12.0, 9.0, 10.0, 10.0, 6.0, 4.0, 2.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.8333945274353027, -0.8060218095779419, -0.7786490321159363, -0.7512763142585754, -0.7239035367965698, -0.696530818939209, -0.6691581010818481, -0.6417853832244873, -0.6144126057624817, -0.5870398879051208, -0.5596671104431152, -0.5322943925857544, -0.5049216747283936, -0.47754889726638794, -0.4501761794090271, -0.42280343174934387, -0.39543068408966064, -0.3680579364299774, -0.3406851887702942, -0.31331247091293335, -0.2859397232532501, -0.2585669755935669, -0.23119424283504486, -0.20382151007652283, -0.1764487624168396, -0.14907601475715637, -0.12170328199863434, -0.09433054178953171, -0.06695780158042908, -0.03958505392074585, -0.012212321162223816, 0.015160411596298218, 0.04253309965133667, 0.0699058398604393, 0.09727858006954193, 0.12465132027864456, 0.1520240604877472, 0.17939680814743042, 0.20676954090595245, 0.2341422736644745, 0.2615150213241577, 0.28888776898384094, 0.31626051664352417, 0.343633234500885, 0.37100598216056824, 0.39837872982025146, 0.4257514476776123, 0.45312419533729553, 0.48049694299697876, 0.5078696608543396, 0.5352424383163452, 0.562615156173706, 0.5899878740310669, 0.6173606514930725, 0.6447333693504333, 0.672106146812439, 0.6994788646697998, 0.7268515825271606, 0.7542243599891663, 0.7815970778465271, 0.8089698553085327, 0.8363425731658936, 0.8637152910232544, 0.8910880088806152, 0.9184607863426208]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 2.0, 3.0, 7.0, 3.0, 4.0, 13.0, 12.0, 14.0, 26.0, 37.0, 54.0, 71.0, 104.0, 165.0, 300.0, 616.0, 1636.0, 5012.0, 24784.0, 4089525.0, 59823.0, 7909.0, 2357.0, 846.0, 403.0, 183.0, 119.0, 81.0, 50.0, 34.0, 27.0, 17.0, 12.0, 9.0, 7.0, 5.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.1934814453125, -0.18773460388183594, -0.18198776245117188, -0.1762409210205078, -0.17049407958984375, -0.1647472381591797, -0.15900039672851562, -0.15325355529785156, -0.1475067138671875, -0.14175987243652344, -0.13601303100585938, -0.1302661895751953, -0.12451934814453125, -0.11877250671386719, -0.11302566528320312, -0.10727882385253906, -0.101531982421875, -0.09578514099121094, -0.09003829956054688, -0.08429145812988281, -0.07854461669921875, -0.07279777526855469, -0.06705093383789062, -0.06130409240722656, -0.0555572509765625, -0.04981040954589844, -0.044063568115234375, -0.03831672668457031, -0.03256988525390625, -0.026823043823242188, -0.021076202392578125, -0.015329360961914062, -0.00958251953125, -0.0038356781005859375, 0.001911163330078125, 0.0076580047607421875, 0.01340484619140625, 0.019151687622070312, 0.024898529052734375, 0.030645370483398438, 0.0363922119140625, 0.04213905334472656, 0.047885894775390625, 0.05363273620605469, 0.05937957763671875, 0.06512641906738281, 0.07087326049804688, 0.07662010192871094, 0.082366943359375, 0.08811378479003906, 0.09386062622070312, 0.09960746765136719, 0.10535430908203125, 0.11110115051269531, 0.11684799194335938, 0.12259483337402344, 0.1283416748046875, 0.13408851623535156, 0.13983535766601562, 0.1455821990966797, 0.15132904052734375, 0.1570758819580078, 0.16282272338867188, 0.16856956481933594, 0.17431640625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 0.0, 5.0, 5.0, 3.0, 13.0, 4.0, 6.0, 3.0, 12.0, 15.0, 11.0, 23.0, 23.0, 28.0, 27.0, 26.0, 22.0, 37.0, 39.0, 32.0, 48.0, 43.0, 47.0, 52.0, 41.0, 35.0, 39.0, 50.0, 44.0, 41.0, 52.0, 27.0, 23.0, 28.0, 20.0, 16.0, 15.0, 12.0, 12.0, 11.0, 6.0, 3.0, 1.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.048828125, -0.04736614227294922, -0.04590415954589844, -0.044442176818847656, -0.042980194091796875, -0.041518211364746094, -0.04005622863769531, -0.03859424591064453, -0.03713226318359375, -0.03567028045654297, -0.03420829772949219, -0.032746315002441406, -0.031284332275390625, -0.029822349548339844, -0.028360366821289062, -0.02689838409423828, -0.0254364013671875, -0.02397441864013672, -0.022512435913085938, -0.021050453186035156, -0.019588470458984375, -0.018126487731933594, -0.016664505004882812, -0.015202522277832031, -0.01374053955078125, -0.012278556823730469, -0.010816574096679688, -0.009354591369628906, -0.007892608642578125, -0.006430625915527344, -0.0049686431884765625, -0.0035066604614257812, -0.002044677734375, -0.0005826950073242188, 0.0008792877197265625, 0.0023412704467773438, 0.003803253173828125, 0.005265235900878906, 0.0067272186279296875, 0.008189201354980469, 0.00965118408203125, 0.011113166809082031, 0.012575149536132812, 0.014037132263183594, 0.015499114990234375, 0.016961097717285156, 0.018423080444335938, 0.01988506317138672, 0.0213470458984375, 0.02280902862548828, 0.024271011352539062, 0.025732994079589844, 0.027194976806640625, 0.028656959533691406, 0.030118942260742188, 0.03158092498779297, 0.03304290771484375, 0.03450489044189453, 0.03596687316894531, 0.037428855895996094, 0.038890838623046875, 0.040352821350097656, 0.04181480407714844, 0.04327678680419922, 0.04473876953125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 8.0, 2.0, 7.0, 14.0, 17.0, 23.0, 23.0, 82.0, 64.0, 122.0, 161.0, 260.0, 487.0, 787.0, 1350.0, 2646.0, 6173.0, 22737.0, 3774451.0, 353358.0, 19808.0, 5726.0, 2572.0, 1359.0, 759.0, 473.0, 257.0, 180.0, 116.0, 85.0, 51.0, 37.0, 24.0, 28.0, 11.0, 8.0, 5.0, 6.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.146728515625, -0.1421375274658203, -0.13754653930664062, -0.13295555114746094, -0.12836456298828125, -0.12377357482910156, -0.11918258666992188, -0.11459159851074219, -0.1100006103515625, -0.10540962219238281, -0.10081863403320312, -0.09622764587402344, -0.09163665771484375, -0.08704566955566406, -0.08245468139648438, -0.07786369323730469, -0.073272705078125, -0.06868171691894531, -0.06409072875976562, -0.05949974060058594, -0.05490875244140625, -0.05031776428222656, -0.045726776123046875, -0.04113578796386719, -0.0365447998046875, -0.03195381164550781, -0.027362823486328125, -0.022771835327148438, -0.01818084716796875, -0.013589859008789062, -0.008998870849609375, -0.0044078826904296875, 0.00018310546875, 0.0047740936279296875, 0.009365081787109375, 0.013956069946289062, 0.01854705810546875, 0.023138046264648438, 0.027729034423828125, 0.03232002258300781, 0.0369110107421875, 0.04150199890136719, 0.046092987060546875, 0.05068397521972656, 0.05527496337890625, 0.05986595153808594, 0.06445693969726562, 0.06904792785644531, 0.073638916015625, 0.07822990417480469, 0.08282089233398438, 0.08741188049316406, 0.09200286865234375, 0.09659385681152344, 0.10118484497070312, 0.10577583312988281, 0.1103668212890625, 0.11495780944824219, 0.11954879760742188, 0.12413978576660156, 0.12873077392578125, 0.13332176208496094, 0.13791275024414062, 0.1425037384033203, 0.1470947265625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 10.0, 18.0, 25.0, 67.0, 163.0, 3548.0, 110.0, 62.0, 20.0, 16.0, 2.0, 5.0, 5.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0328369140625, -0.03179121017456055, -0.030745506286621094, -0.02969980239868164, -0.028654098510742188, -0.027608394622802734, -0.02656269073486328, -0.025516986846923828, -0.024471282958984375, -0.023425579071044922, -0.02237987518310547, -0.021334171295166016, -0.020288467407226562, -0.01924276351928711, -0.018197059631347656, -0.017151355743408203, -0.01610565185546875, -0.015059947967529297, -0.014014244079589844, -0.01296854019165039, -0.011922836303710938, -0.010877132415771484, -0.009831428527832031, -0.008785724639892578, -0.007740020751953125, -0.006694316864013672, -0.005648612976074219, -0.004602909088134766, -0.0035572052001953125, -0.0025115013122558594, -0.0014657974243164062, -0.0004200935363769531, 0.0006256103515625, 0.0016713142395019531, 0.0027170181274414062, 0.0037627220153808594, 0.0048084259033203125, 0.005854129791259766, 0.006899833679199219, 0.007945537567138672, 0.008991241455078125, 0.010036945343017578, 0.011082649230957031, 0.012128353118896484, 0.013174057006835938, 0.01421976089477539, 0.015265464782714844, 0.016311168670654297, 0.01735687255859375, 0.018402576446533203, 0.019448280334472656, 0.02049398422241211, 0.021539688110351562, 0.022585391998291016, 0.02363109588623047, 0.024676799774169922, 0.025722503662109375, 0.026768207550048828, 0.02781391143798828, 0.028859615325927734, 0.029905319213867188, 0.03095102310180664, 0.031996726989746094, 0.03304243087768555, 0.034088134765625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 6.0, 15.0, 31.0, 29.0, 55.0, 95.0, 133.0, 139.0, 151.0, 125.0, 87.0, 57.0, 27.0, 16.0, 14.0, 8.0, 5.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13288013637065887, -0.12953658401966095, -0.12619301676750183, -0.12284945696592331, -0.11950589716434479, -0.11616234481334686, -0.11281877756118774, -0.10947522521018982, -0.1061316654086113, -0.10278810560703278, -0.09944454580545425, -0.09610098600387573, -0.09275742620229721, -0.08941386640071869, -0.08607031404972076, -0.08272675424814224, -0.07938319444656372, -0.0760396346449852, -0.07269607484340668, -0.06935251504182816, -0.06600895524024963, -0.06266540288925171, -0.05932183936238289, -0.055978283286094666, -0.05263471603393555, -0.049291156232357025, -0.0459475964307785, -0.04260403662919998, -0.03926048055291176, -0.03591692075133324, -0.032573360949754715, -0.029229803010821342, -0.02588624507188797, -0.022542685270309448, -0.019199127331376076, -0.015855567529797554, -0.012512008659541607, -0.00916844978928566, -0.005824889987707138, -0.0024813320487737656, 0.0008622277528047562, 0.004205786623060703, 0.007549345958977938, 0.010892905294895172, 0.01423646416515112, 0.017580023035407066, 0.020923582836985588, 0.02426714077591896, 0.027610700577497482, 0.030954260379076004, 0.034297820180654526, 0.03764137625694275, 0.04098493605852127, 0.04432849586009979, 0.047672055661678314, 0.051015615463256836, 0.05435917526483536, 0.05770273506641388, 0.0610462948679924, 0.06438985466957092, 0.06773341447114944, 0.07107697427272797, 0.07442052662372589, 0.07776408642530441, 0.08110764622688293]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 3.0, 10.0, 12.0, 17.0, 13.0, 16.0, 23.0, 17.0, 22.0, 21.0, 32.0, 38.0, 34.0, 32.0, 44.0, 41.0, 44.0, 58.0, 51.0, 50.0, 44.0, 36.0, 44.0, 38.0, 39.0, 27.0, 43.0, 26.0, 25.0, 17.0, 16.0, 15.0, 16.0, 13.0, 11.0, 4.0, 5.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.04555976390838623, -0.04382229223847389, -0.042084820568561554, -0.04034734517335892, -0.03860987350344658, -0.03687240183353424, -0.035134926438331604, -0.033397454768419266, -0.03165998309850693, -0.02992251142859459, -0.028185037896037102, -0.026447564363479614, -0.024710092693567276, -0.022972621023654938, -0.02123514749109745, -0.019497673958539963, -0.017760202288627625, -0.016022730618715286, -0.014285257086157799, -0.012547784484922886, -0.010810311883687973, -0.00907283928245306, -0.007335366681218147, -0.005597894079983234, -0.0038604214787483215, -0.0021229488775134087, -0.0003854762762784958, 0.001351996324956417, 0.00308946892619133, 0.004826941527426243, 0.006564414128661156, 0.008301886729896069, 0.010039359331130981, 0.011776831932365894, 0.013514304533600807, 0.01525177713483572, 0.016989249736070633, 0.01872672140598297, 0.02046419493854046, 0.022201668471097946, 0.023939140141010284, 0.025676611810922623, 0.02741408534348011, 0.029151558876037598, 0.030889030545949936, 0.032626502215862274, 0.03436397761106491, 0.03610144928097725, 0.03783892095088959, 0.039576392620801926, 0.041313864290714264, 0.0430513396859169, 0.04478881135582924, 0.04652628302574158, 0.048263758420944214, 0.05000123009085655, 0.05173870176076889, 0.05347617343068123, 0.05521364510059357, 0.056951120495796204, 0.05868859216570854, 0.06042606383562088, 0.06216353923082352, 0.06390100717544556, 0.0656384825706482]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 4.0, 14.0, 22.0, 32.0, 49.0, 81.0, 112.0, 152.0, 259.0, 422.0, 726.0, 1277.0, 2174.0, 4134.0, 8173.0, 16300.0, 33212.0, 71203.0, 149594.0, 256335.0, 245651.0, 134441.0, 63620.0, 29858.0, 14478.0, 7332.0, 3851.0, 2115.0, 1157.0, 688.0, 399.0, 239.0, 161.0, 93.0, 74.0, 35.0, 28.0, 16.0, 10.0, 10.0, 9.0, 5.0, 3.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.077880859375, -0.07558536529541016, -0.07328987121582031, -0.07099437713623047, -0.06869888305664062, -0.06640338897705078, -0.06410789489746094, -0.061812400817871094, -0.05951690673828125, -0.057221412658691406, -0.05492591857910156, -0.05263042449951172, -0.050334930419921875, -0.04803943634033203, -0.04574394226074219, -0.043448448181152344, -0.0411529541015625, -0.038857460021972656, -0.03656196594238281, -0.03426647186279297, -0.031970977783203125, -0.02967548370361328, -0.027379989624023438, -0.025084495544433594, -0.02278900146484375, -0.020493507385253906, -0.018198013305664062, -0.01590251922607422, -0.013607025146484375, -0.011311531066894531, -0.009016036987304688, -0.006720542907714844, -0.004425048828125, -0.0021295547485351562, 0.0001659393310546875, 0.0024614334106445312, 0.004756927490234375, 0.007052421569824219, 0.009347915649414062, 0.011643409729003906, 0.01393890380859375, 0.016234397888183594, 0.018529891967773438, 0.02082538604736328, 0.023120880126953125, 0.02541637420654297, 0.027711868286132812, 0.030007362365722656, 0.0323028564453125, 0.034598350524902344, 0.03689384460449219, 0.03918933868408203, 0.041484832763671875, 0.04378032684326172, 0.04607582092285156, 0.048371315002441406, 0.05066680908203125, 0.052962303161621094, 0.05525779724121094, 0.05755329132080078, 0.059848785400390625, 0.06214427947998047, 0.06443977355957031, 0.06673526763916016, 0.06903076171875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 0.0, 7.0, 5.0, 8.0, 6.0, 5.0, 12.0, 10.0, 17.0, 15.0, 20.0, 26.0, 30.0, 25.0, 24.0, 30.0, 32.0, 39.0, 51.0, 40.0, 42.0, 53.0, 55.0, 37.0, 34.0, 35.0, 42.0, 45.0, 48.0, 39.0, 26.0, 23.0, 19.0, 23.0, 14.0, 15.0, 12.0, 11.0, 9.0, 4.0, 5.0, 7.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.051361083984375, -0.049845218658447266, -0.04832935333251953, -0.0468134880065918, -0.04529762268066406, -0.04378175735473633, -0.042265892028808594, -0.04075002670288086, -0.039234161376953125, -0.03771829605102539, -0.036202430725097656, -0.03468656539916992, -0.03317070007324219, -0.03165483474731445, -0.03013896942138672, -0.028623104095458984, -0.02710723876953125, -0.025591373443603516, -0.02407550811767578, -0.022559642791748047, -0.021043777465820312, -0.019527912139892578, -0.018012046813964844, -0.01649618148803711, -0.014980316162109375, -0.01346445083618164, -0.011948585510253906, -0.010432720184326172, -0.008916854858398438, -0.007400989532470703, -0.005885124206542969, -0.004369258880615234, -0.0028533935546875, -0.0013375282287597656, 0.00017833709716796875, 0.0016942024230957031, 0.0032100677490234375, 0.004725933074951172, 0.006241798400878906, 0.007757663726806641, 0.009273529052734375, 0.01078939437866211, 0.012305259704589844, 0.013821125030517578, 0.015336990356445312, 0.016852855682373047, 0.01836872100830078, 0.019884586334228516, 0.02140045166015625, 0.022916316986083984, 0.02443218231201172, 0.025948047637939453, 0.027463912963867188, 0.028979778289794922, 0.030495643615722656, 0.03201150894165039, 0.033527374267578125, 0.03504323959350586, 0.036559104919433594, 0.03807497024536133, 0.03959083557128906, 0.0411067008972168, 0.04262256622314453, 0.044138431549072266, 0.045654296875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 3.0, 5.0, 3.0, 4.0, 10.0, 13.0, 6.0, 19.0, 27.0, 48.0, 51.0, 96.0, 113.0, 149.0, 265.0, 478.0, 984.0, 2365.0, 7683.0, 28370.0, 126854.0, 490600.0, 301116.0, 65721.0, 15669.0, 4614.0, 1607.0, 692.0, 359.0, 191.0, 111.0, 79.0, 66.0, 33.0, 33.0, 31.0, 24.0, 9.0, 23.0, 14.0, 4.0, 7.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.11572265625, -0.11183738708496094, -0.10795211791992188, -0.10406684875488281, -0.10018157958984375, -0.09629631042480469, -0.09241104125976562, -0.08852577209472656, -0.0846405029296875, -0.08075523376464844, -0.07686996459960938, -0.07298469543457031, -0.06909942626953125, -0.06521415710449219, -0.061328887939453125, -0.05744361877441406, -0.053558349609375, -0.04967308044433594, -0.045787811279296875, -0.04190254211425781, -0.03801727294921875, -0.03413200378417969, -0.030246734619140625, -0.026361465454101562, -0.0224761962890625, -0.018590927124023438, -0.014705657958984375, -0.010820388793945312, -0.00693511962890625, -0.0030498504638671875, 0.000835418701171875, 0.0047206878662109375, 0.00860595703125, 0.012491226196289062, 0.016376495361328125, 0.020261764526367188, 0.02414703369140625, 0.028032302856445312, 0.031917572021484375, 0.03580284118652344, 0.0396881103515625, 0.04357337951660156, 0.047458648681640625, 0.05134391784667969, 0.05522918701171875, 0.05911445617675781, 0.06299972534179688, 0.06688499450683594, 0.070770263671875, 0.07465553283691406, 0.07854080200195312, 0.08242607116699219, 0.08631134033203125, 0.09019660949707031, 0.09408187866210938, 0.09796714782714844, 0.1018524169921875, 0.10573768615722656, 0.10962295532226562, 0.11350822448730469, 0.11739349365234375, 0.12127876281738281, 0.12516403198242188, 0.12904930114746094, 0.1329345703125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 2.0, 7.0, 7.0, 9.0, 10.0, 6.0, 9.0, 17.0, 20.0, 32.0, 26.0, 37.0, 32.0, 31.0, 48.0, 37.0, 55.0, 51.0, 47.0, 61.0, 56.0, 41.0, 48.0, 45.0, 38.0, 43.0, 31.0, 28.0, 24.0, 19.0, 23.0, 13.0, 12.0, 12.0, 6.0, 7.0, 4.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2041015625, -0.1971263885498047, -0.19015121459960938, -0.18317604064941406, -0.17620086669921875, -0.16922569274902344, -0.16225051879882812, -0.1552753448486328, -0.1483001708984375, -0.1413249969482422, -0.13434982299804688, -0.12737464904785156, -0.12039947509765625, -0.11342430114746094, -0.10644912719726562, -0.09947395324707031, -0.092498779296875, -0.08552360534667969, -0.07854843139648438, -0.07157325744628906, -0.06459808349609375, -0.05762290954589844, -0.050647735595703125, -0.04367256164550781, -0.0366973876953125, -0.029722213745117188, -0.022747039794921875, -0.015771865844726562, -0.00879669189453125, -0.0018215179443359375, 0.005153656005859375, 0.012128829956054688, 0.01910400390625, 0.026079177856445312, 0.033054351806640625, 0.04002952575683594, 0.04700469970703125, 0.05397987365722656, 0.060955047607421875, 0.06793022155761719, 0.0749053955078125, 0.08188056945800781, 0.08885574340820312, 0.09583091735839844, 0.10280609130859375, 0.10978126525878906, 0.11675643920898438, 0.12373161315917969, 0.130706787109375, 0.1376819610595703, 0.14465713500976562, 0.15163230895996094, 0.15860748291015625, 0.16558265686035156, 0.17255783081054688, 0.1795330047607422, 0.1865081787109375, 0.1934833526611328, 0.20045852661132812, 0.20743370056152344, 0.21440887451171875, 0.22138404846191406, 0.22835922241210938, 0.2353343963623047, 0.2423095703125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 9.0, 14.0, 16.0, 30.0, 48.0, 90.0, 150.0, 266.0, 660.0, 1507.0, 4119.0, 16157.0, 120987.0, 704542.0, 171282.0, 20717.0, 4863.0, 1691.0, 683.0, 334.0, 160.0, 99.0, 50.0, 29.0, 16.0, 17.0, 9.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07122802734375, -0.06904125213623047, -0.06685447692871094, -0.0646677017211914, -0.062480926513671875, -0.060294151306152344, -0.05810737609863281, -0.05592060089111328, -0.05373382568359375, -0.05154705047607422, -0.04936027526855469, -0.047173500061035156, -0.044986724853515625, -0.042799949645996094, -0.04061317443847656, -0.03842639923095703, -0.0362396240234375, -0.03405284881591797, -0.03186607360839844, -0.029679298400878906, -0.027492523193359375, -0.025305747985839844, -0.023118972778320312, -0.02093219757080078, -0.01874542236328125, -0.01655864715576172, -0.014371871948242188, -0.012185096740722656, -0.009998321533203125, -0.007811546325683594, -0.0056247711181640625, -0.0034379959106445312, -0.001251220703125, 0.0009355545043945312, 0.0031223297119140625, 0.005309104919433594, 0.007495880126953125, 0.009682655334472656, 0.011869430541992188, 0.014056205749511719, 0.01624298095703125, 0.01842975616455078, 0.020616531372070312, 0.022803306579589844, 0.024990081787109375, 0.027176856994628906, 0.029363632202148438, 0.03155040740966797, 0.0337371826171875, 0.03592395782470703, 0.03811073303222656, 0.040297508239746094, 0.042484283447265625, 0.044671058654785156, 0.04685783386230469, 0.04904460906982422, 0.05123138427734375, 0.05341815948486328, 0.05560493469238281, 0.057791709899902344, 0.059978485107421875, 0.062165260314941406, 0.06435203552246094, 0.06653881072998047, 0.0687255859375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 5.0, 5.0, 16.0, 12.0, 17.0, 20.0, 30.0, 52.0, 62.0, 84.0, 85.0, 74.0, 109.0, 72.0, 77.0, 66.0, 53.0, 45.0, 25.0, 29.0, 19.0, 12.0, 10.0, 9.0, 5.0, 5.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2516975402832031e-05, -1.2150034308433533e-05, -1.1783093214035034e-05, -1.1416152119636536e-05, -1.1049211025238037e-05, -1.0682269930839539e-05, -1.031532883644104e-05, -9.948387742042542e-06, -9.581446647644043e-06, -9.214505553245544e-06, -8.847564458847046e-06, -8.480623364448547e-06, -8.113682270050049e-06, -7.74674117565155e-06, -7.379800081253052e-06, -7.012858986854553e-06, -6.645917892456055e-06, -6.278976798057556e-06, -5.912035703659058e-06, -5.545094609260559e-06, -5.1781535148620605e-06, -4.811212420463562e-06, -4.4442713260650635e-06, -4.077330231666565e-06, -3.7103891372680664e-06, -3.343448042869568e-06, -2.9765069484710693e-06, -2.609565854072571e-06, -2.2426247596740723e-06, -1.8756836652755737e-06, -1.5087425708770752e-06, -1.1418014764785767e-06, -7.748603820800781e-07, -4.079192876815796e-07, -4.0978193283081055e-08, 3.259629011154175e-07, 6.92903995513916e-07, 1.0598450899124146e-06, 1.426786184310913e-06, 1.7937272787094116e-06, 2.16066837310791e-06, 2.5276094675064087e-06, 2.8945505619049072e-06, 3.2614916563034058e-06, 3.6284327507019043e-06, 3.995373845100403e-06, 4.362314939498901e-06, 4.7292560338974e-06, 5.0961971282958984e-06, 5.463138222694397e-06, 5.8300793170928955e-06, 6.197020411491394e-06, 6.563961505889893e-06, 6.930902600288391e-06, 7.29784369468689e-06, 7.664784789085388e-06, 8.031725883483887e-06, 8.398666977882385e-06, 8.765608072280884e-06, 9.132549166679382e-06, 9.499490261077881e-06, 9.86643135547638e-06, 1.0233372449874878e-05, 1.0600313544273376e-05, 1.0967254638671875e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 7.0, 16.0, 19.0, 35.0, 44.0, 82.0, 132.0, 264.0, 517.0, 1054.0, 2483.0, 7831.0, 33995.0, 230939.0, 610285.0, 130013.0, 21461.0, 5484.0, 2101.0, 866.0, 429.0, 194.0, 104.0, 71.0, 44.0, 29.0, 18.0, 9.0, 8.0, 8.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.058074951171875, -0.05622291564941406, -0.054370880126953125, -0.05251884460449219, -0.05066680908203125, -0.04881477355957031, -0.046962738037109375, -0.04511070251464844, -0.0432586669921875, -0.04140663146972656, -0.039554595947265625, -0.03770256042480469, -0.03585052490234375, -0.03399848937988281, -0.032146453857421875, -0.030294418334960938, -0.0284423828125, -0.026590347290039062, -0.024738311767578125, -0.022886276245117188, -0.02103424072265625, -0.019182205200195312, -0.017330169677734375, -0.015478134155273438, -0.0136260986328125, -0.011774063110351562, -0.009922027587890625, -0.008069992065429688, -0.00621795654296875, -0.0043659210205078125, -0.002513885498046875, -0.0006618499755859375, 0.001190185546875, 0.0030422210693359375, 0.004894256591796875, 0.0067462921142578125, 0.00859832763671875, 0.010450363159179688, 0.012302398681640625, 0.014154434204101562, 0.0160064697265625, 0.017858505249023438, 0.019710540771484375, 0.021562576293945312, 0.02341461181640625, 0.025266647338867188, 0.027118682861328125, 0.028970718383789062, 0.03082275390625, 0.03267478942871094, 0.034526824951171875, 0.03637886047363281, 0.03823089599609375, 0.04008293151855469, 0.041934967041015625, 0.04378700256347656, 0.0456390380859375, 0.04749107360839844, 0.049343109130859375, 0.05119514465332031, 0.05304718017578125, 0.05489921569824219, 0.056751251220703125, 0.05860328674316406, 0.060455322265625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 9.0, 7.0, 6.0, 4.0, 8.0, 10.0, 17.0, 21.0, 22.0, 31.0, 53.0, 63.0, 68.0, 80.0, 104.0, 94.0, 97.0, 62.0, 70.0, 47.0, 30.0, 20.0, 25.0, 12.0, 7.0, 10.0, 6.0, 7.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06500244140625, -0.06274795532226562, -0.06049346923828125, -0.058238983154296875, -0.0559844970703125, -0.053730010986328125, -0.05147552490234375, -0.049221038818359375, -0.046966552734375, -0.044712066650390625, -0.04245758056640625, -0.040203094482421875, -0.0379486083984375, -0.035694122314453125, -0.03343963623046875, -0.031185150146484375, -0.0289306640625, -0.026676177978515625, -0.02442169189453125, -0.022167205810546875, -0.0199127197265625, -0.017658233642578125, -0.01540374755859375, -0.013149261474609375, -0.010894775390625, -0.008640289306640625, -0.00638580322265625, -0.004131317138671875, -0.0018768310546875, 0.000377655029296875, 0.00263214111328125, 0.004886627197265625, 0.00714111328125, 0.009395599365234375, 0.01165008544921875, 0.013904571533203125, 0.0161590576171875, 0.018413543701171875, 0.02066802978515625, 0.022922515869140625, 0.025177001953125, 0.027431488037109375, 0.02968597412109375, 0.031940460205078125, 0.0341949462890625, 0.036449432373046875, 0.03870391845703125, 0.040958404541015625, 0.043212890625, 0.045467376708984375, 0.04772186279296875, 0.049976348876953125, 0.0522308349609375, 0.054485321044921875, 0.05673980712890625, 0.058994293212890625, 0.061248779296875, 0.06350326538085938, 0.06575775146484375, 0.06801223754882812, 0.0702667236328125, 0.07252120971679688, 0.07477569580078125, 0.07703018188476562, 0.07928466796875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 8.0, 10.0, 16.0, 23.0, 32.0, 44.0, 66.0, 86.0, 117.0, 118.0, 113.0, 111.0, 86.0, 57.0, 37.0, 33.0, 8.0, 14.0, 11.0, 6.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5869490504264832, -0.5587567090988159, -0.5305643081665039, -0.5023719668388367, -0.47417962551116943, -0.4459872841835022, -0.4177949130535126, -0.38960254192352295, -0.3614102005958557, -0.3332178592681885, -0.30502548813819885, -0.27683311700820923, -0.248640775680542, -0.22044841945171356, -0.19225606322288513, -0.1640637069940567, -0.13587135076522827, -0.10767899453639984, -0.07948663830757141, -0.05129428207874298, -0.02310192584991455, 0.005090430378913879, 0.03328278660774231, 0.06147514283657074, 0.08966749906539917, 0.1178598552942276, 0.14605221152305603, 0.17424456775188446, 0.2024369239807129, 0.23062928020954132, 0.25882163643836975, 0.2870140075683594, 0.31520628929138184, 0.3433986306190491, 0.3715910017490387, 0.3997833728790283, 0.42797571420669556, 0.4561680555343628, 0.4843604266643524, 0.512552797794342, 0.5407451391220093, 0.5689374804496765, 0.5971298217773438, 0.6253222227096558, 0.653514564037323, 0.6817069053649902, 0.7098993062973022, 0.7380916476249695, 0.7662839889526367, 0.794476330280304, 0.8226686716079712, 0.8508610725402832, 0.8790534138679504, 0.9072457551956177, 0.9354381561279297, 0.9636304974555969, 0.9918228387832642, 1.0200152397155762, 1.0482075214385986, 1.0763999223709106, 1.1045923233032227, 1.1327846050262451, 1.1609770059585571, 1.1891692876815796, 1.2173616886138916]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 6.0, 3.0, 7.0, 7.0, 5.0, 6.0, 13.0, 8.0, 19.0, 15.0, 19.0, 29.0, 32.0, 19.0, 18.0, 35.0, 34.0, 37.0, 42.0, 33.0, 47.0, 59.0, 47.0, 42.0, 42.0, 42.0, 33.0, 31.0, 34.0, 29.0, 30.0, 23.0, 24.0, 22.0, 22.0, 11.0, 17.0, 11.0, 12.0, 6.0, 11.0, 4.0, 6.0, 4.0, 1.0, 4.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9338024854660034, -0.9048005938529968, -0.8757987022399902, -0.8467968106269836, -0.817794919013977, -0.7887930870056152, -0.7597911953926086, -0.730789303779602, -0.7017874121665955, -0.6727855205535889, -0.6437836289405823, -0.6147817373275757, -0.5857799053192139, -0.5567779541015625, -0.5277761220932007, -0.4987742304801941, -0.4697723388671875, -0.4407704472541809, -0.4117685556411743, -0.3827666938304901, -0.3537648022174835, -0.32476291060447693, -0.2957610487937927, -0.26675915718078613, -0.23775726556777954, -0.20875537395477295, -0.17975349724292755, -0.15075162053108215, -0.12174972891807556, -0.09274783730506897, -0.06374596059322357, -0.034744083881378174, -0.005742251873016357, 0.023259632289409637, 0.05226151645183563, 0.08126340061426163, 0.11026528477668762, 0.1392671763896942, 0.1682690531015396, 0.197270929813385, 0.2262728214263916, 0.2552747130393982, 0.2842766046524048, 0.313278466463089, 0.3422803580760956, 0.3712822496891022, 0.4002841114997864, 0.42928600311279297, 0.45828789472579956, 0.48728978633880615, 0.5162916779518127, 0.5452935695648193, 0.5742954015731812, 0.6032973527908325, 0.6322991847991943, 0.6613010764122009, 0.6903029680252075, 0.7193048596382141, 0.7483067512512207, 0.7773086428642273, 0.8063105344772339, 0.8353123664855957, 0.8643142580986023, 0.8933161497116089, 0.9223180413246155]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 4.0, 3.0, 3.0, 12.0, 21.0, 31.0, 23.0, 37.0, 45.0, 77.0, 102.0, 147.0, 251.0, 333.0, 524.0, 793.0, 1390.0, 2429.0, 4673.0, 12027.0, 47806.0, 4007217.0, 86549.0, 16520.0, 6144.0, 2868.0, 1609.0, 938.0, 590.0, 370.0, 231.0, 153.0, 129.0, 68.0, 48.0, 28.0, 27.0, 23.0, 18.0, 16.0, 4.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.1044921875, -0.1017160415649414, -0.09893989562988281, -0.09616374969482422, -0.09338760375976562, -0.09061145782470703, -0.08783531188964844, -0.08505916595458984, -0.08228302001953125, -0.07950687408447266, -0.07673072814941406, -0.07395458221435547, -0.07117843627929688, -0.06840229034423828, -0.06562614440917969, -0.0628499984741211, -0.0600738525390625, -0.057297706604003906, -0.05452156066894531, -0.05174541473388672, -0.048969268798828125, -0.04619312286376953, -0.04341697692871094, -0.040640830993652344, -0.03786468505859375, -0.035088539123535156, -0.03231239318847656, -0.02953624725341797, -0.026760101318359375, -0.02398395538330078, -0.021207809448242188, -0.018431663513183594, -0.015655517578125, -0.012879371643066406, -0.010103225708007812, -0.007327079772949219, -0.004550933837890625, -0.0017747879028320312, 0.0010013580322265625, 0.0037775039672851562, 0.00655364990234375, 0.009329795837402344, 0.012105941772460938, 0.014882087707519531, 0.017658233642578125, 0.02043437957763672, 0.023210525512695312, 0.025986671447753906, 0.0287628173828125, 0.031538963317871094, 0.03431510925292969, 0.03709125518798828, 0.039867401123046875, 0.04264354705810547, 0.04541969299316406, 0.048195838928222656, 0.05097198486328125, 0.053748130798339844, 0.05652427673339844, 0.05930042266845703, 0.062076568603515625, 0.06485271453857422, 0.06762886047363281, 0.0704050064086914, 0.07318115234375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 6.0, 2.0, 1.0, 3.0, 5.0, 15.0, 10.0, 10.0, 7.0, 7.0, 17.0, 20.0, 24.0, 28.0, 25.0, 29.0, 31.0, 26.0, 34.0, 41.0, 36.0, 42.0, 46.0, 44.0, 47.0, 47.0, 34.0, 39.0, 46.0, 32.0, 28.0, 27.0, 27.0, 39.0, 20.0, 30.0, 24.0, 6.0, 13.0, 9.0, 10.0, 6.0, 8.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0504150390625, -0.04886913299560547, -0.04732322692871094, -0.045777320861816406, -0.044231414794921875, -0.042685508728027344, -0.04113960266113281, -0.03959369659423828, -0.03804779052734375, -0.03650188446044922, -0.03495597839355469, -0.033410072326660156, -0.031864166259765625, -0.030318260192871094, -0.028772354125976562, -0.02722644805908203, -0.0256805419921875, -0.02413463592529297, -0.022588729858398438, -0.021042823791503906, -0.019496917724609375, -0.017951011657714844, -0.016405105590820312, -0.014859199523925781, -0.01331329345703125, -0.011767387390136719, -0.010221481323242188, -0.008675575256347656, -0.007129669189453125, -0.005583763122558594, -0.0040378570556640625, -0.0024919509887695312, -0.000946044921875, 0.0005998611450195312, 0.0021457672119140625, 0.0036916732788085938, 0.005237579345703125, 0.006783485412597656, 0.008329391479492188, 0.009875297546386719, 0.01142120361328125, 0.012967109680175781, 0.014513015747070312, 0.016058921813964844, 0.017604827880859375, 0.019150733947753906, 0.020696640014648438, 0.02224254608154297, 0.0237884521484375, 0.02533435821533203, 0.026880264282226562, 0.028426170349121094, 0.029972076416015625, 0.031517982482910156, 0.03306388854980469, 0.03460979461669922, 0.03615570068359375, 0.03770160675048828, 0.03924751281738281, 0.040793418884277344, 0.042339324951171875, 0.043885231018066406, 0.04543113708496094, 0.04697704315185547, 0.04852294921875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 3.0, 3.0, 7.0, 4.0, 13.0, 18.0, 16.0, 17.0, 31.0, 54.0, 76.0, 106.0, 170.0, 313.0, 479.0, 792.0, 1383.0, 2361.0, 4668.0, 11045.0, 38619.0, 3894918.0, 198173.0, 24065.0, 8172.0, 3829.0, 1933.0, 1159.0, 680.0, 409.0, 250.0, 169.0, 130.0, 69.0, 46.0, 28.0, 20.0, 17.0, 12.0, 12.0, 7.0, 4.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1097412109375, -0.1063995361328125, -0.103057861328125, -0.0997161865234375, -0.09637451171875, -0.0930328369140625, -0.089691162109375, -0.0863494873046875, -0.0830078125, -0.0796661376953125, -0.076324462890625, -0.0729827880859375, -0.06964111328125, -0.0662994384765625, -0.062957763671875, -0.0596160888671875, -0.0562744140625, -0.0529327392578125, -0.049591064453125, -0.0462493896484375, -0.04290771484375, -0.0395660400390625, -0.036224365234375, -0.0328826904296875, -0.029541015625, -0.0261993408203125, -0.022857666015625, -0.0195159912109375, -0.01617431640625, -0.0128326416015625, -0.009490966796875, -0.0061492919921875, -0.0028076171875, 0.0005340576171875, 0.003875732421875, 0.0072174072265625, 0.01055908203125, 0.0139007568359375, 0.017242431640625, 0.0205841064453125, 0.02392578125, 0.0272674560546875, 0.030609130859375, 0.0339508056640625, 0.03729248046875, 0.0406341552734375, 0.043975830078125, 0.0473175048828125, 0.0506591796875, 0.0540008544921875, 0.057342529296875, 0.0606842041015625, 0.06402587890625, 0.0673675537109375, 0.070709228515625, 0.0740509033203125, 0.077392578125, 0.0807342529296875, 0.084075927734375, 0.0874176025390625, 0.09075927734375, 0.0941009521484375, 0.097442626953125, 0.1007843017578125, 0.1041259765625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 4.0, 3.0, 7.0, 2.0, 5.0, 10.0, 4.0, 8.0, 26.0, 23.0, 48.0, 98.0, 3317.0, 316.0, 97.0, 30.0, 23.0, 11.0, 10.0, 4.0, 8.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.031280517578125, -0.030431509017944336, -0.029582500457763672, -0.028733491897583008, -0.027884483337402344, -0.02703547477722168, -0.026186466217041016, -0.02533745765686035, -0.024488449096679688, -0.023639440536499023, -0.02279043197631836, -0.021941423416137695, -0.02109241485595703, -0.020243406295776367, -0.019394397735595703, -0.01854538917541504, -0.017696380615234375, -0.01684737205505371, -0.015998363494873047, -0.015149354934692383, -0.014300346374511719, -0.013451337814331055, -0.01260232925415039, -0.011753320693969727, -0.010904312133789062, -0.010055303573608398, -0.009206295013427734, -0.00835728645324707, -0.007508277893066406, -0.006659269332885742, -0.005810260772705078, -0.004961252212524414, -0.00411224365234375, -0.003263235092163086, -0.002414226531982422, -0.0015652179718017578, -0.0007162094116210938, 0.0001327991485595703, 0.0009818077087402344, 0.0018308162689208984, 0.0026798248291015625, 0.0035288333892822266, 0.004377841949462891, 0.005226850509643555, 0.006075859069824219, 0.006924867630004883, 0.007773876190185547, 0.008622884750366211, 0.009471893310546875, 0.010320901870727539, 0.011169910430908203, 0.012018918991088867, 0.012867927551269531, 0.013716936111450195, 0.01456594467163086, 0.015414953231811523, 0.016263961791992188, 0.01711297035217285, 0.017961978912353516, 0.01881098747253418, 0.019659996032714844, 0.020509004592895508, 0.021358013153076172, 0.022207021713256836, 0.0230560302734375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 10.0, 16.0, 59.0, 148.0, 281.0, 263.0, 157.0, 53.0, 17.0, 4.0, 2.0, 0.0, 2.0], "bins": [-0.5066134929656982, -0.4976367950439453, -0.4886600971221924, -0.47968342900276184, -0.4707067310810089, -0.461730033159256, -0.45275333523750305, -0.4437766671180725, -0.4347999691963196, -0.42582327127456665, -0.4168465733528137, -0.4078699052333832, -0.39889320731163025, -0.3899165093898773, -0.3809398114681244, -0.37196314334869385, -0.3629864454269409, -0.354009747505188, -0.34503304958343506, -0.3360563814640045, -0.3270796835422516, -0.31810298562049866, -0.3091262876987457, -0.3001496195793152, -0.29117289185523987, -0.28219619393348694, -0.273219496011734, -0.26424282789230347, -0.25526612997055054, -0.2462894320487976, -0.23731273412704468, -0.22833605110645294, -0.2193593531847, -0.21038265526294708, -0.20140597224235535, -0.19242927432060242, -0.18345259130001068, -0.17447589337825775, -0.16549921035766602, -0.15652251243591309, -0.14754581451416016, -0.13856911659240723, -0.1295924335718155, -0.12061573565006256, -0.11163905262947083, -0.1026623547077179, -0.09368566423654556, -0.08470897376537323, -0.0757322907447815, -0.06675560027360916, -0.05777890980243683, -0.0488022156059742, -0.039825525134801865, -0.030848834663629532, -0.0218721404671669, -0.012895449995994568, -0.003918759524822235, 0.005057931877672672, 0.01403462328016758, 0.02301131561398506, 0.031988006085157394, 0.04096469655632973, 0.04994139075279236, 0.05891808122396469, 0.06789477169513702]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 2.0, 5.0, 15.0, 18.0, 19.0, 27.0, 22.0, 36.0, 42.0, 47.0, 49.0, 51.0, 57.0, 57.0, 59.0, 44.0, 46.0, 52.0, 52.0, 44.0, 47.0, 48.0, 41.0, 23.0, 19.0, 20.0, 13.0, 11.0, 14.0, 5.0, 4.0, 6.0, 7.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09989792108535767, -0.09703506529331207, -0.09417221695184708, -0.09130936861038208, -0.08844651281833649, -0.0855836570262909, -0.0827208086848259, -0.0798579603433609, -0.07699510455131531, -0.07413224875926971, -0.07126940041780472, -0.06840655207633972, -0.06554369628429413, -0.06268084049224854, -0.05981799215078354, -0.056955140084028244, -0.05409228801727295, -0.051229435950517654, -0.04836658388376236, -0.045503731817007065, -0.04264087975025177, -0.039778027683496475, -0.03691517561674118, -0.034052323549985886, -0.03118947148323059, -0.028326619416475296, -0.02546376734972, -0.022600915282964706, -0.01973806321620941, -0.016875211149454117, -0.014012359082698822, -0.011149507015943527, -0.008286654949188232, -0.005423802882432938, -0.002560950815677643, 0.000301901251077652, 0.0031647533178329468, 0.006027605384588242, 0.008890457451343536, 0.011753309518098831, 0.014616161584854126, 0.01747901365160942, 0.020341865718364716, 0.02320471778512001, 0.026067569851875305, 0.0289304219186306, 0.031793273985385895, 0.03465612605214119, 0.037518978118896484, 0.04038183018565178, 0.043244682252407074, 0.04610753431916237, 0.048970386385917664, 0.05183323845267296, 0.05469609051942825, 0.05755894258618355, 0.06042179465293884, 0.06328465044498444, 0.06614749878644943, 0.06901034712791443, 0.07187320291996002, 0.07473605871200562, 0.07759890705347061, 0.08046175539493561, 0.0833246111869812]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 5.0, 13.0, 10.0, 11.0, 32.0, 41.0, 59.0, 96.0, 125.0, 246.0, 379.0, 695.0, 1310.0, 2486.0, 5118.0, 10642.0, 24136.0, 54715.0, 128414.0, 270097.0, 289580.0, 146615.0, 62616.0, 27206.0, 12091.0, 5675.0, 2691.0, 1465.0, 775.0, 469.0, 265.0, 169.0, 93.0, 66.0, 54.0, 31.0, 27.0, 12.0, 9.0, 6.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.09234619140625, -0.08978652954101562, -0.08722686767578125, -0.08466720581054688, -0.0821075439453125, -0.07954788208007812, -0.07698822021484375, -0.07442855834960938, -0.071868896484375, -0.06930923461914062, -0.06674957275390625, -0.06418991088867188, -0.0616302490234375, -0.059070587158203125, -0.05651092529296875, -0.053951263427734375, -0.0513916015625, -0.048831939697265625, -0.04627227783203125, -0.043712615966796875, -0.0411529541015625, -0.038593292236328125, -0.03603363037109375, -0.033473968505859375, -0.030914306640625, -0.028354644775390625, -0.02579498291015625, -0.023235321044921875, -0.0206756591796875, -0.018115997314453125, -0.01555633544921875, -0.012996673583984375, -0.01043701171875, -0.007877349853515625, -0.00531768798828125, -0.002758026123046875, -0.0001983642578125, 0.002361297607421875, 0.00492095947265625, 0.007480621337890625, 0.010040283203125, 0.012599945068359375, 0.01515960693359375, 0.017719268798828125, 0.0202789306640625, 0.022838592529296875, 0.02539825439453125, 0.027957916259765625, 0.030517578125, 0.033077239990234375, 0.03563690185546875, 0.038196563720703125, 0.0407562255859375, 0.043315887451171875, 0.04587554931640625, 0.048435211181640625, 0.050994873046875, 0.053554534912109375, 0.05611419677734375, 0.058673858642578125, 0.0612335205078125, 0.06379318237304688, 0.06635284423828125, 0.06891250610351562, 0.07147216796875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 2.0, 6.0, 5.0, 9.0, 9.0, 4.0, 11.0, 15.0, 19.0, 14.0, 32.0, 19.0, 21.0, 24.0, 39.0, 26.0, 31.0, 46.0, 45.0, 37.0, 51.0, 36.0, 42.0, 36.0, 38.0, 29.0, 37.0, 36.0, 41.0, 28.0, 36.0, 21.0, 24.0, 25.0, 20.0, 15.0, 17.0, 12.0, 13.0, 9.0, 1.0, 4.0, 2.0, 3.0, 6.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.050933837890625, -0.049424171447753906, -0.04791450500488281, -0.04640483856201172, -0.044895172119140625, -0.04338550567626953, -0.04187583923339844, -0.040366172790527344, -0.03885650634765625, -0.037346839904785156, -0.03583717346191406, -0.03432750701904297, -0.032817840576171875, -0.03130817413330078, -0.029798507690429688, -0.028288841247558594, -0.0267791748046875, -0.025269508361816406, -0.023759841918945312, -0.02225017547607422, -0.020740509033203125, -0.01923084259033203, -0.017721176147460938, -0.016211509704589844, -0.01470184326171875, -0.013192176818847656, -0.011682510375976562, -0.010172843933105469, -0.008663177490234375, -0.007153511047363281, -0.0056438446044921875, -0.004134178161621094, -0.00262451171875, -0.0011148452758789062, 0.0003948211669921875, 0.0019044876098632812, 0.003414154052734375, 0.004923820495605469, 0.0064334869384765625, 0.007943153381347656, 0.00945281982421875, 0.010962486267089844, 0.012472152709960938, 0.013981819152832031, 0.015491485595703125, 0.01700115203857422, 0.018510818481445312, 0.020020484924316406, 0.0215301513671875, 0.023039817810058594, 0.024549484252929688, 0.02605915069580078, 0.027568817138671875, 0.02907848358154297, 0.030588150024414062, 0.032097816467285156, 0.03360748291015625, 0.035117149353027344, 0.03662681579589844, 0.03813648223876953, 0.039646148681640625, 0.04115581512451172, 0.04266548156738281, 0.044175148010253906, 0.045684814453125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 3.0, 4.0, 8.0, 8.0, 13.0, 13.0, 27.0, 38.0, 46.0, 76.0, 113.0, 208.0, 404.0, 817.0, 2236.0, 7938.0, 42373.0, 374366.0, 541662.0, 62705.0, 10723.0, 2694.0, 984.0, 417.0, 262.0, 145.0, 81.0, 56.0, 36.0, 36.0, 15.0, 17.0, 8.0, 8.0, 4.0, 1.0, 4.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1932373046875, -0.18757057189941406, -0.18190383911132812, -0.1762371063232422, -0.17057037353515625, -0.1649036407470703, -0.15923690795898438, -0.15357017517089844, -0.1479034423828125, -0.14223670959472656, -0.13656997680664062, -0.1309032440185547, -0.12523651123046875, -0.11956977844238281, -0.11390304565429688, -0.10823631286621094, -0.102569580078125, -0.09690284729003906, -0.09123611450195312, -0.08556938171386719, -0.07990264892578125, -0.07423591613769531, -0.06856918334960938, -0.06290245056152344, -0.0572357177734375, -0.05156898498535156, -0.045902252197265625, -0.04023551940917969, -0.03456878662109375, -0.028902053833007812, -0.023235321044921875, -0.017568588256835938, -0.01190185546875, -0.0062351226806640625, -0.000568389892578125, 0.0050983428955078125, 0.01076507568359375, 0.016431808471679688, 0.022098541259765625, 0.027765274047851562, 0.0334320068359375, 0.03909873962402344, 0.044765472412109375, 0.05043220520019531, 0.05609893798828125, 0.06176567077636719, 0.06743240356445312, 0.07309913635253906, 0.078765869140625, 0.08443260192871094, 0.09009933471679688, 0.09576606750488281, 0.10143280029296875, 0.10709953308105469, 0.11276626586914062, 0.11843299865722656, 0.1240997314453125, 0.12976646423339844, 0.13543319702148438, 0.1410999298095703, 0.14676666259765625, 0.1524333953857422, 0.15810012817382812, 0.16376686096191406, 0.16943359375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 2.0, 2.0, 5.0, 3.0, 18.0, 12.0, 12.0, 33.0, 30.0, 32.0, 40.0, 54.0, 61.0, 64.0, 59.0, 68.0, 63.0, 71.0, 58.0, 59.0, 39.0, 52.0, 33.0, 30.0, 27.0, 25.0, 14.0, 10.0, 9.0, 3.0, 4.0, 8.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.365478515625, -0.3557853698730469, -0.34609222412109375, -0.3363990783691406, -0.3267059326171875, -0.3170127868652344, -0.30731964111328125, -0.2976264953613281, -0.287933349609375, -0.2782402038574219, -0.26854705810546875, -0.2588539123535156, -0.2491607666015625, -0.23946762084960938, -0.22977447509765625, -0.22008132934570312, -0.21038818359375, -0.20069503784179688, -0.19100189208984375, -0.18130874633789062, -0.1716156005859375, -0.16192245483398438, -0.15222930908203125, -0.14253616333007812, -0.132843017578125, -0.12314987182617188, -0.11345672607421875, -0.10376358032226562, -0.0940704345703125, -0.08437728881835938, -0.07468414306640625, -0.06499099731445312, -0.0552978515625, -0.045604705810546875, -0.03591156005859375, -0.026218414306640625, -0.0165252685546875, -0.006832122802734375, 0.00286102294921875, 0.012554168701171875, 0.022247314453125, 0.031940460205078125, 0.04163360595703125, 0.051326751708984375, 0.0610198974609375, 0.07071304321289062, 0.08040618896484375, 0.09009933471679688, 0.09979248046875, 0.10948562622070312, 0.11917877197265625, 0.12887191772460938, 0.1385650634765625, 0.14825820922851562, 0.15795135498046875, 0.16764450073242188, 0.177337646484375, 0.18703079223632812, 0.19672393798828125, 0.20641708374023438, 0.2161102294921875, 0.22580337524414062, 0.23549652099609375, 0.24518966674804688, 0.2548828125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 4.0, 3.0, 4.0, 4.0, 8.0, 8.0, 15.0, 31.0, 35.0, 48.0, 105.0, 187.0, 397.0, 883.0, 2310.0, 7586.0, 84167.0, 910974.0, 33131.0, 5534.0, 1761.0, 725.0, 309.0, 136.0, 77.0, 46.0, 30.0, 4.0, 13.0, 8.0, 5.0, 2.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.156982421875, -0.15299510955810547, -0.14900779724121094, -0.1450204849243164, -0.14103317260742188, -0.13704586029052734, -0.1330585479736328, -0.12907123565673828, -0.12508392333984375, -0.12109661102294922, -0.11710929870605469, -0.11312198638916016, -0.10913467407226562, -0.1051473617553711, -0.10116004943847656, -0.09717273712158203, -0.0931854248046875, -0.08919811248779297, -0.08521080017089844, -0.0812234878540039, -0.07723617553710938, -0.07324886322021484, -0.06926155090332031, -0.06527423858642578, -0.06128692626953125, -0.05729961395263672, -0.05331230163574219, -0.049324989318847656, -0.045337677001953125, -0.041350364685058594, -0.03736305236816406, -0.03337574005126953, -0.029388427734375, -0.02540111541748047, -0.021413803100585938, -0.017426490783691406, -0.013439178466796875, -0.009451866149902344, -0.0054645538330078125, -0.0014772415161132812, 0.00251007080078125, 0.006497383117675781, 0.010484695434570312, 0.014472007751464844, 0.018459320068359375, 0.022446632385253906, 0.026433944702148438, 0.03042125701904297, 0.0344085693359375, 0.03839588165283203, 0.04238319396972656, 0.046370506286621094, 0.050357818603515625, 0.054345130920410156, 0.05833244323730469, 0.06231975555419922, 0.06630706787109375, 0.07029438018798828, 0.07428169250488281, 0.07826900482177734, 0.08225631713867188, 0.0862436294555664, 0.09023094177246094, 0.09421825408935547, 0.09820556640625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 4.0, 6.0, 8.0, 16.0, 16.0, 26.0, 43.0, 67.0, 66.0, 98.0, 111.0, 134.0, 103.0, 92.0, 59.0, 45.0, 30.0, 17.0, 8.0, 3.0, 8.0, 6.0, 7.0, 5.0, 6.0, 3.0, 1.0, 1.0, 2.0, 4.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5079975128173828e-05, -1.4633871614933014e-05, -1.41877681016922e-05, -1.3741664588451385e-05, -1.3295561075210571e-05, -1.2849457561969757e-05, -1.2403354048728943e-05, -1.1957250535488129e-05, -1.1511147022247314e-05, -1.10650435090065e-05, -1.0618939995765686e-05, -1.0172836482524872e-05, -9.726732969284058e-06, -9.280629456043243e-06, -8.83452594280243e-06, -8.388422429561615e-06, -7.9423189163208e-06, -7.4962154030799866e-06, -7.050111889839172e-06, -6.604008376598358e-06, -6.157904863357544e-06, -5.71180135011673e-06, -5.2656978368759155e-06, -4.819594323635101e-06, -4.373490810394287e-06, -3.927387297153473e-06, -3.4812837839126587e-06, -3.0351802706718445e-06, -2.5890767574310303e-06, -2.142973244190216e-06, -1.6968697309494019e-06, -1.2507662177085876e-06, -8.046627044677734e-07, -3.5855919122695923e-07, 8.754432201385498e-08, 5.336478352546692e-07, 9.797513484954834e-07, 1.4258548617362976e-06, 1.8719583749771118e-06, 2.318061888217926e-06, 2.7641654014587402e-06, 3.2102689146995544e-06, 3.6563724279403687e-06, 4.102475941181183e-06, 4.548579454421997e-06, 4.994682967662811e-06, 5.4407864809036255e-06, 5.88688999414444e-06, 6.332993507385254e-06, 6.779097020626068e-06, 7.225200533866882e-06, 7.671304047107697e-06, 8.11740756034851e-06, 8.563511073589325e-06, 9.00961458683014e-06, 9.455718100070953e-06, 9.901821613311768e-06, 1.0347925126552582e-05, 1.0794028639793396e-05, 1.124013215303421e-05, 1.1686235666275024e-05, 1.2132339179515839e-05, 1.2578442692756653e-05, 1.3024546205997467e-05, 1.3470649719238281e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 5.0, 7.0, 7.0, 8.0, 4.0, 20.0, 19.0, 26.0, 40.0, 37.0, 69.0, 115.0, 183.0, 270.0, 576.0, 1229.0, 2870.0, 8194.0, 53320.0, 797905.0, 162672.0, 13535.0, 4110.0, 1641.0, 737.0, 375.0, 191.0, 138.0, 79.0, 41.0, 37.0, 20.0, 24.0, 14.0, 9.0, 20.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06805419921875, -0.06517982482910156, -0.062305450439453125, -0.05943107604980469, -0.05655670166015625, -0.05368232727050781, -0.050807952880859375, -0.04793357849121094, -0.0450592041015625, -0.04218482971191406, -0.039310455322265625, -0.03643608093261719, -0.03356170654296875, -0.030687332153320312, -0.027812957763671875, -0.024938583374023438, -0.022064208984375, -0.019189834594726562, -0.016315460205078125, -0.013441085815429688, -0.01056671142578125, -0.0076923370361328125, -0.004817962646484375, -0.0019435882568359375, 0.0009307861328125, 0.0038051605224609375, 0.006679534912109375, 0.009553909301757812, 0.01242828369140625, 0.015302658081054688, 0.018177032470703125, 0.021051406860351562, 0.02392578125, 0.026800155639648438, 0.029674530029296875, 0.03254890441894531, 0.03542327880859375, 0.03829765319824219, 0.041172027587890625, 0.04404640197753906, 0.0469207763671875, 0.04979515075683594, 0.052669525146484375, 0.05554389953613281, 0.05841827392578125, 0.06129264831542969, 0.06416702270507812, 0.06704139709472656, 0.069915771484375, 0.07279014587402344, 0.07566452026367188, 0.07853889465332031, 0.08141326904296875, 0.08428764343261719, 0.08716201782226562, 0.09003639221191406, 0.0929107666015625, 0.09578514099121094, 0.09865951538085938, 0.10153388977050781, 0.10440826416015625, 0.10728263854980469, 0.11015701293945312, 0.11303138732910156, 0.11590576171875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 1.0, 5.0, 3.0, 12.0, 16.0, 51.0, 101.0, 197.0, 227.0, 188.0, 98.0, 50.0, 17.0, 8.0, 6.0, 5.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1568603515625, -0.15216064453125, -0.1474609375, -0.14276123046875, -0.1380615234375, -0.13336181640625, -0.128662109375, -0.12396240234375, -0.1192626953125, -0.11456298828125, -0.10986328125, -0.10516357421875, -0.1004638671875, -0.09576416015625, -0.091064453125, -0.08636474609375, -0.0816650390625, -0.07696533203125, -0.072265625, -0.06756591796875, -0.0628662109375, -0.05816650390625, -0.053466796875, -0.04876708984375, -0.0440673828125, -0.03936767578125, -0.03466796875, -0.02996826171875, -0.0252685546875, -0.02056884765625, -0.015869140625, -0.01116943359375, -0.0064697265625, -0.00177001953125, 0.0029296875, 0.00762939453125, 0.0123291015625, 0.01702880859375, 0.021728515625, 0.02642822265625, 0.0311279296875, 0.03582763671875, 0.04052734375, 0.04522705078125, 0.0499267578125, 0.05462646484375, 0.059326171875, 0.06402587890625, 0.0687255859375, 0.07342529296875, 0.078125, 0.08282470703125, 0.0875244140625, 0.09222412109375, 0.096923828125, 0.10162353515625, 0.1063232421875, 0.11102294921875, 0.11572265625, 0.12042236328125, 0.1251220703125, 0.12982177734375, 0.134521484375, 0.13922119140625, 0.1439208984375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 12.0, 29.0, 203.0, 411.0, 260.0, 64.0, 16.0, 9.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.722007751464844, -5.593622207641602, -5.465236663818359, -5.336851119995117, -5.208465576171875, -5.080080509185791, -4.951694965362549, -4.823309421539307, -4.6949238777160645, -4.566538333892822, -4.43815279006958, -4.309767246246338, -4.181382179260254, -4.052996635437012, -3.9246110916137695, -3.7962255477905273, -3.667840003967285, -3.539454460144043, -3.411068916320801, -3.2826836109161377, -3.1542980670928955, -3.0259125232696533, -2.8975272178649902, -2.769141674041748, -2.640756130218506, -2.5123705863952637, -2.3839850425720215, -2.2555997371673584, -2.127214193344116, -1.998828649520874, -1.8704432249069214, -1.7420578002929688, -1.6136727333068848, -1.4852871894836426, -1.35690176486969, -1.2285163402557373, -1.1001307964324951, -0.9717453122138977, -0.8433598279953003, -0.7149743437767029, -0.5865888595581055, -0.45820337533950806, -0.32981789112091064, -0.20143240690231323, -0.07304692268371582, 0.05533856153488159, 0.183724045753479, 0.3121095299720764, 0.44049501419067383, 0.5688804984092712, 0.6972659826278687, 0.8256514668464661, 0.9540369510650635, 1.0824224948883057, 1.2108079195022583, 1.339193344116211, 1.4675788879394531, 1.5959644317626953, 1.724349856376648, 1.8527352809906006, 1.9811208248138428, 2.109506368637085, 2.237891674041748, 2.3662772178649902, 2.4946627616882324]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 1.0, 5.0, 6.0, 6.0, 4.0, 5.0, 8.0, 10.0, 11.0, 21.0, 16.0, 24.0, 17.0, 23.0, 35.0, 30.0, 33.0, 37.0, 26.0, 40.0, 52.0, 43.0, 64.0, 43.0, 47.0, 34.0, 41.0, 30.0, 48.0, 30.0, 32.0, 25.0, 20.0, 25.0, 15.0, 18.0, 16.0, 10.0, 13.0, 10.0, 1.0, 10.0, 4.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.984366238117218, -0.9525429010391235, -0.920719563961029, -0.8888962268829346, -0.8570728898048401, -0.8252495527267456, -0.7934262752532959, -0.7616028785705566, -0.7297796010971069, -0.6979562640190125, -0.666132926940918, -0.6343095898628235, -0.602486252784729, -0.5706629157066345, -0.53883957862854, -0.5070163011550903, -0.4751929044723511, -0.4433695673942566, -0.4115462303161621, -0.3797228932380676, -0.34789955615997314, -0.31607621908187866, -0.28425291180610657, -0.2524295747280121, -0.2206062376499176, -0.18878290057182312, -0.15695956349372864, -0.12513624131679535, -0.09331290423870087, -0.061489567160606384, -0.029666244983673096, 0.0021570920944213867, 0.033980488777160645, 0.06580382585525513, 0.09762715548276901, 0.1294504851102829, 0.16127382218837738, 0.19309715926647186, 0.22492048144340515, 0.25674381852149963, 0.2885671555995941, 0.3203904926776886, 0.3522138297557831, 0.3840371370315552, 0.41586047410964966, 0.44768381118774414, 0.4795071482658386, 0.5113304853439331, 0.5431538224220276, 0.5749771595001221, 0.6068004965782166, 0.638623833656311, 0.6704471707344055, 0.7022705078125, 0.7340937852859497, 0.765917181968689, 0.7977404594421387, 0.8295637965202332, 0.8613871335983276, 0.8932104706764221, 0.9250338077545166, 0.9568571448326111, 0.9886804819107056, 1.0205037593841553, 1.0523271560668945]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 2.0, 2.0, 7.0, 5.0, 12.0, 13.0, 5.0, 15.0, 22.0, 24.0, 25.0, 38.0, 44.0, 53.0, 92.0, 232.0, 828.0, 4972.0, 4039510.0, 142902.0, 4103.0, 763.0, 214.0, 116.0, 57.0, 50.0, 28.0, 36.0, 26.0, 16.0, 13.0, 12.0, 10.0, 9.0, 5.0, 8.0, 2.0, 5.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3115234375, -0.3017768859863281, -0.29203033447265625, -0.2822837829589844, -0.2725372314453125, -0.2627906799316406, -0.25304412841796875, -0.24329757690429688, -0.233551025390625, -0.22380447387695312, -0.21405792236328125, -0.20431137084960938, -0.1945648193359375, -0.18481826782226562, -0.17507171630859375, -0.16532516479492188, -0.15557861328125, -0.14583206176757812, -0.13608551025390625, -0.12633895874023438, -0.1165924072265625, -0.10684585571289062, -0.09709930419921875, -0.08735275268554688, -0.077606201171875, -0.06785964965820312, -0.05811309814453125, -0.048366546630859375, -0.0386199951171875, -0.028873443603515625, -0.01912689208984375, -0.009380340576171875, 0.0003662109375, 0.010112762451171875, 0.01985931396484375, 0.029605865478515625, 0.0393524169921875, 0.049098968505859375, 0.05884552001953125, 0.06859207153320312, 0.078338623046875, 0.08808517456054688, 0.09783172607421875, 0.10757827758789062, 0.1173248291015625, 0.12707138061523438, 0.13681793212890625, 0.14656448364257812, 0.15631103515625, 0.16605758666992188, 0.17580413818359375, 0.18555068969726562, 0.1952972412109375, 0.20504379272460938, 0.21479034423828125, 0.22453689575195312, 0.234283447265625, 0.24402999877929688, 0.25377655029296875, 0.2635231018066406, 0.2732696533203125, 0.2830162048339844, 0.29276275634765625, 0.3025093078613281, 0.312255859375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 8.0, 7.0, 7.0, 6.0, 9.0, 17.0, 12.0, 18.0, 15.0, 19.0, 20.0, 30.0, 22.0, 34.0, 39.0, 37.0, 42.0, 32.0, 55.0, 53.0, 42.0, 52.0, 27.0, 44.0, 40.0, 30.0, 34.0, 44.0, 40.0, 32.0, 21.0, 19.0, 16.0, 11.0, 17.0, 14.0, 7.0, 4.0, 4.0, 3.0, 6.0, 3.0, 0.0, 2.0, 2.0, 4.0, 0.0, 1.0], "bins": [-0.06427001953125, -0.062487125396728516, -0.06070423126220703, -0.05892133712768555, -0.05713844299316406, -0.05535554885864258, -0.053572654724121094, -0.05178976058959961, -0.050006866455078125, -0.04822397232055664, -0.046441078186035156, -0.04465818405151367, -0.04287528991699219, -0.0410923957824707, -0.03930950164794922, -0.037526607513427734, -0.03574371337890625, -0.033960819244384766, -0.03217792510986328, -0.030395030975341797, -0.028612136840820312, -0.026829242706298828, -0.025046348571777344, -0.02326345443725586, -0.021480560302734375, -0.01969766616821289, -0.017914772033691406, -0.016131877899169922, -0.014348983764648438, -0.012566089630126953, -0.010783195495605469, -0.009000301361083984, -0.0072174072265625, -0.005434513092041016, -0.0036516189575195312, -0.0018687248229980469, -8.58306884765625e-05, 0.0016970634460449219, 0.0034799575805664062, 0.005262851715087891, 0.007045745849609375, 0.00882863998413086, 0.010611534118652344, 0.012394428253173828, 0.014177322387695312, 0.015960216522216797, 0.01774311065673828, 0.019526004791259766, 0.02130889892578125, 0.023091793060302734, 0.02487468719482422, 0.026657581329345703, 0.028440475463867188, 0.030223369598388672, 0.032006263732910156, 0.03378915786743164, 0.035572052001953125, 0.03735494613647461, 0.039137840270996094, 0.04092073440551758, 0.04270362854003906, 0.04448652267456055, 0.04626941680908203, 0.048052310943603516, 0.049835205078125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 6.0, 10.0, 3.0, 21.0, 15.0, 18.0, 31.0, 20.0, 25.0, 34.0, 49.0, 48.0, 93.0, 218.0, 1003.0, 8069.0, 4145239.0, 36374.0, 2157.0, 393.0, 142.0, 66.0, 47.0, 43.0, 28.0, 29.0, 13.0, 18.0, 23.0, 18.0, 17.0, 5.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.402587890625, -0.3909912109375, -0.37939453125, -0.3677978515625, -0.356201171875, -0.3446044921875, -0.3330078125, -0.3214111328125, -0.309814453125, -0.2982177734375, -0.28662109375, -0.2750244140625, -0.263427734375, -0.2518310546875, -0.240234375, -0.2286376953125, -0.217041015625, -0.2054443359375, -0.19384765625, -0.1822509765625, -0.170654296875, -0.1590576171875, -0.1474609375, -0.1358642578125, -0.124267578125, -0.1126708984375, -0.10107421875, -0.0894775390625, -0.077880859375, -0.0662841796875, -0.0546875, -0.0430908203125, -0.031494140625, -0.0198974609375, -0.00830078125, 0.0032958984375, 0.014892578125, 0.0264892578125, 0.0380859375, 0.0496826171875, 0.061279296875, 0.0728759765625, 0.08447265625, 0.0960693359375, 0.107666015625, 0.1192626953125, 0.130859375, 0.1424560546875, 0.154052734375, 0.1656494140625, 0.17724609375, 0.1888427734375, 0.200439453125, 0.2120361328125, 0.2236328125, 0.2352294921875, 0.246826171875, 0.2584228515625, 0.27001953125, 0.2816162109375, 0.293212890625, 0.3048095703125, 0.31640625, 0.3280029296875, 0.339599609375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 6.0, 5.0, 22.0, 90.0, 3869.0, 68.0, 16.0, 8.0, 2.0, 3.0], "bins": [-0.175537109375, -0.1725296974182129, -0.16952228546142578, -0.16651487350463867, -0.16350746154785156, -0.16050004959106445, -0.15749263763427734, -0.15448522567749023, -0.15147781372070312, -0.14847040176391602, -0.1454629898071289, -0.1424555778503418, -0.1394481658935547, -0.13644075393676758, -0.13343334197998047, -0.13042593002319336, -0.12741851806640625, -0.12441110610961914, -0.12140369415283203, -0.11839628219604492, -0.11538887023925781, -0.1123814582824707, -0.1093740463256836, -0.10636663436889648, -0.10335922241210938, -0.10035181045532227, -0.09734439849853516, -0.09433698654174805, -0.09132957458496094, -0.08832216262817383, -0.08531475067138672, -0.08230733871459961, -0.0792999267578125, -0.07629251480102539, -0.07328510284423828, -0.07027769088745117, -0.06727027893066406, -0.06426286697387695, -0.061255455017089844, -0.058248043060302734, -0.055240631103515625, -0.052233219146728516, -0.049225807189941406, -0.0462183952331543, -0.04321098327636719, -0.04020357131958008, -0.03719615936279297, -0.03418874740600586, -0.03118133544921875, -0.02817392349243164, -0.02516651153564453, -0.022159099578857422, -0.019151687622070312, -0.016144275665283203, -0.013136863708496094, -0.010129451751708984, -0.007122039794921875, -0.004114627838134766, -0.0011072158813476562, 0.0019001960754394531, 0.0049076080322265625, 0.007915019989013672, 0.010922431945800781, 0.01392984390258789, 0.016937255859375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 11.0, 40.0, 123.0, 617.0, 198.0, 20.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6806716322898865, -0.6592617034912109, -0.6378517746925354, -0.6164418458938599, -0.5950319170951843, -0.5736219882965088, -0.5522119998931885, -0.5308021306991577, -0.5093921422958374, -0.48798221349716187, -0.46657228469848633, -0.4451623558998108, -0.42375242710113525, -0.4023424983024597, -0.3809325397014618, -0.35952261090278625, -0.3381127119064331, -0.31670278310775757, -0.29529285430908203, -0.2738829255104065, -0.25247299671173096, -0.23106305301189423, -0.2096531093120575, -0.18824318051338196, -0.16683325171470642, -0.14542332291603088, -0.12401338666677475, -0.10260345041751862, -0.08119352161884308, -0.05978359282016754, -0.03837364912033081, -0.016963720321655273, 0.004446268081665039, 0.025856200605630875, 0.04726613312959671, 0.06867606937885284, 0.09008599817752838, 0.11149592697620392, 0.13290587067604065, 0.1543157994747162, 0.17572572827339172, 0.19713565707206726, 0.2185455858707428, 0.23995552957057953, 0.26136547327041626, 0.2827754020690918, 0.30418533086776733, 0.32559525966644287, 0.3470051884651184, 0.36841511726379395, 0.3898250460624695, 0.411234974861145, 0.43264490365982056, 0.4540548324584961, 0.475464791059494, 0.49687471985816956, 0.5182846784591675, 0.539694607257843, 0.5611045360565186, 0.5825144648551941, 0.6039243936538696, 0.6253343224525452, 0.6467442512512207, 0.668154239654541, 0.6895641088485718]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 4.0, 4.0, 12.0, 8.0, 9.0, 13.0, 16.0, 24.0, 27.0, 37.0, 27.0, 24.0, 35.0, 31.0, 52.0, 58.0, 42.0, 43.0, 49.0, 51.0, 50.0, 38.0, 47.0, 38.0, 35.0, 23.0, 34.0, 31.0, 30.0, 26.0, 17.0, 12.0, 10.0, 9.0, 14.0, 9.0, 6.0, 6.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.12235355377197266, -0.11856792122125626, -0.11478228867053986, -0.11099665611982346, -0.10721102356910706, -0.10342539101839066, -0.09963975846767426, -0.09585412591695786, -0.09206849336624146, -0.08828286081552505, -0.08449722826480865, -0.08071159571409225, -0.07692596316337585, -0.07314033061265945, -0.06935469806194305, -0.06556906551122665, -0.061783432960510254, -0.057997800409793854, -0.054212167859077454, -0.05042653530836105, -0.04664090275764465, -0.04285527020692825, -0.03906963765621185, -0.03528400510549545, -0.03149837255477905, -0.027712740004062653, -0.023927107453346252, -0.020141474902629852, -0.016355842351913452, -0.012570209801197052, -0.008784577250480652, -0.004998944699764252, -0.0012133121490478516, 0.0025723204016685486, 0.006357952952384949, 0.010143585503101349, 0.013929218053817749, 0.01771485060453415, 0.02150048315525055, 0.02528611570596695, 0.02907174825668335, 0.03285738080739975, 0.03664301335811615, 0.04042864590883255, 0.04421427845954895, 0.04799991101026535, 0.05178554356098175, 0.05557117611169815, 0.05935680866241455, 0.06314244121313095, 0.06692807376384735, 0.07071370631456375, 0.07449933886528015, 0.07828497141599655, 0.08207060396671295, 0.08585623651742935, 0.08964186906814575, 0.09342750161886215, 0.09721313416957855, 0.10099876672029495, 0.10478439927101135, 0.10857003182172775, 0.11235566437244415, 0.11614129692316055, 0.11992692947387695]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 5.0, 3.0, 9.0, 13.0, 10.0, 25.0, 20.0, 38.0, 52.0, 95.0, 125.0, 134.0, 222.0, 325.0, 435.0, 654.0, 977.0, 1710.0, 2966.0, 7143.0, 25349.0, 153863.0, 617208.0, 190961.0, 30119.0, 7967.0, 3177.0, 1689.0, 1055.0, 666.0, 437.0, 318.0, 234.0, 162.0, 98.0, 79.0, 66.0, 46.0, 29.0, 27.0, 13.0, 12.0, 10.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.1951904296875, -0.18937301635742188, -0.18355560302734375, -0.17773818969726562, -0.1719207763671875, -0.16610336303710938, -0.16028594970703125, -0.15446853637695312, -0.148651123046875, -0.14283370971679688, -0.13701629638671875, -0.13119888305664062, -0.1253814697265625, -0.11956405639648438, -0.11374664306640625, -0.10792922973632812, -0.10211181640625, -0.09629440307617188, -0.09047698974609375, -0.08465957641601562, -0.0788421630859375, -0.07302474975585938, -0.06720733642578125, -0.061389923095703125, -0.055572509765625, -0.049755096435546875, -0.04393768310546875, -0.038120269775390625, -0.0323028564453125, -0.026485443115234375, -0.02066802978515625, -0.014850616455078125, -0.009033203125, -0.003215789794921875, 0.00260162353515625, 0.008419036865234375, 0.0142364501953125, 0.020053863525390625, 0.02587127685546875, 0.031688690185546875, 0.037506103515625, 0.043323516845703125, 0.04914093017578125, 0.054958343505859375, 0.0607757568359375, 0.06659317016601562, 0.07241058349609375, 0.07822799682617188, 0.08404541015625, 0.08986282348632812, 0.09568023681640625, 0.10149765014648438, 0.1073150634765625, 0.11313247680664062, 0.11894989013671875, 0.12476730346679688, 0.130584716796875, 0.13640213012695312, 0.14221954345703125, 0.14803695678710938, 0.1538543701171875, 0.15967178344726562, 0.16548919677734375, 0.17130661010742188, 0.1771240234375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 4.0, 5.0, 3.0, 3.0, 6.0, 7.0, 12.0, 6.0, 9.0, 16.0, 18.0, 19.0, 25.0, 22.0, 31.0, 25.0, 40.0, 39.0, 29.0, 41.0, 41.0, 52.0, 44.0, 54.0, 40.0, 34.0, 38.0, 35.0, 45.0, 38.0, 39.0, 28.0, 23.0, 20.0, 16.0, 17.0, 16.0, 13.0, 17.0, 7.0, 9.0, 5.0, 5.0, 3.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.06689453125, -0.06491899490356445, -0.0629434585571289, -0.06096792221069336, -0.05899238586425781, -0.057016849517822266, -0.05504131317138672, -0.05306577682495117, -0.051090240478515625, -0.04911470413208008, -0.04713916778564453, -0.045163631439208984, -0.04318809509277344, -0.04121255874633789, -0.039237022399902344, -0.0372614860534668, -0.03528594970703125, -0.0333104133605957, -0.031334877014160156, -0.02935934066772461, -0.027383804321289062, -0.025408267974853516, -0.02343273162841797, -0.021457195281982422, -0.019481658935546875, -0.017506122589111328, -0.015530586242675781, -0.013555049896240234, -0.011579513549804688, -0.00960397720336914, -0.007628440856933594, -0.005652904510498047, -0.0036773681640625, -0.0017018318176269531, 0.00027370452880859375, 0.0022492408752441406, 0.0042247772216796875, 0.006200313568115234, 0.008175849914550781, 0.010151386260986328, 0.012126922607421875, 0.014102458953857422, 0.01607799530029297, 0.018053531646728516, 0.020029067993164062, 0.02200460433959961, 0.023980140686035156, 0.025955677032470703, 0.02793121337890625, 0.029906749725341797, 0.031882286071777344, 0.03385782241821289, 0.03583335876464844, 0.037808895111083984, 0.03978443145751953, 0.04175996780395508, 0.043735504150390625, 0.04571104049682617, 0.04768657684326172, 0.049662113189697266, 0.05163764953613281, 0.05361318588256836, 0.055588722229003906, 0.05756425857543945, 0.059539794921875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 7.0, 8.0, 16.0, 27.0, 47.0, 68.0, 87.0, 148.0, 229.0, 289.0, 451.0, 867.0, 1565.0, 3337.0, 12609.0, 462692.0, 545319.0, 13595.0, 3306.0, 1571.0, 897.0, 506.0, 327.0, 185.0, 149.0, 99.0, 57.0, 34.0, 20.0, 16.0, 7.0, 3.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.395263671875, -0.38364410400390625, -0.3720245361328125, -0.36040496826171875, -0.348785400390625, -0.33716583251953125, -0.3255462646484375, -0.31392669677734375, -0.30230712890625, -0.29068756103515625, -0.2790679931640625, -0.26744842529296875, -0.255828857421875, -0.24420928955078125, -0.2325897216796875, -0.22097015380859375, -0.2093505859375, -0.19773101806640625, -0.1861114501953125, -0.17449188232421875, -0.162872314453125, -0.15125274658203125, -0.1396331787109375, -0.12801361083984375, -0.11639404296875, -0.10477447509765625, -0.0931549072265625, -0.08153533935546875, -0.069915771484375, -0.05829620361328125, -0.0466766357421875, -0.03505706787109375, -0.0234375, -0.01181793212890625, -0.0001983642578125, 0.01142120361328125, 0.023040771484375, 0.03466033935546875, 0.0462799072265625, 0.05789947509765625, 0.06951904296875, 0.08113861083984375, 0.0927581787109375, 0.10437774658203125, 0.115997314453125, 0.12761688232421875, 0.1392364501953125, 0.15085601806640625, 0.1624755859375, 0.17409515380859375, 0.1857147216796875, 0.19733428955078125, 0.208953857421875, 0.22057342529296875, 0.2321929931640625, 0.24381256103515625, 0.25543212890625, 0.26705169677734375, 0.2786712646484375, 0.29029083251953125, 0.301910400390625, 0.31352996826171875, 0.3251495361328125, 0.33676910400390625, 0.348388671875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 2.0, 3.0, 2.0, 9.0, 7.0, 18.0, 9.0, 27.0, 33.0, 34.0, 41.0, 49.0, 52.0, 65.0, 42.0, 62.0, 69.0, 62.0, 56.0, 57.0, 54.0, 44.0, 42.0, 37.0, 25.0, 23.0, 23.0, 14.0, 8.0, 8.0, 4.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.413818359375, -0.4019775390625, -0.39013671875, -0.3782958984375, -0.366455078125, -0.3546142578125, -0.3427734375, -0.3309326171875, -0.319091796875, -0.3072509765625, -0.29541015625, -0.2835693359375, -0.271728515625, -0.2598876953125, -0.248046875, -0.2362060546875, -0.224365234375, -0.2125244140625, -0.20068359375, -0.1888427734375, -0.177001953125, -0.1651611328125, -0.1533203125, -0.1414794921875, -0.129638671875, -0.1177978515625, -0.10595703125, -0.0941162109375, -0.082275390625, -0.0704345703125, -0.05859375, -0.0467529296875, -0.034912109375, -0.0230712890625, -0.01123046875, 0.0006103515625, 0.012451171875, 0.0242919921875, 0.0361328125, 0.0479736328125, 0.059814453125, 0.0716552734375, 0.08349609375, 0.0953369140625, 0.107177734375, 0.1190185546875, 0.130859375, 0.1427001953125, 0.154541015625, 0.1663818359375, 0.17822265625, 0.1900634765625, 0.201904296875, 0.2137451171875, 0.2255859375, 0.2374267578125, 0.249267578125, 0.2611083984375, 0.27294921875, 0.2847900390625, 0.296630859375, 0.3084716796875, 0.3203125, 0.3321533203125, 0.343994140625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 9.0, 6.0, 29.0, 56.0, 163.0, 605.0, 3988.0, 588096.0, 450976.0, 3760.0, 591.0, 158.0, 60.0, 22.0, 9.0, 7.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.329345703125, -0.31871795654296875, -0.3080902099609375, -0.29746246337890625, -0.286834716796875, -0.27620697021484375, -0.2655792236328125, -0.25495147705078125, -0.24432373046875, -0.23369598388671875, -0.2230682373046875, -0.21244049072265625, -0.201812744140625, -0.19118499755859375, -0.1805572509765625, -0.16992950439453125, -0.1593017578125, -0.14867401123046875, -0.1380462646484375, -0.12741851806640625, -0.116790771484375, -0.10616302490234375, -0.0955352783203125, -0.08490753173828125, -0.07427978515625, -0.06365203857421875, -0.0530242919921875, -0.04239654541015625, -0.031768798828125, -0.02114105224609375, -0.0105133056640625, 0.00011444091796875, 0.0107421875, 0.02136993408203125, 0.0319976806640625, 0.04262542724609375, 0.053253173828125, 0.06388092041015625, 0.0745086669921875, 0.08513641357421875, 0.09576416015625, 0.10639190673828125, 0.1170196533203125, 0.12764739990234375, 0.138275146484375, 0.14890289306640625, 0.1595306396484375, 0.17015838623046875, 0.1807861328125, 0.19141387939453125, 0.2020416259765625, 0.21266937255859375, 0.223297119140625, 0.23392486572265625, 0.2445526123046875, 0.25518035888671875, 0.26580810546875, 0.27643585205078125, 0.2870635986328125, 0.29769134521484375, 0.308319091796875, 0.31894683837890625, 0.3295745849609375, 0.34020233154296875, 0.350830078125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 2.0, 13.0, 9.0, 26.0, 53.0, 90.0, 142.0, 169.0, 188.0, 117.0, 65.0, 43.0, 28.0, 15.0, 9.0, 10.0, 1.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8477439880371094e-05, -1.7729587852954865e-05, -1.6981735825538635e-05, -1.6233883798122406e-05, -1.5486031770706177e-05, -1.4738179743289948e-05, -1.3990327715873718e-05, -1.3242475688457489e-05, -1.249462366104126e-05, -1.174677163362503e-05, -1.0998919606208801e-05, -1.0251067578792572e-05, -9.503215551376343e-06, -8.755363523960114e-06, -8.007511496543884e-06, -7.259659469127655e-06, -6.511807441711426e-06, -5.7639554142951965e-06, -5.016103386878967e-06, -4.268251359462738e-06, -3.520399332046509e-06, -2.7725473046302795e-06, -2.0246952772140503e-06, -1.276843249797821e-06, -5.289912223815918e-07, 2.1886080503463745e-07, 9.667128324508667e-07, 1.714564859867096e-06, 2.462416887283325e-06, 3.2102689146995544e-06, 3.958120942115784e-06, 4.705972969532013e-06, 5.453824996948242e-06, 6.2016770243644714e-06, 6.949529051780701e-06, 7.69738107919693e-06, 8.44523310661316e-06, 9.193085134029388e-06, 9.940937161445618e-06, 1.0688789188861847e-05, 1.1436641216278076e-05, 1.2184493243694305e-05, 1.2932345271110535e-05, 1.3680197298526764e-05, 1.4428049325942993e-05, 1.5175901353359222e-05, 1.592375338077545e-05, 1.667160540819168e-05, 1.741945743560791e-05, 1.816730946302414e-05, 1.891516149044037e-05, 1.9663013517856598e-05, 2.0410865545272827e-05, 2.1158717572689056e-05, 2.1906569600105286e-05, 2.2654421627521515e-05, 2.3402273654937744e-05, 2.4150125682353973e-05, 2.4897977709770203e-05, 2.5645829737186432e-05, 2.639368176460266e-05, 2.714153379201889e-05, 2.788938581943512e-05, 2.863723784685135e-05, 2.9385089874267578e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 9.0, 1.0, 8.0, 7.0, 7.0, 9.0, 18.0, 16.0, 28.0, 63.0, 116.0, 191.0, 397.0, 893.0, 2374.0, 7687.0, 57973.0, 930807.0, 37801.0, 6506.0, 2149.0, 762.0, 360.0, 151.0, 98.0, 36.0, 27.0, 27.0, 11.0, 8.0, 4.0, 4.0, 4.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16796875, -0.16294479370117188, -0.15792083740234375, -0.15289688110351562, -0.1478729248046875, -0.14284896850585938, -0.13782501220703125, -0.13280105590820312, -0.127777099609375, -0.12275314331054688, -0.11772918701171875, -0.11270523071289062, -0.1076812744140625, -0.10265731811523438, -0.09763336181640625, -0.09260940551757812, -0.08758544921875, -0.08256149291992188, -0.07753753662109375, -0.07251358032226562, -0.0674896240234375, -0.062465667724609375, -0.05744171142578125, -0.052417755126953125, -0.047393798828125, -0.042369842529296875, -0.03734588623046875, -0.032321929931640625, -0.0272979736328125, -0.022274017333984375, -0.01725006103515625, -0.012226104736328125, -0.0072021484375, -0.002178192138671875, 0.00284576416015625, 0.007869720458984375, 0.0128936767578125, 0.017917633056640625, 0.02294158935546875, 0.027965545654296875, 0.032989501953125, 0.038013458251953125, 0.04303741455078125, 0.048061370849609375, 0.0530853271484375, 0.058109283447265625, 0.06313323974609375, 0.06815719604492188, 0.07318115234375, 0.07820510864257812, 0.08322906494140625, 0.08825302124023438, 0.0932769775390625, 0.09830093383789062, 0.10332489013671875, 0.10834884643554688, 0.113372802734375, 0.11839675903320312, 0.12342071533203125, 0.12844467163085938, 0.1334686279296875, 0.13849258422851562, 0.14351654052734375, 0.14854049682617188, 0.153564453125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 5.0, 2.0, 5.0, 3.0, 4.0, 2.0, 5.0, 6.0, 10.0, 40.0, 77.0, 230.0, 293.0, 178.0, 59.0, 20.0, 13.0, 5.0, 4.0, 4.0, 5.0, 5.0, 2.0, 4.0, 2.0, 3.0, 0.0, 4.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.37060546875, -0.36067962646484375, -0.3507537841796875, -0.34082794189453125, -0.330902099609375, -0.32097625732421875, -0.3110504150390625, -0.30112457275390625, -0.29119873046875, -0.28127288818359375, -0.2713470458984375, -0.26142120361328125, -0.251495361328125, -0.24156951904296875, -0.2316436767578125, -0.22171783447265625, -0.2117919921875, -0.20186614990234375, -0.1919403076171875, -0.18201446533203125, -0.172088623046875, -0.16216278076171875, -0.1522369384765625, -0.14231109619140625, -0.13238525390625, -0.12245941162109375, -0.1125335693359375, -0.10260772705078125, -0.092681884765625, -0.08275604248046875, -0.0728302001953125, -0.06290435791015625, -0.052978515625, -0.04305267333984375, -0.0331268310546875, -0.02320098876953125, -0.013275146484375, -0.00334930419921875, 0.0065765380859375, 0.01650238037109375, 0.02642822265625, 0.03635406494140625, 0.0462799072265625, 0.05620574951171875, 0.066131591796875, 0.07605743408203125, 0.0859832763671875, 0.09590911865234375, 0.1058349609375, 0.11576080322265625, 0.1256866455078125, 0.13561248779296875, 0.145538330078125, 0.15546417236328125, 0.1653900146484375, 0.17531585693359375, 0.18524169921875, 0.19516754150390625, 0.2050933837890625, 0.21501922607421875, 0.224945068359375, 0.23487091064453125, 0.2447967529296875, 0.25472259521484375, 0.2646484375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 6.0, 3.0, 11.0, 23.0, 43.0, 97.0, 187.0, 282.0, 221.0, 79.0, 37.0, 14.0, 8.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8872499465942383, -3.792384147644043, -3.6975183486938477, -3.6026525497436523, -3.507786750793457, -3.4129209518432617, -3.3180551528930664, -3.223189353942871, -3.128323554992676, -3.0334577560424805, -2.938591957092285, -2.84372615814209, -2.7488603591918945, -2.653994560241699, -2.559128761291504, -2.4642629623413086, -2.3693971633911133, -2.274531364440918, -2.1796655654907227, -2.0847997665405273, -1.989933967590332, -1.8950681686401367, -1.8002023696899414, -1.705336570739746, -1.6104707717895508, -1.5156049728393555, -1.4207391738891602, -1.3258733749389648, -1.2310075759887695, -1.1361417770385742, -1.041275978088379, -0.9464101791381836, -0.8515441417694092, -0.7566783428192139, -0.6618125438690186, -0.5669467449188232, -0.47208094596862793, -0.3772151470184326, -0.2823493480682373, -0.187483549118042, -0.09261775016784668, 0.002248048782348633, 0.09711384773254395, 0.19197964668273926, 0.28684544563293457, 0.3817112445831299, 0.4765770435333252, 0.5714428424835205, 0.6663086414337158, 0.7611744403839111, 0.8560402393341064, 0.9509060382843018, 1.045771837234497, 1.1406376361846924, 1.2355034351348877, 1.330369234085083, 1.4252350330352783, 1.5201008319854736, 1.614966630935669, 1.7098324298858643, 1.8046982288360596, 1.8995640277862549, 1.9944298267364502, 2.0892956256866455, 2.184161424636841]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 2.0, 3.0, 3.0, 9.0, 6.0, 8.0, 13.0, 11.0, 14.0, 18.0, 29.0, 30.0, 29.0, 42.0, 32.0, 50.0, 35.0, 51.0, 45.0, 45.0, 59.0, 57.0, 73.0, 42.0, 35.0, 37.0, 45.0, 33.0, 26.0, 24.0, 15.0, 17.0, 11.0, 11.0, 11.0, 9.0, 9.0, 6.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.568739414215088, -1.5169123411178589, -1.4650852680206299, -1.4132580757141113, -1.3614310026168823, -1.3096039295196533, -1.2577768564224243, -1.2059497833251953, -1.1541227102279663, -1.1022956371307373, -1.0504685640335083, -0.9986414313316345, -0.9468143582344055, -0.8949872255325317, -0.8431601524353027, -0.7913330793380737, -0.7395059466362, -0.687678873538971, -0.6358517408370972, -0.5840246677398682, -0.5321975946426392, -0.48037049174308777, -0.4285433888435364, -0.3767163157463074, -0.324889212846756, -0.2730621099472046, -0.22123503684997559, -0.1694079339504242, -0.117580845952034, -0.0657537579536438, -0.013926655054092407, 0.0379004180431366, 0.08972752094268799, 0.14155460894107819, 0.19338169693946838, 0.24520879983901978, 0.2970358729362488, 0.34886297583580017, 0.40069007873535156, 0.45251715183258057, 0.5043442249298096, 0.5561712980270386, 0.6079984307289124, 0.6598255038261414, 0.7116525769233704, 0.7634797096252441, 0.8153067827224731, 0.8671338558197021, 0.9189609885215759, 0.9707880616188049, 1.0226151943206787, 1.0744422674179077, 1.1262693405151367, 1.1780964136123657, 1.2299234867095947, 1.2817506790161133, 1.3335777521133423, 1.3854048252105713, 1.4372318983078003, 1.4890589714050293, 1.5408861637115479, 1.5927132368087769, 1.6445403099060059, 1.6963673830032349, 1.7481944561004639]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 2.0, 7.0, 6.0, 4.0, 8.0, 5.0, 7.0, 10.0, 15.0, 27.0, 28.0, 30.0, 51.0, 101.0, 207.0, 538.0, 2782.0, 54711.0, 4125745.0, 8354.0, 985.0, 292.0, 130.0, 71.0, 58.0, 24.0, 21.0, 16.0, 13.0, 11.0, 6.0, 4.0, 3.0, 4.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.455322265625, -0.4424018859863281, -0.42948150634765625, -0.4165611267089844, -0.4036407470703125, -0.3907203674316406, -0.37779998779296875, -0.3648796081542969, -0.351959228515625, -0.3390388488769531, -0.32611846923828125, -0.3131980895996094, -0.3002777099609375, -0.2873573303222656, -0.27443695068359375, -0.2615165710449219, -0.24859619140625, -0.23567581176757812, -0.22275543212890625, -0.20983505249023438, -0.1969146728515625, -0.18399429321289062, -0.17107391357421875, -0.15815353393554688, -0.145233154296875, -0.13231277465820312, -0.11939239501953125, -0.10647201538085938, -0.0935516357421875, -0.08063125610351562, -0.06771087646484375, -0.054790496826171875, -0.0418701171875, -0.028949737548828125, -0.01602935791015625, -0.003108978271484375, 0.0098114013671875, 0.022731781005859375, 0.03565216064453125, 0.048572540283203125, 0.061492919921875, 0.07441329956054688, 0.08733367919921875, 0.10025405883789062, 0.1131744384765625, 0.12609481811523438, 0.13901519775390625, 0.15193557739257812, 0.16485595703125, 0.17777633666992188, 0.19069671630859375, 0.20361709594726562, 0.2165374755859375, 0.22945785522460938, 0.24237823486328125, 0.2552986145019531, 0.268218994140625, 0.2811393737792969, 0.29405975341796875, 0.3069801330566406, 0.3199005126953125, 0.3328208923339844, 0.34574127197265625, 0.3586616516113281, 0.37158203125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 10.0, 10.0, 12.0, 12.0, 32.0, 29.0, 25.0, 32.0, 42.0, 59.0, 69.0, 74.0, 69.0, 69.0, 70.0, 68.0, 65.0, 47.0, 52.0, 47.0, 30.0, 26.0, 13.0, 12.0, 6.0, 7.0, 5.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0955810546875, -0.09228992462158203, -0.08899879455566406, -0.0857076644897461, -0.08241653442382812, -0.07912540435791016, -0.07583427429199219, -0.07254314422607422, -0.06925201416015625, -0.06596088409423828, -0.06266975402832031, -0.059378623962402344, -0.056087493896484375, -0.052796363830566406, -0.04950523376464844, -0.04621410369873047, -0.0429229736328125, -0.03963184356689453, -0.03634071350097656, -0.033049583435058594, -0.029758453369140625, -0.026467323303222656, -0.023176193237304688, -0.01988506317138672, -0.01659393310546875, -0.013302803039550781, -0.010011672973632812, -0.006720542907714844, -0.003429412841796875, -0.00013828277587890625, 0.0031528472900390625, 0.006443977355957031, 0.009735107421875, 0.013026237487792969, 0.016317367553710938, 0.019608497619628906, 0.022899627685546875, 0.026190757751464844, 0.029481887817382812, 0.03277301788330078, 0.03606414794921875, 0.03935527801513672, 0.04264640808105469, 0.045937538146972656, 0.049228668212890625, 0.052519798278808594, 0.05581092834472656, 0.05910205841064453, 0.0623931884765625, 0.06568431854248047, 0.06897544860839844, 0.0722665786743164, 0.07555770874023438, 0.07884883880615234, 0.08213996887207031, 0.08543109893798828, 0.08872222900390625, 0.09201335906982422, 0.09530448913574219, 0.09859561920166016, 0.10188674926757812, 0.1051778793334961, 0.10846900939941406, 0.11176013946533203, 0.11505126953125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 6.0, 6.0, 11.0, 12.0, 16.0, 20.0, 27.0, 35.0, 55.0, 63.0, 97.0, 100.0, 162.0, 163.0, 221.0, 288.0, 344.0, 557.0, 3000.0, 4178972.0, 7770.0, 617.0, 398.0, 288.0, 210.0, 162.0, 127.0, 114.0, 82.0, 69.0, 68.0, 51.0, 37.0, 38.0, 22.0, 17.0, 14.0, 12.0, 11.0, 4.0, 8.0, 0.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.91943359375, -0.8883743286132812, -0.8573150634765625, -0.8262557983398438, -0.795196533203125, -0.7641372680664062, -0.7330780029296875, -0.7020187377929688, -0.67095947265625, -0.6399002075195312, -0.6088409423828125, -0.5777816772460938, -0.546722412109375, -0.5156631469726562, -0.4846038818359375, -0.45354461669921875, -0.4224853515625, -0.39142608642578125, -0.3603668212890625, -0.32930755615234375, -0.298248291015625, -0.26718902587890625, -0.2361297607421875, -0.20507049560546875, -0.17401123046875, -0.14295196533203125, -0.1118927001953125, -0.08083343505859375, -0.049774169921875, -0.01871490478515625, 0.0123443603515625, 0.04340362548828125, 0.074462890625, 0.10552215576171875, 0.1365814208984375, 0.16764068603515625, 0.198699951171875, 0.22975921630859375, 0.2608184814453125, 0.29187774658203125, 0.32293701171875, 0.35399627685546875, 0.3850555419921875, 0.41611480712890625, 0.447174072265625, 0.47823333740234375, 0.5092926025390625, 0.5403518676757812, 0.5714111328125, 0.6024703979492188, 0.6335296630859375, 0.6645889282226562, 0.695648193359375, 0.7267074584960938, 0.7577667236328125, 0.7888259887695312, 0.81988525390625, 0.8509445190429688, 0.8820037841796875, 0.9130630493164062, 0.944122314453125, 0.9751815795898438, 1.0062408447265625, 1.0373001098632812, 1.068359375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 9.0, 103.0, 3926.0, 38.0, 11.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.237060546875, -0.22058486938476562, -0.20410919189453125, -0.18763351440429688, -0.1711578369140625, -0.15468215942382812, -0.13820648193359375, -0.12173080444335938, -0.105255126953125, -0.08877944946289062, -0.07230377197265625, -0.055828094482421875, -0.0393524169921875, -0.022876739501953125, -0.00640106201171875, 0.010074615478515625, 0.02655029296875, 0.043025970458984375, 0.05950164794921875, 0.07597732543945312, 0.0924530029296875, 0.10892868041992188, 0.12540435791015625, 0.14188003540039062, 0.158355712890625, 0.17483139038085938, 0.19130706787109375, 0.20778274536132812, 0.2242584228515625, 0.24073410034179688, 0.25720977783203125, 0.2736854553222656, 0.2901611328125, 0.3066368103027344, 0.32311248779296875, 0.3395881652832031, 0.3560638427734375, 0.3725395202636719, 0.38901519775390625, 0.4054908752441406, 0.421966552734375, 0.4384422302246094, 0.45491790771484375, 0.4713935852050781, 0.4878692626953125, 0.5043449401855469, 0.5208206176757812, 0.5372962951660156, 0.55377197265625, 0.5702476501464844, 0.5867233276367188, 0.6031990051269531, 0.6196746826171875, 0.6361503601074219, 0.6526260375976562, 0.6691017150878906, 0.685577392578125, 0.7020530700683594, 0.7185287475585938, 0.7350044250488281, 0.7514801025390625, 0.7679557800292969, 0.7844314575195312, 0.8009071350097656, 0.8173828125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 9.0, 12.0, 21.0, 59.0, 98.0, 246.0, 265.0, 158.0, 64.0, 54.0, 11.0, 6.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5737394690513611, -0.5339073538780212, -0.49407529830932617, -0.45424318313598633, -0.41441112756729126, -0.3745790123939514, -0.33474692702293396, -0.2949148416519165, -0.25508275628089905, -0.2152506709098816, -0.17541858553886414, -0.13558648526668549, -0.09575439989566803, -0.055922314524650574, -0.016090214252471924, 0.023741871118545532, 0.06357395648956299, 0.10340604186058044, 0.1432381272315979, 0.18307022750377655, 0.222902312874794, 0.26273441314697266, 0.3025664985179901, 0.34239858388900757, 0.382230669260025, 0.4220627546310425, 0.46189484000205994, 0.5017269253730774, 0.5415590405464172, 0.5813910961151123, 0.6212232112884521, 0.661055326461792, 0.7008873224258423, 0.7407194375991821, 0.7805514931678772, 0.820383608341217, 0.8602156639099121, 0.900047779083252, 0.9398798942565918, 0.9797119498252869, 1.019544005393982, 1.0593761205673218, 1.0992082357406616, 1.139040231704712, 1.1788723468780518, 1.2187044620513916, 1.2585365772247314, 1.2983686923980713, 1.3382008075714111, 1.378032922744751, 1.4178650379180908, 1.4576970338821411, 1.497529149055481, 1.5373612642288208, 1.5771933794021606, 1.617025375366211, 1.6568574905395508, 1.6966896057128906, 1.7365217208862305, 1.7763537168502808, 1.8161858320236206, 1.8560179471969604, 1.8958500623703003, 1.9356820583343506, 1.9755141735076904]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 0.0, 6.0, 10.0, 10.0, 17.0, 14.0, 26.0, 38.0, 59.0, 64.0, 96.0, 123.0, 110.0, 106.0, 80.0, 72.0, 51.0, 38.0, 20.0, 25.0, 11.0, 7.0, 10.0, 5.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3556588888168335, -1.3171637058258057, -1.2786684036254883, -1.2401732206344604, -1.201677918434143, -1.1631827354431152, -1.1246874332427979, -1.08619225025177, -1.0476969480514526, -1.0092017650604248, -0.9707064628601074, -0.9322112202644348, -0.8937159776687622, -0.8552207350730896, -0.816725492477417, -0.7782303094863892, -0.7397350668907166, -0.701239824295044, -0.6627445816993713, -0.6242493391036987, -0.5857540965080261, -0.5472588539123535, -0.5087636709213257, -0.4702683985233307, -0.4317731559276581, -0.3932779133319855, -0.35478267073631287, -0.31628745794296265, -0.27779221534729004, -0.23929695785045624, -0.20080173015594482, -0.16230648756027222, -0.12381124496459961, -0.085316002368927, -0.04682076722383499, -0.008325532078742981, 0.030169710516929626, 0.06866495311260223, 0.10716018080711365, 0.14565542340278625, 0.18415066599845886, 0.22264590859413147, 0.2611411511898041, 0.2996363639831543, 0.3381316065788269, 0.3766268491744995, 0.4151220917701721, 0.4536173343658447, 0.49211257696151733, 0.5306078195571899, 0.5691030621528625, 0.6075983047485352, 0.6460935473442078, 0.6845887899398804, 0.7230839729309082, 0.7615792751312256, 0.8000744581222534, 0.838569700717926, 0.8770649433135986, 0.9155601859092712, 0.9540554285049438, 0.9925506711006165, 1.031045913696289, 1.069541096687317, 1.1080363988876343]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 8.0, 7.0, 13.0, 27.0, 20.0, 25.0, 40.0, 75.0, 129.0, 211.0, 401.0, 669.0, 1501.0, 3130.0, 7858.0, 21896.0, 70724.0, 271329.0, 461513.0, 145629.0, 40387.0, 13392.0, 5090.0, 2194.0, 1008.0, 517.0, 296.0, 166.0, 89.0, 76.0, 43.0, 25.0, 14.0, 14.0, 10.0, 12.0, 4.0, 1.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1666259765625, -0.16146278381347656, -0.15629959106445312, -0.1511363983154297, -0.14597320556640625, -0.1408100128173828, -0.13564682006835938, -0.13048362731933594, -0.1253204345703125, -0.12015724182128906, -0.11499404907226562, -0.10983085632324219, -0.10466766357421875, -0.09950447082519531, -0.09434127807617188, -0.08917808532714844, -0.084014892578125, -0.07885169982910156, -0.07368850708007812, -0.06852531433105469, -0.06336212158203125, -0.05819892883300781, -0.053035736083984375, -0.04787254333496094, -0.0427093505859375, -0.03754615783691406, -0.032382965087890625, -0.027219772338867188, -0.02205657958984375, -0.016893386840820312, -0.011730194091796875, -0.0065670013427734375, -0.00140380859375, 0.0037593841552734375, 0.008922576904296875, 0.014085769653320312, 0.01924896240234375, 0.024412155151367188, 0.029575347900390625, 0.03473854064941406, 0.0399017333984375, 0.04506492614746094, 0.050228118896484375, 0.05539131164550781, 0.06055450439453125, 0.06571769714355469, 0.07088088989257812, 0.07604408264160156, 0.081207275390625, 0.08637046813964844, 0.09153366088867188, 0.09669685363769531, 0.10186004638671875, 0.10702323913574219, 0.11218643188476562, 0.11734962463378906, 0.1225128173828125, 0.12767601013183594, 0.13283920288085938, 0.1380023956298828, 0.14316558837890625, 0.1483287811279297, 0.15349197387695312, 0.15865516662597656, 0.163818359375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 6.0, 6.0, 14.0, 15.0, 26.0, 30.0, 36.0, 51.0, 71.0, 92.0, 102.0, 100.0, 79.0, 83.0, 63.0, 60.0, 48.0, 54.0, 25.0, 14.0, 15.0, 7.0, 7.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1722412109375, -0.167266845703125, -0.16229248046875, -0.157318115234375, -0.15234375, -0.147369384765625, -0.14239501953125, -0.137420654296875, -0.1324462890625, -0.127471923828125, -0.12249755859375, -0.117523193359375, -0.112548828125, -0.107574462890625, -0.10260009765625, -0.097625732421875, -0.0926513671875, -0.087677001953125, -0.08270263671875, -0.077728271484375, -0.07275390625, -0.067779541015625, -0.06280517578125, -0.057830810546875, -0.0528564453125, -0.047882080078125, -0.04290771484375, -0.037933349609375, -0.032958984375, -0.027984619140625, -0.02301025390625, -0.018035888671875, -0.0130615234375, -0.008087158203125, -0.00311279296875, 0.001861572265625, 0.0068359375, 0.011810302734375, 0.01678466796875, 0.021759033203125, 0.0267333984375, 0.031707763671875, 0.03668212890625, 0.041656494140625, 0.046630859375, 0.051605224609375, 0.05657958984375, 0.061553955078125, 0.0665283203125, 0.071502685546875, 0.07647705078125, 0.081451416015625, 0.08642578125, 0.091400146484375, 0.09637451171875, 0.101348876953125, 0.1063232421875, 0.111297607421875, 0.11627197265625, 0.121246337890625, 0.126220703125, 0.131195068359375, 0.13616943359375, 0.141143798828125, 0.1461181640625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 8.0, 12.0, 26.0, 59.0, 82.0, 166.0, 320.0, 705.0, 3535.0, 431426.0, 606753.0, 3946.0, 805.0, 301.0, 158.0, 104.0, 56.0, 28.0, 20.0, 11.0, 4.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.92822265625, -0.90093994140625, -0.8736572265625, -0.84637451171875, -0.819091796875, -0.79180908203125, -0.7645263671875, -0.73724365234375, -0.7099609375, -0.68267822265625, -0.6553955078125, -0.62811279296875, -0.600830078125, -0.57354736328125, -0.5462646484375, -0.51898193359375, -0.49169921875, -0.46441650390625, -0.4371337890625, -0.40985107421875, -0.382568359375, -0.35528564453125, -0.3280029296875, -0.30072021484375, -0.2734375, -0.24615478515625, -0.2188720703125, -0.19158935546875, -0.164306640625, -0.13702392578125, -0.1097412109375, -0.08245849609375, -0.05517578125, -0.02789306640625, -0.0006103515625, 0.02667236328125, 0.053955078125, 0.08123779296875, 0.1085205078125, 0.13580322265625, 0.1630859375, 0.19036865234375, 0.2176513671875, 0.24493408203125, 0.272216796875, 0.29949951171875, 0.3267822265625, 0.35406494140625, 0.38134765625, 0.40863037109375, 0.4359130859375, 0.46319580078125, 0.490478515625, 0.51776123046875, 0.5450439453125, 0.57232666015625, 0.599609375, 0.62689208984375, 0.6541748046875, 0.68145751953125, 0.708740234375, 0.73602294921875, 0.7633056640625, 0.79058837890625, 0.81787109375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 13.0, 21.0, 44.0, 87.0, 143.0, 165.0, 169.0, 158.0, 107.0, 59.0, 27.0, 11.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1640625, -1.1253204345703125, -1.086578369140625, -1.0478363037109375, -1.00909423828125, -0.9703521728515625, -0.931610107421875, -0.8928680419921875, -0.8541259765625, -0.8153839111328125, -0.776641845703125, -0.7378997802734375, -0.69915771484375, -0.6604156494140625, -0.621673583984375, -0.5829315185546875, -0.544189453125, -0.5054473876953125, -0.466705322265625, -0.4279632568359375, -0.38922119140625, -0.3504791259765625, -0.311737060546875, -0.2729949951171875, -0.2342529296875, -0.1955108642578125, -0.156768798828125, -0.1180267333984375, -0.07928466796875, -0.0405426025390625, -0.001800537109375, 0.0369415283203125, 0.07568359375, 0.1144256591796875, 0.153167724609375, 0.1919097900390625, 0.23065185546875, 0.2693939208984375, 0.308135986328125, 0.3468780517578125, 0.3856201171875, 0.4243621826171875, 0.463104248046875, 0.5018463134765625, 0.54058837890625, 0.5793304443359375, 0.618072509765625, 0.6568145751953125, 0.695556640625, 0.7342987060546875, 0.773040771484375, 0.8117828369140625, 0.85052490234375, 0.8892669677734375, 0.928009033203125, 0.9667510986328125, 1.0054931640625, 1.0442352294921875, 1.082977294921875, 1.1217193603515625, 1.16046142578125, 1.1992034912109375, 1.237945556640625, 1.2766876220703125, 1.3154296875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 4.0, 2.0, 3.0, 4.0, 3.0, 14.0, 15.0, 19.0, 30.0, 51.0, 87.0, 157.0, 317.0, 741.0, 2774.0, 17823.0, 479082.0, 524532.0, 18568.0, 2801.0, 811.0, 341.0, 168.0, 78.0, 40.0, 35.0, 21.0, 7.0, 9.0, 8.0, 3.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09051513671875, -0.08658123016357422, -0.08264732360839844, -0.07871341705322266, -0.07477951049804688, -0.0708456039428711, -0.06691169738769531, -0.06297779083251953, -0.05904388427734375, -0.05510997772216797, -0.05117607116699219, -0.047242164611816406, -0.043308258056640625, -0.039374351501464844, -0.03544044494628906, -0.03150653839111328, -0.0275726318359375, -0.02363872528076172, -0.019704818725585938, -0.015770912170410156, -0.011837005615234375, -0.007903099060058594, -0.0039691925048828125, -3.528594970703125e-05, 0.00389862060546875, 0.007832527160644531, 0.011766433715820312, 0.015700340270996094, 0.019634246826171875, 0.023568153381347656, 0.027502059936523438, 0.03143596649169922, 0.035369873046875, 0.03930377960205078, 0.04323768615722656, 0.047171592712402344, 0.051105499267578125, 0.055039405822753906, 0.05897331237792969, 0.06290721893310547, 0.06684112548828125, 0.07077503204345703, 0.07470893859863281, 0.0786428451538086, 0.08257675170898438, 0.08651065826416016, 0.09044456481933594, 0.09437847137451172, 0.0983123779296875, 0.10224628448486328, 0.10618019104003906, 0.11011409759521484, 0.11404800415039062, 0.1179819107055664, 0.12191581726074219, 0.12584972381591797, 0.12978363037109375, 0.13371753692626953, 0.1376514434814453, 0.1415853500366211, 0.14551925659179688, 0.14945316314697266, 0.15338706970214844, 0.15732097625732422, 0.1612548828125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 3.0, 3.0, 4.0, 4.0, 5.0, 13.0, 11.0, 18.0, 26.0, 32.0, 57.0, 55.0, 94.0, 105.0, 114.0, 99.0, 91.0, 78.0, 55.0, 28.0, 24.0, 19.0, 15.0, 10.0, 13.0, 6.0, 5.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.9788742065429688e-05, -1.9245781004428864e-05, -1.870281994342804e-05, -1.8159858882427216e-05, -1.761689782142639e-05, -1.7073936760425568e-05, -1.6530975699424744e-05, -1.598801463842392e-05, -1.5445053577423096e-05, -1.4902092516422272e-05, -1.4359131455421448e-05, -1.3816170394420624e-05, -1.32732093334198e-05, -1.2730248272418976e-05, -1.2187287211418152e-05, -1.1644326150417328e-05, -1.1101365089416504e-05, -1.055840402841568e-05, -1.0015442967414856e-05, -9.472481906414032e-06, -8.929520845413208e-06, -8.386559784412384e-06, -7.84359872341156e-06, -7.300637662410736e-06, -6.757676601409912e-06, -6.214715540409088e-06, -5.671754479408264e-06, -5.12879341840744e-06, -4.585832357406616e-06, -4.042871296405792e-06, -3.4999102354049683e-06, -2.9569491744041443e-06, -2.4139881134033203e-06, -1.8710270524024963e-06, -1.3280659914016724e-06, -7.851049304008484e-07, -2.421438694000244e-07, 3.0081719160079956e-07, 8.437782526016235e-07, 1.3867393136024475e-06, 1.9297003746032715e-06, 2.4726614356040955e-06, 3.0156224966049194e-06, 3.5585835576057434e-06, 4.101544618606567e-06, 4.644505679607391e-06, 5.187466740608215e-06, 5.730427801609039e-06, 6.273388862609863e-06, 6.816349923610687e-06, 7.359310984611511e-06, 7.902272045612335e-06, 8.44523310661316e-06, 8.988194167613983e-06, 9.531155228614807e-06, 1.0074116289615631e-05, 1.0617077350616455e-05, 1.1160038411617279e-05, 1.1702999472618103e-05, 1.2245960533618927e-05, 1.2788921594619751e-05, 1.3331882655620575e-05, 1.3874843716621399e-05, 1.4417804777622223e-05, 1.4960765838623047e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 5.0, 2.0, 6.0, 8.0, 5.0, 12.0, 25.0, 33.0, 63.0, 113.0, 233.0, 554.0, 1536.0, 6412.0, 64976.0, 896514.0, 68831.0, 6602.0, 1533.0, 594.0, 217.0, 120.0, 65.0, 39.0, 14.0, 19.0, 12.0, 6.0, 6.0, 6.0, 2.0, 3.0], "bins": [-0.1876220703125, -0.18367290496826172, -0.17972373962402344, -0.17577457427978516, -0.17182540893554688, -0.1678762435913086, -0.1639270782470703, -0.15997791290283203, -0.15602874755859375, -0.15207958221435547, -0.1481304168701172, -0.1441812515258789, -0.14023208618164062, -0.13628292083740234, -0.13233375549316406, -0.12838459014892578, -0.1244354248046875, -0.12048625946044922, -0.11653709411621094, -0.11258792877197266, -0.10863876342773438, -0.1046895980834961, -0.10074043273925781, -0.09679126739501953, -0.09284210205078125, -0.08889293670654297, -0.08494377136230469, -0.0809946060180664, -0.07704544067382812, -0.07309627532958984, -0.06914710998535156, -0.06519794464111328, -0.061248779296875, -0.05729961395263672, -0.05335044860839844, -0.049401283264160156, -0.045452117919921875, -0.041502952575683594, -0.03755378723144531, -0.03360462188720703, -0.02965545654296875, -0.02570629119873047, -0.021757125854492188, -0.017807960510253906, -0.013858795166015625, -0.009909629821777344, -0.0059604644775390625, -0.0020112991333007812, 0.0019378662109375, 0.005887031555175781, 0.009836196899414062, 0.013785362243652344, 0.017734527587890625, 0.021683692932128906, 0.025632858276367188, 0.02958202362060547, 0.03353118896484375, 0.03748035430908203, 0.04142951965332031, 0.045378684997558594, 0.049327850341796875, 0.053277015686035156, 0.05722618103027344, 0.06117534637451172, 0.06512451171875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 6.0, 21.0, 21.0, 24.0, 37.0, 41.0, 86.0, 89.0, 109.0, 116.0, 121.0, 94.0, 68.0, 43.0, 33.0, 28.0, 16.0, 13.0, 10.0, 6.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1446533203125, -0.14107513427734375, -0.1374969482421875, -0.13391876220703125, -0.130340576171875, -0.12676239013671875, -0.1231842041015625, -0.11960601806640625, -0.11602783203125, -0.11244964599609375, -0.1088714599609375, -0.10529327392578125, -0.101715087890625, -0.09813690185546875, -0.0945587158203125, -0.09098052978515625, -0.08740234375, -0.08382415771484375, -0.0802459716796875, -0.07666778564453125, -0.073089599609375, -0.06951141357421875, -0.0659332275390625, -0.06235504150390625, -0.05877685546875, -0.05519866943359375, -0.0516204833984375, -0.04804229736328125, -0.044464111328125, -0.04088592529296875, -0.0373077392578125, -0.03372955322265625, -0.0301513671875, -0.02657318115234375, -0.0229949951171875, -0.01941680908203125, -0.015838623046875, -0.01226043701171875, -0.0086822509765625, -0.00510406494140625, -0.00152587890625, 0.00205230712890625, 0.0056304931640625, 0.00920867919921875, 0.012786865234375, 0.01636505126953125, 0.0199432373046875, 0.02352142333984375, 0.027099609375, 0.03067779541015625, 0.0342559814453125, 0.03783416748046875, 0.041412353515625, 0.04499053955078125, 0.0485687255859375, 0.05214691162109375, 0.05572509765625, 0.05930328369140625, 0.0628814697265625, 0.06645965576171875, 0.070037841796875, 0.07361602783203125, 0.0771942138671875, 0.08077239990234375, 0.0843505859375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 23.0, 104.0, 609.0, 234.0, 36.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.323984146118164, -13.018522262573242, -12.71306037902832, -12.407598495483398, -12.102136611938477, -11.796674728393555, -11.491212844848633, -11.185750961303711, -10.880289077758789, -10.574827194213867, -10.269365310668945, -9.963903427124023, -9.658441543579102, -9.35297966003418, -9.047517776489258, -8.742055892944336, -8.436594009399414, -8.131132125854492, -7.82567024230957, -7.520208358764648, -7.214746475219727, -6.909284591674805, -6.603822708129883, -6.298360824584961, -5.992897987365723, -5.687436103820801, -5.381974220275879, -5.076512336730957, -4.771050453186035, -4.465588569641113, -4.160126686096191, -3.8546645641326904, -3.5492029190063477, -3.243741035461426, -2.938279151916504, -2.632817268371582, -2.32735538482666, -2.0218935012817383, -1.7164313793182373, -1.4109694957733154, -1.1055076122283936, -0.8000457286834717, -0.49458378553390503, -0.18912184238433838, 0.1163400411605835, 0.42180192470550537, 0.7272639274597168, 1.0327258110046387, 1.3381876945495605, 1.6436495780944824, 1.9491114616394043, 2.254573345184326, 2.560035228729248, 2.86549711227417, 3.170959234237671, 3.4764211177825928, 3.7818830013275146, 4.087345123291016, 4.3928070068359375, 4.698268890380859, 5.003730773925781, 5.309192657470703, 5.614654541015625, 5.920116424560547, 6.225578308105469]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 5.0, 3.0, 3.0, 7.0, 10.0, 13.0, 7.0, 17.0, 29.0, 27.0, 41.0, 33.0, 47.0, 50.0, 50.0, 68.0, 63.0, 96.0, 74.0, 54.0, 44.0, 46.0, 48.0, 31.0, 26.0, 23.0, 25.0, 13.0, 14.0, 10.0, 11.0, 7.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.590027332305908, -2.511993408203125, -2.433959484100342, -2.3559253215789795, -2.2778913974761963, -2.199857473373413, -2.12182354927063, -2.0437896251678467, -1.965755581855774, -1.8877216577529907, -1.809687614440918, -1.7316536903381348, -1.6536197662353516, -1.5755857229232788, -1.4975517988204956, -1.4195177555084229, -1.3414838314056396, -1.2634499073028564, -1.1854158639907837, -1.1073819398880005, -1.0293478965759277, -0.9513139724731445, -0.8732800483703613, -0.7952460646629333, -0.7172120809555054, -0.6391780972480774, -0.5611441135406494, -0.4831101894378662, -0.40507620573043823, -0.32704222202301025, -0.24900826811790466, -0.17097431421279907, -0.0929403305053711, -0.014906361699104309, 0.06312760710716248, 0.14116157591342926, 0.21919554471969604, 0.297229528427124, 0.3752634823322296, 0.4532974362373352, 0.5313314199447632, 0.6093654036521912, 0.6873993873596191, 0.7654333114624023, 0.8434672951698303, 0.9215012788772583, 0.9995352029800415, 1.0775692462921143, 1.1556031703948975, 1.2336370944976807, 1.3116711378097534, 1.3897050619125366, 1.4677391052246094, 1.5457730293273926, 1.6238069534301758, 1.701840877532959, 1.7798749208450317, 1.857908844947815, 1.9359428882598877, 2.013976812362671, 2.092010736465454, 2.1700448989868164, 2.2480788230895996, 2.326112747192383, 2.404146671295166]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 13.0, 10.0, 20.0, 50.0, 105.0, 201.0, 481.0, 1217.0, 3348.0, 11409.0, 63653.0, 3382464.0, 688904.0, 31541.0, 7192.0, 2179.0, 833.0, 337.0, 145.0, 87.0, 47.0, 25.0, 14.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.280517578125, -0.2742595672607422, -0.2680015563964844, -0.26174354553222656, -0.25548553466796875, -0.24922752380371094, -0.24296951293945312, -0.2367115020751953, -0.2304534912109375, -0.2241954803466797, -0.21793746948242188, -0.21167945861816406, -0.20542144775390625, -0.19916343688964844, -0.19290542602539062, -0.1866474151611328, -0.180389404296875, -0.1741313934326172, -0.16787338256835938, -0.16161537170410156, -0.15535736083984375, -0.14909934997558594, -0.14284133911132812, -0.1365833282470703, -0.1303253173828125, -0.12406730651855469, -0.11780929565429688, -0.11155128479003906, -0.10529327392578125, -0.09903526306152344, -0.09277725219726562, -0.08651924133300781, -0.08026123046875, -0.07400321960449219, -0.06774520874023438, -0.06148719787597656, -0.05522918701171875, -0.04897117614746094, -0.042713165283203125, -0.03645515441894531, -0.0301971435546875, -0.023939132690429688, -0.017681121826171875, -0.011423110961914062, -0.00516510009765625, 0.0010929107666015625, 0.007350921630859375, 0.013608932495117188, 0.019866943359375, 0.026124954223632812, 0.032382965087890625, 0.03864097595214844, 0.04489898681640625, 0.05115699768066406, 0.057415008544921875, 0.06367301940917969, 0.0699310302734375, 0.07618904113769531, 0.08244705200195312, 0.08870506286621094, 0.09496307373046875, 0.10122108459472656, 0.10747909545898438, 0.11373710632324219, 0.1199951171875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 5.0, 10.0, 4.0, 6.0, 12.0, 12.0, 16.0, 19.0, 21.0, 30.0, 29.0, 32.0, 36.0, 39.0, 45.0, 51.0, 58.0, 59.0, 44.0, 55.0, 61.0, 49.0, 52.0, 38.0, 35.0, 28.0, 26.0, 27.0, 23.0, 17.0, 12.0, 11.0, 10.0, 3.0, 5.0, 6.0, 6.0, 1.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.08441162109375, -0.08186721801757812, -0.07932281494140625, -0.07677841186523438, -0.0742340087890625, -0.07168960571289062, -0.06914520263671875, -0.06660079956054688, -0.064056396484375, -0.061511993408203125, -0.05896759033203125, -0.056423187255859375, -0.0538787841796875, -0.051334381103515625, -0.04878997802734375, -0.046245574951171875, -0.043701171875, -0.041156768798828125, -0.03861236572265625, -0.036067962646484375, -0.0335235595703125, -0.030979156494140625, -0.02843475341796875, -0.025890350341796875, -0.023345947265625, -0.020801544189453125, -0.01825714111328125, -0.015712738037109375, -0.0131683349609375, -0.010623931884765625, -0.00807952880859375, -0.005535125732421875, -0.00299072265625, -0.000446319580078125, 0.00209808349609375, 0.004642486572265625, 0.0071868896484375, 0.009731292724609375, 0.01227569580078125, 0.014820098876953125, 0.017364501953125, 0.019908905029296875, 0.02245330810546875, 0.024997711181640625, 0.0275421142578125, 0.030086517333984375, 0.03263092041015625, 0.035175323486328125, 0.0377197265625, 0.040264129638671875, 0.04280853271484375, 0.045352935791015625, 0.0478973388671875, 0.050441741943359375, 0.05298614501953125, 0.055530548095703125, 0.058074951171875, 0.060619354248046875, 0.06316375732421875, 0.06570816040039062, 0.0682525634765625, 0.07079696655273438, 0.07334136962890625, 0.07588577270507812, 0.07843017578125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 8.0, 9.0, 15.0, 32.0, 43.0, 71.0, 99.0, 182.0, 309.0, 639.0, 2350.0, 20471.0, 3098539.0, 1052013.0, 16337.0, 2015.0, 541.0, 270.0, 146.0, 90.0, 41.0, 26.0, 11.0, 11.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31689453125, -0.3055572509765625, -0.294219970703125, -0.2828826904296875, -0.27154541015625, -0.2602081298828125, -0.248870849609375, -0.2375335693359375, -0.2261962890625, -0.2148590087890625, -0.203521728515625, -0.1921844482421875, -0.18084716796875, -0.1695098876953125, -0.158172607421875, -0.1468353271484375, -0.135498046875, -0.1241607666015625, -0.112823486328125, -0.1014862060546875, -0.09014892578125, -0.0788116455078125, -0.067474365234375, -0.0561370849609375, -0.0447998046875, -0.0334625244140625, -0.022125244140625, -0.0107879638671875, 0.00054931640625, 0.0118865966796875, 0.023223876953125, 0.0345611572265625, 0.0458984375, 0.0572357177734375, 0.068572998046875, 0.0799102783203125, 0.09124755859375, 0.1025848388671875, 0.113922119140625, 0.1252593994140625, 0.1365966796875, 0.1479339599609375, 0.159271240234375, 0.1706085205078125, 0.18194580078125, 0.1932830810546875, 0.204620361328125, 0.2159576416015625, 0.227294921875, 0.2386322021484375, 0.249969482421875, 0.2613067626953125, 0.27264404296875, 0.2839813232421875, 0.295318603515625, 0.3066558837890625, 0.3179931640625, 0.3293304443359375, 0.340667724609375, 0.3520050048828125, 0.36334228515625, 0.3746795654296875, 0.386016845703125, 0.3973541259765625, 0.40869140625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 8.0, 6.0, 8.0, 21.0, 28.0, 34.0, 71.0, 142.0, 415.0, 1788.0, 1055.0, 249.0, 84.0, 53.0, 29.0, 28.0, 18.0, 7.0, 9.0, 9.0, 5.0, 7.0, 3.0, 0.0, 3.0], "bins": [-0.431396484375, -0.42254638671875, -0.4136962890625, -0.40484619140625, -0.39599609375, -0.38714599609375, -0.3782958984375, -0.36944580078125, -0.360595703125, -0.35174560546875, -0.3428955078125, -0.33404541015625, -0.3251953125, -0.31634521484375, -0.3074951171875, -0.29864501953125, -0.289794921875, -0.28094482421875, -0.2720947265625, -0.26324462890625, -0.25439453125, -0.24554443359375, -0.2366943359375, -0.22784423828125, -0.218994140625, -0.21014404296875, -0.2012939453125, -0.19244384765625, -0.18359375, -0.17474365234375, -0.1658935546875, -0.15704345703125, -0.148193359375, -0.13934326171875, -0.1304931640625, -0.12164306640625, -0.11279296875, -0.10394287109375, -0.0950927734375, -0.08624267578125, -0.077392578125, -0.06854248046875, -0.0596923828125, -0.05084228515625, -0.0419921875, -0.03314208984375, -0.0242919921875, -0.01544189453125, -0.006591796875, 0.00225830078125, 0.0111083984375, 0.01995849609375, 0.02880859375, 0.03765869140625, 0.0465087890625, 0.05535888671875, 0.064208984375, 0.07305908203125, 0.0819091796875, 0.09075927734375, 0.099609375, 0.10845947265625, 0.1173095703125, 0.12615966796875, 0.135009765625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 8.0, 11.0, 15.0, 52.0, 191.0, 349.0, 245.0, 81.0, 33.0, 3.0, 6.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9845123291015625, -2.8955163955688477, -2.806520462036133, -2.717524528503418, -2.628528594970703, -2.539532423019409, -2.4505364894866943, -2.3615405559539795, -2.2725446224212646, -2.18354868888855, -2.094552755355835, -2.00555682182312, -1.9165607690811157, -1.8275648355484009, -1.7385687828063965, -1.6495728492736816, -1.5605769157409668, -1.471580982208252, -1.382585048675537, -1.2935889959335327, -1.2045930624008179, -1.115597128868103, -1.0266010761260986, -0.9376051425933838, -0.848609209060669, -0.7596132755279541, -0.6706172823905945, -0.5816212892532349, -0.49262535572052, -0.4036293923854828, -0.31463342905044556, -0.22563743591308594, -0.1366415023803711, -0.04764553904533386, 0.04135042428970337, 0.1303463876247406, 0.21934235095977783, 0.30833831429481506, 0.3973342776298523, 0.4863302707672119, 0.5753262042999268, 0.6643221378326416, 0.7533181309700012, 0.8423141241073608, 0.9313100576400757, 1.0203059911727905, 1.109302043914795, 1.1982979774475098, 1.2872939109802246, 1.3762898445129395, 1.4652857780456543, 1.5542818307876587, 1.6432777643203735, 1.7322736978530884, 1.8212697505950928, 1.9102656841278076, 1.9992616176605225, 2.0882575511932373, 2.177253484725952, 2.266249418258667, 2.355245590209961, 2.444241523742676, 2.5332374572753906, 2.6222333908081055, 2.7112293243408203]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 7.0, 8.0, 8.0, 29.0, 34.0, 40.0, 70.0, 68.0, 80.0, 79.0, 93.0, 82.0, 80.0, 59.0, 59.0, 45.0, 25.0, 29.0, 40.0, 21.0, 11.0, 12.0, 6.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.842083215713501, -1.791167974472046, -1.7402528524398804, -1.6893376111984253, -1.6384224891662598, -1.5875072479248047, -1.5365921258926392, -1.485676884651184, -1.4347617626190186, -1.3838465213775635, -1.332931399345398, -1.2820161581039429, -1.2311010360717773, -1.1801857948303223, -1.1292706727981567, -1.0783554315567017, -1.0274403095245361, -0.9765251278877258, -0.9256099462509155, -0.8746947646141052, -0.8237795829772949, -0.7728643417358398, -0.7219492197036743, -0.6710339784622192, -0.6201187372207642, -0.5692035555839539, -0.5182883739471436, -0.46737319231033325, -0.41645801067352295, -0.36554279923439026, -0.31462761759757996, -0.26371243596076965, -0.21279728412628174, -0.16188210248947144, -0.11096691340208054, -0.060051724314689636, -0.009136542677879333, 0.04177865386009216, 0.09269383549690247, 0.14360901713371277, 0.19452419877052307, 0.24543938040733337, 0.2963545620441437, 0.34726977348327637, 0.39818495512008667, 0.449100136756897, 0.5000153183937073, 0.5509305000305176, 0.6018456816673279, 0.6527608633041382, 0.7036760449409485, 0.7545912265777588, 0.8055064082145691, 0.8564215898513794, 0.9073368310928345, 0.958251953125, 1.009167194366455, 1.0600824356079102, 1.1109975576400757, 1.1619127988815308, 1.2128279209136963, 1.2637431621551514, 1.314658284187317, 1.365573525428772, 1.4164886474609375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 5.0, 4.0, 11.0, 11.0, 40.0, 39.0, 74.0, 131.0, 216.0, 389.0, 715.0, 1368.0, 2667.0, 5596.0, 12384.0, 29179.0, 72888.0, 181220.0, 333085.0, 238954.0, 99281.0, 39505.0, 16407.0, 7217.0, 3397.0, 1700.0, 894.0, 495.0, 260.0, 175.0, 90.0, 66.0, 35.0, 18.0, 11.0, 14.0, 4.0, 2.0, 5.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1134033203125, -0.11013221740722656, -0.10686111450195312, -0.10359001159667969, -0.10031890869140625, -0.09704780578613281, -0.09377670288085938, -0.09050559997558594, -0.0872344970703125, -0.08396339416503906, -0.08069229125976562, -0.07742118835449219, -0.07415008544921875, -0.07087898254394531, -0.06760787963867188, -0.06433677673339844, -0.061065673828125, -0.05779457092285156, -0.054523468017578125, -0.05125236511230469, -0.04798126220703125, -0.04471015930175781, -0.041439056396484375, -0.03816795349121094, -0.0348968505859375, -0.03162574768066406, -0.028354644775390625, -0.025083541870117188, -0.02181243896484375, -0.018541336059570312, -0.015270233154296875, -0.011999130249023438, -0.00872802734375, -0.0054569244384765625, -0.002185821533203125, 0.0010852813720703125, 0.00435638427734375, 0.0076274871826171875, 0.010898590087890625, 0.014169692993164062, 0.0174407958984375, 0.020711898803710938, 0.023983001708984375, 0.027254104614257812, 0.03052520751953125, 0.03379631042480469, 0.037067413330078125, 0.04033851623535156, 0.043609619140625, 0.04688072204589844, 0.050151824951171875, 0.05342292785644531, 0.05669403076171875, 0.05996513366699219, 0.06323623657226562, 0.06650733947753906, 0.0697784423828125, 0.07304954528808594, 0.07632064819335938, 0.07959175109863281, 0.08286285400390625, 0.08613395690917969, 0.08940505981445312, 0.09267616271972656, 0.095947265625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 7.0, 7.0, 6.0, 6.0, 11.0, 8.0, 13.0, 19.0, 17.0, 37.0, 34.0, 38.0, 39.0, 51.0, 54.0, 62.0, 47.0, 61.0, 45.0, 62.0, 49.0, 48.0, 45.0, 46.0, 34.0, 27.0, 32.0, 19.0, 20.0, 19.0, 15.0, 3.0, 6.0, 4.0, 4.0, 4.0, 1.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.10406494140625, -0.1013784408569336, -0.09869194030761719, -0.09600543975830078, -0.09331893920898438, -0.09063243865966797, -0.08794593811035156, -0.08525943756103516, -0.08257293701171875, -0.07988643646240234, -0.07719993591308594, -0.07451343536376953, -0.07182693481445312, -0.06914043426513672, -0.06645393371582031, -0.0637674331665039, -0.0610809326171875, -0.058394432067871094, -0.05570793151855469, -0.05302143096923828, -0.050334930419921875, -0.04764842987060547, -0.04496192932128906, -0.042275428771972656, -0.03958892822265625, -0.036902427673339844, -0.03421592712402344, -0.03152942657470703, -0.028842926025390625, -0.02615642547607422, -0.023469924926757812, -0.020783424377441406, -0.018096923828125, -0.015410423278808594, -0.012723922729492188, -0.010037422180175781, -0.007350921630859375, -0.004664421081542969, -0.0019779205322265625, 0.0007085800170898438, 0.00339508056640625, 0.006081581115722656, 0.008768081665039062, 0.011454582214355469, 0.014141082763671875, 0.01682758331298828, 0.019514083862304688, 0.022200584411621094, 0.0248870849609375, 0.027573585510253906, 0.030260086059570312, 0.03294658660888672, 0.035633087158203125, 0.03831958770751953, 0.04100608825683594, 0.043692588806152344, 0.04637908935546875, 0.049065589904785156, 0.05175209045410156, 0.05443859100341797, 0.057125091552734375, 0.05981159210205078, 0.06249809265136719, 0.0651845932006836, 0.06787109375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 4.0, 6.0, 7.0, 11.0, 7.0, 22.0, 17.0, 35.0, 52.0, 76.0, 89.0, 164.0, 225.0, 374.0, 682.0, 1386.0, 3203.0, 10409.0, 58334.0, 563240.0, 357691.0, 39267.0, 7865.0, 2538.0, 1174.0, 593.0, 371.0, 230.0, 135.0, 99.0, 63.0, 43.0, 45.0, 34.0, 18.0, 11.0, 10.0, 8.0, 5.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2156982421875, -0.20848464965820312, -0.20127105712890625, -0.19405746459960938, -0.1868438720703125, -0.17963027954101562, -0.17241668701171875, -0.16520309448242188, -0.157989501953125, -0.15077590942382812, -0.14356231689453125, -0.13634872436523438, -0.1291351318359375, -0.12192153930664062, -0.11470794677734375, -0.10749435424804688, -0.10028076171875, -0.09306716918945312, -0.08585357666015625, -0.07863998413085938, -0.0714263916015625, -0.06421279907226562, -0.05699920654296875, -0.049785614013671875, -0.042572021484375, -0.035358428955078125, -0.02814483642578125, -0.020931243896484375, -0.0137176513671875, -0.006504058837890625, 0.00070953369140625, 0.007923126220703125, 0.01513671875, 0.022350311279296875, 0.02956390380859375, 0.036777496337890625, 0.0439910888671875, 0.051204681396484375, 0.05841827392578125, 0.06563186645507812, 0.072845458984375, 0.08005905151367188, 0.08727264404296875, 0.09448623657226562, 0.1016998291015625, 0.10891342163085938, 0.11612701416015625, 0.12334060668945312, 0.13055419921875, 0.13776779174804688, 0.14498138427734375, 0.15219497680664062, 0.1594085693359375, 0.16662216186523438, 0.17383575439453125, 0.18104934692382812, 0.188262939453125, 0.19547653198242188, 0.20269012451171875, 0.20990371704101562, 0.2171173095703125, 0.22433090209960938, 0.23154449462890625, 0.23875808715820312, 0.2459716796875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 3.0, 3.0, 7.0, 3.0, 8.0, 10.0, 13.0, 17.0, 21.0, 17.0, 25.0, 22.0, 28.0, 37.0, 38.0, 49.0, 49.0, 55.0, 57.0, 41.0, 48.0, 55.0, 40.0, 45.0, 42.0, 35.0, 39.0, 27.0, 21.0, 18.0, 26.0, 20.0, 10.0, 9.0, 13.0, 11.0, 6.0, 7.0, 7.0, 8.0, 1.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.35595703125, -0.3453941345214844, -0.33483123779296875, -0.3242683410644531, -0.3137054443359375, -0.3031425476074219, -0.29257965087890625, -0.2820167541503906, -0.271453857421875, -0.2608909606933594, -0.25032806396484375, -0.23976516723632812, -0.2292022705078125, -0.21863937377929688, -0.20807647705078125, -0.19751358032226562, -0.18695068359375, -0.17638778686523438, -0.16582489013671875, -0.15526199340820312, -0.1446990966796875, -0.13413619995117188, -0.12357330322265625, -0.11301040649414062, -0.102447509765625, -0.09188461303710938, -0.08132171630859375, -0.07075881958007812, -0.0601959228515625, -0.049633026123046875, -0.03907012939453125, -0.028507232666015625, -0.0179443359375, -0.007381439208984375, 0.00318145751953125, 0.013744354248046875, 0.0243072509765625, 0.034870147705078125, 0.04543304443359375, 0.055995941162109375, 0.066558837890625, 0.07712173461914062, 0.08768463134765625, 0.09824752807617188, 0.1088104248046875, 0.11937332153320312, 0.12993621826171875, 0.14049911499023438, 0.15106201171875, 0.16162490844726562, 0.17218780517578125, 0.18275070190429688, 0.1933135986328125, 0.20387649536132812, 0.21443939208984375, 0.22500228881835938, 0.235565185546875, 0.24612808227539062, 0.25669097900390625, 0.2672538757324219, 0.2778167724609375, 0.2883796691894531, 0.29894256591796875, 0.3095054626464844, 0.320068359375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 5.0, 7.0, 7.0, 13.0, 13.0, 22.0, 22.0, 42.0, 63.0, 103.0, 183.0, 348.0, 692.0, 1590.0, 4943.0, 29920.0, 834847.0, 160163.0, 10663.0, 2765.0, 1021.0, 483.0, 237.0, 142.0, 84.0, 48.0, 43.0, 22.0, 15.0, 14.0, 7.0, 12.0, 4.0, 4.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.13232421875, -0.12772178649902344, -0.12311935424804688, -0.11851692199707031, -0.11391448974609375, -0.10931205749511719, -0.10470962524414062, -0.10010719299316406, -0.0955047607421875, -0.09090232849121094, -0.08629989624023438, -0.08169746398925781, -0.07709503173828125, -0.07249259948730469, -0.06789016723632812, -0.06328773498535156, -0.058685302734375, -0.05408287048339844, -0.049480438232421875, -0.04487800598144531, -0.04027557373046875, -0.03567314147949219, -0.031070709228515625, -0.026468276977539062, -0.0218658447265625, -0.017263412475585938, -0.012660980224609375, -0.008058547973632812, -0.00345611572265625, 0.0011463165283203125, 0.005748748779296875, 0.010351181030273438, 0.01495361328125, 0.019556045532226562, 0.024158477783203125, 0.028760910034179688, 0.03336334228515625, 0.03796577453613281, 0.042568206787109375, 0.04717063903808594, 0.0517730712890625, 0.05637550354003906, 0.060977935791015625, 0.06558036804199219, 0.07018280029296875, 0.07478523254394531, 0.07938766479492188, 0.08399009704589844, 0.088592529296875, 0.09319496154785156, 0.09779739379882812, 0.10239982604980469, 0.10700225830078125, 0.11160469055175781, 0.11620712280273438, 0.12080955505371094, 0.1254119873046875, 0.13001441955566406, 0.13461685180664062, 0.1392192840576172, 0.14382171630859375, 0.1484241485595703, 0.15302658081054688, 0.15762901306152344, 0.1622314453125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 1.0, 12.0, 9.0, 44.0, 61.0, 167.0, 216.0, 231.0, 140.0, 57.0, 23.0, 16.0, 7.0, 2.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.439188003540039e-05, -3.289896994829178e-05, -3.1406059861183167e-05, -2.9913149774074554e-05, -2.8420239686965942e-05, -2.692732959985733e-05, -2.5434419512748718e-05, -2.3941509425640106e-05, -2.2448599338531494e-05, -2.0955689251422882e-05, -1.946277916431427e-05, -1.7969869077205658e-05, -1.6476958990097046e-05, -1.4984048902988434e-05, -1.3491138815879822e-05, -1.199822872877121e-05, -1.0505318641662598e-05, -9.012408554553986e-06, -7.5194984674453735e-06, -6.0265883803367615e-06, -4.533678293228149e-06, -3.0407682061195374e-06, -1.5478581190109253e-06, -5.494803190231323e-08, 1.4379620552062988e-06, 2.930872142314911e-06, 4.423782229423523e-06, 5.916692316532135e-06, 7.409602403640747e-06, 8.902512490749359e-06, 1.0395422577857971e-05, 1.1888332664966583e-05, 1.3381242752075195e-05, 1.4874152839183807e-05, 1.636706292629242e-05, 1.785997301340103e-05, 1.9352883100509644e-05, 2.0845793187618256e-05, 2.2338703274726868e-05, 2.383161336183548e-05, 2.5324523448944092e-05, 2.6817433536052704e-05, 2.8310343623161316e-05, 2.9803253710269928e-05, 3.129616379737854e-05, 3.278907388448715e-05, 3.4281983971595764e-05, 3.5774894058704376e-05, 3.726780414581299e-05, 3.87607142329216e-05, 4.025362432003021e-05, 4.1746534407138824e-05, 4.3239444494247437e-05, 4.473235458135605e-05, 4.622526466846466e-05, 4.771817475557327e-05, 4.9211084842681885e-05, 5.07039949297905e-05, 5.219690501689911e-05, 5.368981510400772e-05, 5.518272519111633e-05, 5.6675635278224945e-05, 5.816854536533356e-05, 5.966145545244217e-05, 6.115436553955078e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 3.0, 12.0, 7.0, 13.0, 12.0, 25.0, 33.0, 61.0, 82.0, 151.0, 293.0, 569.0, 1444.0, 4317.0, 20325.0, 402247.0, 586413.0, 24950.0, 4696.0, 1516.0, 633.0, 283.0, 166.0, 78.0, 72.0, 52.0, 40.0, 22.0, 5.0, 8.0, 4.0, 6.0, 6.0, 2.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1329345703125, -0.12924671173095703, -0.12555885314941406, -0.1218709945678711, -0.11818313598632812, -0.11449527740478516, -0.11080741882324219, -0.10711956024169922, -0.10343170166015625, -0.09974384307861328, -0.09605598449707031, -0.09236812591552734, -0.08868026733398438, -0.0849924087524414, -0.08130455017089844, -0.07761669158935547, -0.0739288330078125, -0.07024097442626953, -0.06655311584472656, -0.0628652572631836, -0.059177398681640625, -0.055489540100097656, -0.05180168151855469, -0.04811382293701172, -0.04442596435546875, -0.04073810577392578, -0.03705024719238281, -0.033362388610839844, -0.029674530029296875, -0.025986671447753906, -0.022298812866210938, -0.01861095428466797, -0.014923095703125, -0.011235237121582031, -0.0075473785400390625, -0.0038595199584960938, -0.000171661376953125, 0.0035161972045898438, 0.0072040557861328125, 0.010891914367675781, 0.01457977294921875, 0.01826763153076172, 0.021955490112304688, 0.025643348693847656, 0.029331207275390625, 0.033019065856933594, 0.03670692443847656, 0.04039478302001953, 0.0440826416015625, 0.04777050018310547, 0.05145835876464844, 0.055146217346191406, 0.058834075927734375, 0.06252193450927734, 0.06620979309082031, 0.06989765167236328, 0.07358551025390625, 0.07727336883544922, 0.08096122741699219, 0.08464908599853516, 0.08833694458007812, 0.0920248031616211, 0.09571266174316406, 0.09940052032470703, 0.10308837890625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 1.0, 2.0, 10.0, 6.0, 4.0, 15.0, 24.0, 37.0, 41.0, 76.0, 72.0, 99.0, 132.0, 129.0, 118.0, 82.0, 44.0, 37.0, 21.0, 17.0, 11.0, 4.0, 5.0, 6.0, 3.0, 2.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.153564453125, -0.14939594268798828, -0.14522743225097656, -0.14105892181396484, -0.13689041137695312, -0.1327219009399414, -0.1285533905029297, -0.12438488006591797, -0.12021636962890625, -0.11604785919189453, -0.11187934875488281, -0.1077108383178711, -0.10354232788085938, -0.09937381744384766, -0.09520530700683594, -0.09103679656982422, -0.0868682861328125, -0.08269977569580078, -0.07853126525878906, -0.07436275482177734, -0.07019424438476562, -0.0660257339477539, -0.06185722351074219, -0.05768871307373047, -0.05352020263671875, -0.04935169219970703, -0.04518318176269531, -0.041014671325683594, -0.036846160888671875, -0.032677650451660156, -0.028509140014648438, -0.02434062957763672, -0.020172119140625, -0.01600360870361328, -0.011835098266601562, -0.007666587829589844, -0.003498077392578125, 0.0006704330444335938, 0.0048389434814453125, 0.009007453918457031, 0.01317596435546875, 0.01734447479248047, 0.021512985229492188, 0.025681495666503906, 0.029850006103515625, 0.034018516540527344, 0.03818702697753906, 0.04235553741455078, 0.0465240478515625, 0.05069255828857422, 0.05486106872558594, 0.059029579162597656, 0.06319808959960938, 0.0673666000366211, 0.07153511047363281, 0.07570362091064453, 0.07987213134765625, 0.08404064178466797, 0.08820915222167969, 0.0923776626586914, 0.09654617309570312, 0.10071468353271484, 0.10488319396972656, 0.10905170440673828, 0.11322021484375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 7.0, 20.0, 12.0, 43.0, 112.0, 209.0, 290.0, 188.0, 78.0, 22.0, 14.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6796948909759521, -1.5936390161514282, -1.5075831413269043, -1.4215272665023804, -1.3354713916778564, -1.2494155168533325, -1.1633596420288086, -1.0773037672042847, -0.9912478923797607, -0.9051920175552368, -0.8191361427307129, -0.733080267906189, -0.647024393081665, -0.5609685182571411, -0.4749126434326172, -0.38885676860809326, -0.30280089378356934, -0.2167450189590454, -0.13068914413452148, -0.04463326930999756, 0.04142260551452637, 0.1274784803390503, 0.21353435516357422, 0.29959022998809814, 0.38564610481262207, 0.471701979637146, 0.5577578544616699, 0.6438137292861938, 0.7298696041107178, 0.8159254789352417, 0.9019813537597656, 0.9880372285842896, 1.0740928649902344, 1.1601487398147583, 1.2462046146392822, 1.3322604894638062, 1.41831636428833, 1.504372239112854, 1.590428113937378, 1.6764839887619019, 1.7625398635864258, 1.8485957384109497, 1.9346516132354736, 2.020707607269287, 2.1067633628845215, 2.192819118499756, 2.2788751125335693, 2.364931106567383, 2.450986862182617, 2.5370426177978516, 2.623098611831665, 2.7091546058654785, 2.795210361480713, 2.8812661170959473, 2.9673221111297607, 3.053378105163574, 3.1394338607788086, 3.225489616394043, 3.3115456104278564, 3.39760160446167, 3.4836573600769043, 3.5697131156921387, 3.655769109725952, 3.7418251037597656, 3.827880859375]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 5.0, 4.0, 5.0, 12.0, 5.0, 14.0, 16.0, 14.0, 23.0, 21.0, 27.0, 31.0, 31.0, 48.0, 49.0, 39.0, 58.0, 56.0, 72.0, 78.0, 64.0, 55.0, 42.0, 35.0, 37.0, 27.0, 22.0, 28.0, 18.0, 15.0, 18.0, 9.0, 9.0, 9.0, 6.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.933605670928955, -1.8831411600112915, -1.8326765298843384, -1.7822120189666748, -1.7317475080490112, -1.6812829971313477, -1.6308183670043945, -1.580353856086731, -1.5298893451690674, -1.4794248342514038, -1.4289602041244507, -1.378495693206787, -1.3280311822891235, -1.27756667137146, -1.2271020412445068, -1.1766375303268433, -1.1261730194091797, -1.0757085084915161, -1.025243878364563, -0.9747793674468994, -0.9243148565292358, -0.8738502860069275, -0.8233857154846191, -0.7729212045669556, -0.7224565744400024, -0.6719920039176941, -0.6215274930000305, -0.5710629224777222, -0.5205984115600586, -0.47013384103775024, -0.4196693003177643, -0.3692047595977783, -0.31874024868011475, -0.2682757079601288, -0.21781116724014282, -0.16734661161899567, -0.1168820708990097, -0.06641751527786255, -0.015952974557876587, 0.034511566162109375, 0.08497610688209534, 0.1354406476020813, 0.18590518832206726, 0.23636974394321442, 0.2868342995643616, 0.33729884028434753, 0.3877633810043335, 0.43822792172431946, 0.4886924624443054, 0.5391570329666138, 0.5896215438842773, 0.6400861144065857, 0.6905506253242493, 0.7410151958465576, 0.7914797067642212, 0.8419442772865295, 0.8924088478088379, 0.9428734183311462, 0.9933379292488098, 1.0438024997711182, 1.0942670106887817, 1.1447315216064453, 1.1951961517333984, 1.245660662651062, 1.2961251735687256]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 0.0, 3.0, 0.0, 2.0, 4.0, 2.0, 9.0, 11.0, 34.0, 77.0, 165.0, 434.0, 4109786.0, 83063.0, 386.0, 162.0, 76.0, 38.0, 17.0, 15.0, 5.0, 1.0, 0.0, 4.0], "bins": [-4.3203125, -4.23870849609375, -4.1571044921875, -4.07550048828125, -3.993896484375, -3.91229248046875, -3.8306884765625, -3.74908447265625, -3.66748046875, -3.58587646484375, -3.5042724609375, -3.42266845703125, -3.341064453125, -3.25946044921875, -3.1778564453125, -3.09625244140625, -3.0146484375, -2.93304443359375, -2.8514404296875, -2.76983642578125, -2.688232421875, -2.60662841796875, -2.5250244140625, -2.44342041015625, -2.36181640625, -2.28021240234375, -2.1986083984375, -2.11700439453125, -2.035400390625, -1.95379638671875, -1.8721923828125, -1.79058837890625, -1.708984375, -1.62738037109375, -1.5457763671875, -1.46417236328125, -1.382568359375, -1.30096435546875, -1.2193603515625, -1.13775634765625, -1.05615234375, -0.97454833984375, -0.8929443359375, -0.81134033203125, -0.729736328125, -0.64813232421875, -0.5665283203125, -0.48492431640625, -0.4033203125, -0.32171630859375, -0.2401123046875, -0.15850830078125, -0.076904296875, 0.00469970703125, 0.0863037109375, 0.16790771484375, 0.24951171875, 0.33111572265625, 0.4127197265625, 0.49432373046875, 0.575927734375, 0.65753173828125, 0.7391357421875, 0.82073974609375, 0.90234375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 7.0, 7.0, 13.0, 14.0, 19.0, 32.0, 43.0, 64.0, 70.0, 85.0, 95.0, 103.0, 95.0, 86.0, 83.0, 51.0, 50.0, 30.0, 27.0, 13.0, 11.0, 8.0, 4.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.228759765625, -0.22403812408447266, -0.2193164825439453, -0.21459484100341797, -0.20987319946289062, -0.20515155792236328, -0.20042991638183594, -0.1957082748413086, -0.19098663330078125, -0.1862649917602539, -0.18154335021972656, -0.17682170867919922, -0.17210006713867188, -0.16737842559814453, -0.1626567840576172, -0.15793514251708984, -0.1532135009765625, -0.14849185943603516, -0.1437702178955078, -0.13904857635498047, -0.13432693481445312, -0.12960529327392578, -0.12488365173339844, -0.1201620101928711, -0.11544036865234375, -0.1107187271118164, -0.10599708557128906, -0.10127544403076172, -0.09655380249023438, -0.09183216094970703, -0.08711051940917969, -0.08238887786865234, -0.077667236328125, -0.07294559478759766, -0.06822395324707031, -0.06350231170654297, -0.058780670166015625, -0.05405902862548828, -0.04933738708496094, -0.044615745544433594, -0.03989410400390625, -0.035172462463378906, -0.030450820922851562, -0.02572917938232422, -0.021007537841796875, -0.01628589630126953, -0.011564254760742188, -0.006842613220214844, -0.0021209716796875, 0.0026006698608398438, 0.0073223114013671875, 0.012043952941894531, 0.016765594482421875, 0.02148723602294922, 0.026208877563476562, 0.030930519104003906, 0.03565216064453125, 0.040373802185058594, 0.04509544372558594, 0.04981708526611328, 0.054538726806640625, 0.05926036834716797, 0.06398200988769531, 0.06870365142822266, 0.07342529296875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 9.0, 8.0, 15.0, 13.0, 13.0, 25.0, 27.0, 47.0, 58.0, 49.0, 74.0, 99.0, 205.0, 383.0, 958.0, 3157.0, 14919.0, 137126.0, 3871490.0, 145514.0, 14960.0, 3262.0, 1016.0, 385.0, 160.0, 86.0, 63.0, 46.0, 33.0, 24.0, 16.0, 14.0, 14.0, 8.0, 6.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.287353515625, -0.27926063537597656, -0.2711677551269531, -0.2630748748779297, -0.25498199462890625, -0.2468891143798828, -0.23879623413085938, -0.23070335388183594, -0.2226104736328125, -0.21451759338378906, -0.20642471313476562, -0.1983318328857422, -0.19023895263671875, -0.1821460723876953, -0.17405319213867188, -0.16596031188964844, -0.157867431640625, -0.14977455139160156, -0.14168167114257812, -0.1335887908935547, -0.12549591064453125, -0.11740303039550781, -0.10931015014648438, -0.10121726989746094, -0.0931243896484375, -0.08503150939941406, -0.07693862915039062, -0.06884574890136719, -0.06075286865234375, -0.05265998840332031, -0.044567108154296875, -0.03647422790527344, -0.02838134765625, -0.020288467407226562, -0.012195587158203125, -0.0041027069091796875, 0.00399017333984375, 0.012083053588867188, 0.020175933837890625, 0.028268814086914062, 0.0363616943359375, 0.04445457458496094, 0.052547454833984375, 0.06064033508300781, 0.06873321533203125, 0.07682609558105469, 0.08491897583007812, 0.09301185607910156, 0.101104736328125, 0.10919761657714844, 0.11729049682617188, 0.1253833770751953, 0.13347625732421875, 0.1415691375732422, 0.14966201782226562, 0.15775489807128906, 0.1658477783203125, 0.17394065856933594, 0.18203353881835938, 0.1901264190673828, 0.19821929931640625, 0.2063121795654297, 0.21440505981445312, 0.22249794006347656, 0.2305908203125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 9.0, 6.0, 16.0, 16.0, 22.0, 55.0, 140.0, 581.0, 2210.0, 733.0, 161.0, 57.0, 34.0, 19.0, 6.0, 10.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52783203125, -0.5159759521484375, -0.504119873046875, -0.4922637939453125, -0.48040771484375, -0.4685516357421875, -0.456695556640625, -0.4448394775390625, -0.4329833984375, -0.4211273193359375, -0.409271240234375, -0.3974151611328125, -0.38555908203125, -0.3737030029296875, -0.361846923828125, -0.3499908447265625, -0.338134765625, -0.3262786865234375, -0.314422607421875, -0.3025665283203125, -0.29071044921875, -0.2788543701171875, -0.266998291015625, -0.2551422119140625, -0.2432861328125, -0.2314300537109375, -0.219573974609375, -0.2077178955078125, -0.19586181640625, -0.1840057373046875, -0.172149658203125, -0.1602935791015625, -0.1484375, -0.1365814208984375, -0.124725341796875, -0.1128692626953125, -0.10101318359375, -0.0891571044921875, -0.077301025390625, -0.0654449462890625, -0.0535888671875, -0.0417327880859375, -0.029876708984375, -0.0180206298828125, -0.00616455078125, 0.0056915283203125, 0.017547607421875, 0.0294036865234375, 0.041259765625, 0.0531158447265625, 0.064971923828125, 0.0768280029296875, 0.08868408203125, 0.1005401611328125, 0.112396240234375, 0.1242523193359375, 0.1361083984375, 0.1479644775390625, 0.159820556640625, 0.1716766357421875, 0.18353271484375, 0.1953887939453125, 0.207244873046875, 0.2191009521484375, 0.23095703125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 8.0, 4.0, 5.0, 18.0, 59.0, 159.0, 274.0, 281.0, 119.0, 40.0, 13.0, 7.0, 6.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.357764482498169, -3.2860474586486816, -3.2143301963806152, -3.142613172531128, -3.0708959102630615, -2.999178886413574, -2.927461624145508, -2.8557446002960205, -2.784027576446533, -2.712310552597046, -2.6405932903289795, -2.568876266479492, -2.497159004211426, -2.4254419803619385, -2.353724956512451, -2.2820076942443848, -2.2102904319763184, -2.138573408126831, -2.0668561458587646, -1.9951391220092773, -1.9234219789505005, -1.8517048358917236, -1.7799876928329468, -1.70827054977417, -1.6365535259246826, -1.5648363828659058, -1.493119239807129, -1.4214022159576416, -1.3496850728988647, -1.277967929840088, -1.206250786781311, -1.1345336437225342, -1.0628167390823364, -0.9910995960235596, -0.9193825125694275, -0.8476653695106506, -0.7759482860565186, -0.7042311429977417, -0.6325139999389648, -0.5607969164848328, -0.4890797734260559, -0.41736266016960144, -0.345645546913147, -0.2739284038543701, -0.20221129059791565, -0.13049417734146118, -0.058777034282684326, 0.012940049171447754, 0.08465719223022461, 0.15637430548667908, 0.22809143364429474, 0.2998085618019104, 0.37152567505836487, 0.44324278831481934, 0.5149599313735962, 0.5866770148277283, 0.6583941578865051, 0.730111300945282, 0.8018283843994141, 0.8735455274581909, 0.9452626705169678, 1.016979694366455, 1.0886969566345215, 1.1604139804840088, 1.2321311235427856]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 9.0, 7.0, 17.0, 13.0, 15.0, 16.0, 30.0, 27.0, 60.0, 59.0, 58.0, 78.0, 59.0, 81.0, 66.0, 72.0, 54.0, 61.0, 51.0, 40.0, 33.0, 23.0, 20.0, 8.0, 10.0, 10.0, 7.0, 5.0, 9.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0161917209625244, -0.9840325713157654, -0.9518734812736511, -0.9197143316268921, -0.8875552415847778, -0.8553960919380188, -0.8232369422912598, -0.7910778522491455, -0.7589187026023865, -0.7267595529556274, -0.6946004629135132, -0.6624413132667542, -0.6302821636199951, -0.5981230735778809, -0.5659639239311218, -0.5338047742843628, -0.5016456842422485, -0.4694865643978119, -0.43732744455337524, -0.4051682949066162, -0.37300917506217957, -0.3408500552177429, -0.3086909055709839, -0.27653178572654724, -0.2443726658821106, -0.21221354603767395, -0.1800544112920761, -0.14789527654647827, -0.11573615670204163, -0.08357703685760498, -0.05141790211200714, -0.019258767366409302, 0.012900352478027344, 0.045059479773044586, 0.07721860706806183, 0.10937773436307907, 0.1415368616580963, 0.17369598150253296, 0.2058551162481308, 0.23801425099372864, 0.2701733708381653, 0.30233249068260193, 0.3344916105270386, 0.3666507601737976, 0.39880988001823425, 0.4309689998626709, 0.46312814950942993, 0.4952872693538666, 0.5274463891983032, 0.5596055388450623, 0.5917646288871765, 0.6239237785339355, 0.6560828685760498, 0.6882420182228088, 0.7204011678695679, 0.7525602579116821, 0.7847194075584412, 0.8168785572052002, 0.8490376472473145, 0.8811967968940735, 0.9133559465408325, 0.9455150365829468, 0.9776741862297058, 1.0098333358764648, 1.041992425918579]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 7.0, 13.0, 16.0, 24.0, 51.0, 96.0, 144.0, 313.0, 677.0, 1870.0, 5682.0, 22398.0, 113191.0, 509296.0, 318125.0, 58050.0, 12844.0, 3553.0, 1195.0, 486.0, 224.0, 117.0, 72.0, 45.0, 22.0, 17.0, 7.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.261474609375, -0.25473594665527344, -0.24799728393554688, -0.2412586212158203, -0.23451995849609375, -0.2277812957763672, -0.22104263305664062, -0.21430397033691406, -0.2075653076171875, -0.20082664489746094, -0.19408798217773438, -0.1873493194580078, -0.18061065673828125, -0.1738719940185547, -0.16713333129882812, -0.16039466857910156, -0.153656005859375, -0.14691734313964844, -0.14017868041992188, -0.1334400177001953, -0.12670135498046875, -0.11996269226074219, -0.11322402954101562, -0.10648536682128906, -0.0997467041015625, -0.09300804138183594, -0.08626937866210938, -0.07953071594238281, -0.07279205322265625, -0.06605339050292969, -0.059314727783203125, -0.05257606506347656, -0.04583740234375, -0.03909873962402344, -0.032360076904296875, -0.025621414184570312, -0.01888275146484375, -0.012144088745117188, -0.005405426025390625, 0.0013332366943359375, 0.0080718994140625, 0.014810562133789062, 0.021549224853515625, 0.028287887573242188, 0.03502655029296875, 0.04176521301269531, 0.048503875732421875, 0.05524253845214844, 0.061981201171875, 0.06871986389160156, 0.07545852661132812, 0.08219718933105469, 0.08893585205078125, 0.09567451477050781, 0.10241317749023438, 0.10915184020996094, 0.1158905029296875, 0.12262916564941406, 0.12936782836914062, 0.1361064910888672, 0.14284515380859375, 0.1495838165283203, 0.15632247924804688, 0.16306114196777344, 0.1697998046875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 6.0, 9.0, 6.0, 10.0, 9.0, 13.0, 25.0, 22.0, 42.0, 30.0, 48.0, 44.0, 62.0, 59.0, 79.0, 67.0, 67.0, 66.0, 62.0, 65.0, 41.0, 42.0, 32.0, 25.0, 14.0, 20.0, 10.0, 14.0, 7.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.14111328125, -0.13785457611083984, -0.1345958709716797, -0.13133716583251953, -0.12807846069335938, -0.12481975555419922, -0.12156105041503906, -0.1183023452758789, -0.11504364013671875, -0.1117849349975586, -0.10852622985839844, -0.10526752471923828, -0.10200881958007812, -0.09875011444091797, -0.09549140930175781, -0.09223270416259766, -0.0889739990234375, -0.08571529388427734, -0.08245658874511719, -0.07919788360595703, -0.07593917846679688, -0.07268047332763672, -0.06942176818847656, -0.0661630630493164, -0.06290435791015625, -0.059645652770996094, -0.05638694763183594, -0.05312824249267578, -0.049869537353515625, -0.04661083221435547, -0.04335212707519531, -0.040093421936035156, -0.036834716796875, -0.033576011657714844, -0.030317306518554688, -0.02705860137939453, -0.023799896240234375, -0.02054119110107422, -0.017282485961914062, -0.014023780822753906, -0.01076507568359375, -0.007506370544433594, -0.0042476654052734375, -0.0009889602661132812, 0.002269744873046875, 0.005528450012207031, 0.008787155151367188, 0.012045860290527344, 0.0153045654296875, 0.018563270568847656, 0.021821975708007812, 0.02508068084716797, 0.028339385986328125, 0.03159809112548828, 0.03485679626464844, 0.038115501403808594, 0.04137420654296875, 0.044632911682128906, 0.04789161682128906, 0.05115032196044922, 0.054409027099609375, 0.05766773223876953, 0.06092643737792969, 0.06418514251708984, 0.06744384765625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 4.0, 10.0, 8.0, 12.0, 15.0, 25.0, 37.0, 48.0, 99.0, 165.0, 298.0, 641.0, 1435.0, 4284.0, 23891.0, 301308.0, 656734.0, 49205.0, 6726.0, 1938.0, 815.0, 359.0, 201.0, 112.0, 71.0, 40.0, 23.0, 17.0, 9.0, 12.0, 1.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2978515625, -0.2879753112792969, -0.27809906005859375, -0.2682228088378906, -0.2583465576171875, -0.24847030639648438, -0.23859405517578125, -0.22871780395507812, -0.218841552734375, -0.20896530151367188, -0.19908905029296875, -0.18921279907226562, -0.1793365478515625, -0.16946029663085938, -0.15958404541015625, -0.14970779418945312, -0.13983154296875, -0.12995529174804688, -0.12007904052734375, -0.11020278930664062, -0.1003265380859375, -0.09045028686523438, -0.08057403564453125, -0.07069778442382812, -0.060821533203125, -0.050945281982421875, -0.04106903076171875, -0.031192779541015625, -0.0213165283203125, -0.011440277099609375, -0.00156402587890625, 0.008312225341796875, 0.0181884765625, 0.028064727783203125, 0.03794097900390625, 0.047817230224609375, 0.0576934814453125, 0.06756973266601562, 0.07744598388671875, 0.08732223510742188, 0.097198486328125, 0.10707473754882812, 0.11695098876953125, 0.12682723999023438, 0.1367034912109375, 0.14657974243164062, 0.15645599365234375, 0.16633224487304688, 0.17620849609375, 0.18608474731445312, 0.19596099853515625, 0.20583724975585938, 0.2157135009765625, 0.22558975219726562, 0.23546600341796875, 0.24534225463867188, 0.255218505859375, 0.2650947570800781, 0.27497100830078125, 0.2848472595214844, 0.2947235107421875, 0.3045997619628906, 0.31447601318359375, 0.3243522644042969, 0.334228515625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 5.0, 13.0, 11.0, 23.0, 38.0, 35.0, 53.0, 77.0, 71.0, 91.0, 86.0, 89.0, 93.0, 81.0, 65.0, 61.0, 45.0, 25.0, 13.0, 11.0, 8.0, 4.0, 6.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54541015625, -0.52783203125, -0.51025390625, -0.49267578125, -0.47509765625, -0.45751953125, -0.43994140625, -0.42236328125, -0.40478515625, -0.38720703125, -0.36962890625, -0.35205078125, -0.33447265625, -0.31689453125, -0.29931640625, -0.28173828125, -0.26416015625, -0.24658203125, -0.22900390625, -0.21142578125, -0.19384765625, -0.17626953125, -0.15869140625, -0.14111328125, -0.12353515625, -0.10595703125, -0.08837890625, -0.07080078125, -0.05322265625, -0.03564453125, -0.01806640625, -0.00048828125, 0.01708984375, 0.03466796875, 0.05224609375, 0.06982421875, 0.08740234375, 0.10498046875, 0.12255859375, 0.14013671875, 0.15771484375, 0.17529296875, 0.19287109375, 0.21044921875, 0.22802734375, 0.24560546875, 0.26318359375, 0.28076171875, 0.29833984375, 0.31591796875, 0.33349609375, 0.35107421875, 0.36865234375, 0.38623046875, 0.40380859375, 0.42138671875, 0.43896484375, 0.45654296875, 0.47412109375, 0.49169921875, 0.50927734375, 0.52685546875, 0.54443359375, 0.56201171875, 0.57958984375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 9.0, 5.0, 9.0, 12.0, 15.0, 36.0, 56.0, 95.0, 204.0, 452.0, 1344.0, 6978.0, 294880.0, 731644.0, 10164.0, 1610.0, 524.0, 218.0, 123.0, 70.0, 35.0, 32.0, 19.0, 10.0, 3.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.296875, -0.28762054443359375, -0.2783660888671875, -0.26911163330078125, -0.259857177734375, -0.25060272216796875, -0.2413482666015625, -0.23209381103515625, -0.22283935546875, -0.21358489990234375, -0.2043304443359375, -0.19507598876953125, -0.185821533203125, -0.17656707763671875, -0.1673126220703125, -0.15805816650390625, -0.1488037109375, -0.13954925537109375, -0.1302947998046875, -0.12104034423828125, -0.111785888671875, -0.10253143310546875, -0.0932769775390625, -0.08402252197265625, -0.07476806640625, -0.06551361083984375, -0.0562591552734375, -0.04700469970703125, -0.037750244140625, -0.02849578857421875, -0.0192413330078125, -0.00998687744140625, -0.000732421875, 0.00852203369140625, 0.0177764892578125, 0.02703094482421875, 0.036285400390625, 0.04553985595703125, 0.0547943115234375, 0.06404876708984375, 0.07330322265625, 0.08255767822265625, 0.0918121337890625, 0.10106658935546875, 0.110321044921875, 0.11957550048828125, 0.1288299560546875, 0.13808441162109375, 0.1473388671875, 0.15659332275390625, 0.1658477783203125, 0.17510223388671875, 0.184356689453125, 0.19361114501953125, 0.2028656005859375, 0.21212005615234375, 0.22137451171875, 0.23062896728515625, 0.2398834228515625, 0.24913787841796875, 0.258392333984375, 0.26764678955078125, 0.2769012451171875, 0.28615570068359375, 0.29541015625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 15.0, 47.0, 195.0, 442.0, 208.0, 48.0, 16.0, 9.0, 8.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.26716423034668e-05, -7.91521742939949e-05, -7.563270628452301e-05, -7.211323827505112e-05, -6.859377026557922e-05, -6.507430225610733e-05, -6.155483424663544e-05, -5.8035366237163544e-05, -5.451589822769165e-05, -5.099643021821976e-05, -4.7476962208747864e-05, -4.395749419927597e-05, -4.043802618980408e-05, -3.6918558180332184e-05, -3.339909017086029e-05, -2.9879622161388397e-05, -2.6360154151916504e-05, -2.284068614244461e-05, -1.9321218132972717e-05, -1.5801750123500824e-05, -1.228228211402893e-05, -8.762814104557037e-06, -5.243346095085144e-06, -1.7238780856132507e-06, 1.7955899238586426e-06, 5.315057933330536e-06, 8.83452594280243e-06, 1.2353993952274323e-05, 1.5873461961746216e-05, 1.939292997121811e-05, 2.2912397980690002e-05, 2.6431865990161896e-05, 2.995133399963379e-05, 3.347080200910568e-05, 3.6990270018577576e-05, 4.050973802804947e-05, 4.402920603752136e-05, 4.7548674046993256e-05, 5.106814205646515e-05, 5.458761006593704e-05, 5.8107078075408936e-05, 6.162654608488083e-05, 6.514601409435272e-05, 6.866548210382462e-05, 7.218495011329651e-05, 7.57044181227684e-05, 7.92238861322403e-05, 8.274335414171219e-05, 8.626282215118408e-05, 8.978229016065598e-05, 9.330175817012787e-05, 9.682122617959976e-05, 0.00010034069418907166, 0.00010386016219854355, 0.00010737963020801544, 0.00011089909821748734, 0.00011441856622695923, 0.00011793803423643112, 0.00012145750224590302, 0.0001249769702553749, 0.0001284964382648468, 0.0001320159062743187, 0.0001355353742837906, 0.00013905484229326248, 0.00014257431030273438]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 6.0, 8.0, 13.0, 15.0, 30.0, 65.0, 126.0, 279.0, 669.0, 2213.0, 11834.0, 222456.0, 774936.0, 30274.0, 3899.0, 1001.0, 388.0, 158.0, 67.0, 45.0, 33.0, 12.0, 7.0, 9.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1737060546875, -0.1679534912109375, -0.162200927734375, -0.1564483642578125, -0.15069580078125, -0.1449432373046875, -0.139190673828125, -0.1334381103515625, -0.127685546875, -0.1219329833984375, -0.116180419921875, -0.1104278564453125, -0.10467529296875, -0.0989227294921875, -0.093170166015625, -0.0874176025390625, -0.0816650390625, -0.0759124755859375, -0.070159912109375, -0.0644073486328125, -0.05865478515625, -0.0529022216796875, -0.047149658203125, -0.0413970947265625, -0.03564453125, -0.0298919677734375, -0.024139404296875, -0.0183868408203125, -0.01263427734375, -0.0068817138671875, -0.001129150390625, 0.0046234130859375, 0.0103759765625, 0.0161285400390625, 0.021881103515625, 0.0276336669921875, 0.03338623046875, 0.0391387939453125, 0.044891357421875, 0.0506439208984375, 0.056396484375, 0.0621490478515625, 0.067901611328125, 0.0736541748046875, 0.07940673828125, 0.0851593017578125, 0.090911865234375, 0.0966644287109375, 0.1024169921875, 0.1081695556640625, 0.113922119140625, 0.1196746826171875, 0.12542724609375, 0.1311798095703125, 0.136932373046875, 0.1426849365234375, 0.1484375, 0.1541900634765625, 0.159942626953125, 0.1656951904296875, 0.17144775390625, 0.1772003173828125, 0.182952880859375, 0.1887054443359375, 0.1944580078125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 8.0, 8.0, 7.0, 12.0, 16.0, 26.0, 28.0, 28.0, 61.0, 73.0, 84.0, 82.0, 98.0, 93.0, 86.0, 57.0, 61.0, 37.0, 38.0, 33.0, 17.0, 15.0, 15.0, 7.0, 5.0, 2.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.137451171875, -0.133697509765625, -0.12994384765625, -0.126190185546875, -0.1224365234375, -0.118682861328125, -0.11492919921875, -0.111175537109375, -0.107421875, -0.103668212890625, -0.09991455078125, -0.096160888671875, -0.0924072265625, -0.088653564453125, -0.08489990234375, -0.081146240234375, -0.077392578125, -0.073638916015625, -0.06988525390625, -0.066131591796875, -0.0623779296875, -0.058624267578125, -0.05487060546875, -0.051116943359375, -0.04736328125, -0.043609619140625, -0.03985595703125, -0.036102294921875, -0.0323486328125, -0.028594970703125, -0.02484130859375, -0.021087646484375, -0.017333984375, -0.013580322265625, -0.00982666015625, -0.006072998046875, -0.0023193359375, 0.001434326171875, 0.00518798828125, 0.008941650390625, 0.0126953125, 0.016448974609375, 0.02020263671875, 0.023956298828125, 0.0277099609375, 0.031463623046875, 0.03521728515625, 0.038970947265625, 0.042724609375, 0.046478271484375, 0.05023193359375, 0.053985595703125, 0.0577392578125, 0.061492919921875, 0.06524658203125, 0.069000244140625, 0.07275390625, 0.076507568359375, 0.08026123046875, 0.084014892578125, 0.0877685546875, 0.091522216796875, 0.09527587890625, 0.099029541015625, 0.102783203125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 7.0, 28.0, 118.0, 341.0, 320.0, 115.0, 43.0, 19.0, 9.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.989715576171875, -2.8531434535980225, -2.71657133102417, -2.5799989700317383, -2.4434268474578857, -2.306854724884033, -2.1702823638916016, -2.033710241317749, -1.8971381187438965, -1.760565996170044, -1.6239937543869019, -1.4874215126037598, -1.3508493900299072, -1.2142772674560547, -1.0777050256729126, -0.9411328434944153, -0.804560661315918, -0.6679884791374207, -0.5314162969589233, -0.394844114780426, -0.2582719326019287, -0.1216997504234314, 0.014872431755065918, 0.15144461393356323, 0.28801679611206055, 0.42458897829055786, 0.5611611604690552, 0.6977333426475525, 0.8343055248260498, 0.9708777070045471, 1.1074498891830444, 1.2440221309661865, 1.380594253540039, 1.5171663761138916, 1.6537386178970337, 1.7903108596801758, 1.9268829822540283, 2.063455104827881, 2.2000274658203125, 2.336599588394165, 2.4731717109680176, 2.60974383354187, 2.7463159561157227, 2.8828883171081543, 3.019460439682007, 3.1560325622558594, 3.292604923248291, 3.4291770458221436, 3.565749168395996, 3.7023212909698486, 3.838893413543701, 3.975465774536133, 4.112037658691406, 4.248610019683838, 4.3851823806762695, 4.521754264831543, 4.658326625823975, 4.794898986816406, 4.93147087097168, 5.068043231964111, 5.204615592956543, 5.341187477111816, 5.477759838104248, 5.6143317222595215, 5.750904083251953]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 5.0, 9.0, 13.0, 12.0, 20.0, 25.0, 27.0, 23.0, 33.0, 29.0, 51.0, 67.0, 66.0, 84.0, 76.0, 77.0, 66.0, 67.0, 53.0, 37.0, 36.0, 22.0, 32.0, 22.0, 13.0, 8.0, 9.0, 6.0, 5.0, 0.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.3520870208740234, -2.2909655570983887, -2.229843854904175, -2.16872239112854, -2.107600688934326, -2.0464792251586914, -1.985357642173767, -1.9242360591888428, -1.8631144762039185, -1.8019928932189941, -1.7408713102340698, -1.6797497272491455, -1.6186282634735107, -1.5575065612792969, -1.496385097503662, -1.4352635145187378, -1.3741419315338135, -1.3130203485488892, -1.2518987655639648, -1.1907771825790405, -1.1296555995941162, -1.0685341358184814, -1.0074125528335571, -0.9462909698486328, -0.8851693868637085, -0.8240478038787842, -0.7629262208938599, -0.7018046975135803, -0.640683114528656, -0.5795615315437317, -0.5184400081634521, -0.45731842517852783, -0.3961968421936035, -0.3350752592086792, -0.27395370602607727, -0.21283213794231415, -0.15171056985855103, -0.09058898687362671, -0.02946743369102478, 0.03165411949157715, 0.09277570247650146, 0.1538972705602646, 0.2150188386440277, 0.27614039182662964, 0.33726197481155396, 0.39838355779647827, 0.4595051109790802, 0.5206266641616821, 0.5817482471466064, 0.6428698301315308, 0.7039914131164551, 0.7651129364967346, 0.8262345194816589, 0.8873561024665833, 0.9484776258468628, 1.009599208831787, 1.0707207918167114, 1.1318423748016357, 1.19296395778656, 1.2540855407714844, 1.3152070045471191, 1.376328706741333, 1.4374501705169678, 1.498571753501892, 1.5596933364868164]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 10.0, 23.0, 37.0, 71.0, 168.0, 620.0, 8056.0, 3143771.0, 1036233.0, 4576.0, 444.0, 137.0, 58.0, 28.0, 14.0, 12.0, 3.0, 8.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60595703125, -0.5927619934082031, -0.5795669555664062, -0.5663719177246094, -0.5531768798828125, -0.5399818420410156, -0.5267868041992188, -0.5135917663574219, -0.500396728515625, -0.4872016906738281, -0.47400665283203125, -0.4608116149902344, -0.4476165771484375, -0.4344215393066406, -0.42122650146484375, -0.4080314636230469, -0.39483642578125, -0.3816413879394531, -0.36844635009765625, -0.3552513122558594, -0.3420562744140625, -0.3288612365722656, -0.31566619873046875, -0.3024711608886719, -0.289276123046875, -0.2760810852050781, -0.26288604736328125, -0.24969100952148438, -0.2364959716796875, -0.22330093383789062, -0.21010589599609375, -0.19691085815429688, -0.1837158203125, -0.17052078247070312, -0.15732574462890625, -0.14413070678710938, -0.1309356689453125, -0.11774063110351562, -0.10454559326171875, -0.09135055541992188, -0.078155517578125, -0.06496047973632812, -0.05176544189453125, -0.038570404052734375, -0.0253753662109375, -0.012180328369140625, 0.00101470947265625, 0.014209747314453125, 0.02740478515625, 0.040599822998046875, 0.05379486083984375, 0.06698989868164062, 0.0801849365234375, 0.09337997436523438, 0.10657501220703125, 0.11977005004882812, 0.132965087890625, 0.14616012573242188, 0.15935516357421875, 0.17255020141601562, 0.1857452392578125, 0.19894027709960938, 0.21213531494140625, 0.22533035278320312, 0.238525390625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 5.0, 5.0, 5.0, 11.0, 9.0, 9.0, 12.0, 15.0, 11.0, 17.0, 29.0, 29.0, 36.0, 34.0, 41.0, 44.0, 50.0, 52.0, 51.0, 50.0, 42.0, 60.0, 44.0, 43.0, 36.0, 39.0, 35.0, 23.0, 26.0, 23.0, 24.0, 17.0, 18.0, 17.0, 14.0, 4.0, 8.0, 5.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07318115234375, -0.07101154327392578, -0.06884193420410156, -0.06667232513427734, -0.06450271606445312, -0.062333106994628906, -0.06016349792480469, -0.05799388885498047, -0.05582427978515625, -0.05365467071533203, -0.05148506164550781, -0.049315452575683594, -0.047145843505859375, -0.044976234436035156, -0.04280662536621094, -0.04063701629638672, -0.0384674072265625, -0.03629779815673828, -0.03412818908691406, -0.031958580017089844, -0.029788970947265625, -0.027619361877441406, -0.025449752807617188, -0.02328014373779297, -0.02111053466796875, -0.01894092559814453, -0.016771316528320312, -0.014601707458496094, -0.012432098388671875, -0.010262489318847656, -0.008092880249023438, -0.005923271179199219, -0.003753662109375, -0.0015840530395507812, 0.0005855560302734375, 0.0027551651000976562, 0.004924774169921875, 0.007094383239746094, 0.009263992309570312, 0.011433601379394531, 0.01360321044921875, 0.01577281951904297, 0.017942428588867188, 0.020112037658691406, 0.022281646728515625, 0.024451255798339844, 0.026620864868164062, 0.02879047393798828, 0.0309600830078125, 0.03312969207763672, 0.03529930114746094, 0.037468910217285156, 0.039638519287109375, 0.041808128356933594, 0.04397773742675781, 0.04614734649658203, 0.04831695556640625, 0.05048656463623047, 0.05265617370605469, 0.054825782775878906, 0.056995391845703125, 0.059165000915527344, 0.06133460998535156, 0.06350421905517578, 0.065673828125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 3.0, 5.0, 7.0, 13.0, 15.0, 14.0, 22.0, 34.0, 36.0, 63.0, 95.0, 159.0, 376.0, 1223.0, 9459.0, 284860.0, 3857933.0, 36617.0, 2436.0, 502.0, 189.0, 86.0, 51.0, 30.0, 23.0, 13.0, 8.0, 9.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.295166015625, -0.2834815979003906, -0.27179718017578125, -0.2601127624511719, -0.2484283447265625, -0.23674392700195312, -0.22505950927734375, -0.21337509155273438, -0.201690673828125, -0.19000625610351562, -0.17832183837890625, -0.16663742065429688, -0.1549530029296875, -0.14326858520507812, -0.13158416748046875, -0.11989974975585938, -0.10821533203125, -0.09653091430664062, -0.08484649658203125, -0.07316207885742188, -0.0614776611328125, -0.049793243408203125, -0.03810882568359375, -0.026424407958984375, -0.014739990234375, -0.003055572509765625, 0.00862884521484375, 0.020313262939453125, 0.0319976806640625, 0.043682098388671875, 0.05536651611328125, 0.06705093383789062, 0.0787353515625, 0.09041976928710938, 0.10210418701171875, 0.11378860473632812, 0.1254730224609375, 0.13715744018554688, 0.14884185791015625, 0.16052627563476562, 0.172210693359375, 0.18389511108398438, 0.19557952880859375, 0.20726394653320312, 0.2189483642578125, 0.23063278198242188, 0.24231719970703125, 0.2540016174316406, 0.26568603515625, 0.2773704528808594, 0.28905487060546875, 0.3007392883300781, 0.3124237060546875, 0.3241081237792969, 0.33579254150390625, 0.3474769592285156, 0.359161376953125, 0.3708457946777344, 0.38253021240234375, 0.3942146301269531, 0.4058990478515625, 0.4175834655761719, 0.42926788330078125, 0.4409523010253906, 0.45263671875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 9.0, 8.0, 4.0, 12.0, 17.0, 13.0, 34.0, 40.0, 78.0, 119.0, 298.0, 726.0, 1364.0, 751.0, 283.0, 143.0, 82.0, 46.0, 21.0, 13.0, 10.0, 4.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35498046875, -0.3464221954345703, -0.3378639221191406, -0.32930564880371094, -0.32074737548828125, -0.31218910217285156, -0.3036308288574219, -0.2950725555419922, -0.2865142822265625, -0.2779560089111328, -0.2693977355957031, -0.26083946228027344, -0.25228118896484375, -0.24372291564941406, -0.23516464233398438, -0.2266063690185547, -0.218048095703125, -0.2094898223876953, -0.20093154907226562, -0.19237327575683594, -0.18381500244140625, -0.17525672912597656, -0.16669845581054688, -0.1581401824951172, -0.1495819091796875, -0.1410236358642578, -0.13246536254882812, -0.12390708923339844, -0.11534881591796875, -0.10679054260253906, -0.09823226928710938, -0.08967399597167969, -0.08111572265625, -0.07255744934082031, -0.06399917602539062, -0.05544090270996094, -0.04688262939453125, -0.03832435607910156, -0.029766082763671875, -0.021207809448242188, -0.0126495361328125, -0.0040912628173828125, 0.004467010498046875, 0.013025283813476562, 0.02158355712890625, 0.030141830444335938, 0.038700103759765625, 0.04725837707519531, 0.055816650390625, 0.06437492370605469, 0.07293319702148438, 0.08149147033691406, 0.09004974365234375, 0.09860801696777344, 0.10716629028320312, 0.11572456359863281, 0.1242828369140625, 0.1328411102294922, 0.14139938354492188, 0.14995765686035156, 0.15851593017578125, 0.16707420349121094, 0.17563247680664062, 0.1841907501220703, 0.1927490234375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 14.0, 21.0, 44.0, 119.0, 267.0, 317.0, 143.0, 31.0, 24.0, 10.0, 5.0, 1.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.67451286315918, -4.566181659698486, -4.457850456237793, -4.3495192527771, -4.241188049316406, -4.132857322692871, -4.0245256423950195, -3.9161946773529053, -3.807863712310791, -3.6995325088500977, -3.5912013053894043, -3.482870101928711, -3.3745391368865967, -3.2662079334259033, -3.15787672996521, -3.0495455265045166, -2.9412143230438232, -2.83288311958313, -2.7245519161224365, -2.6162209510803223, -2.507889747619629, -2.3995585441589355, -2.291227340698242, -2.182896137237549, -2.0745649337768555, -1.966233730316162, -1.8579026460647583, -1.749571442604065, -1.6412403583526611, -1.5329091548919678, -1.4245779514312744, -1.316246747970581, -1.207916021347046, -1.0995848178863525, -0.9912537336349487, -0.8829225301742554, -0.7745913863182068, -0.6662602424621582, -0.5579290390014648, -0.44959789514541626, -0.3412667512893677, -0.2329355925321579, -0.12460443377494812, -0.01627326011657715, 0.09205788373947144, 0.20038902759552002, 0.3087202310562134, 0.41705137491226196, 0.5253825187683105, 0.6337136626243591, 0.7420448064804077, 0.8503760099411011, 0.9587071537971497, 1.0670382976531982, 1.1753695011138916, 1.283700704574585, 1.3920317888259888, 1.5003629922866821, 1.608694076538086, 1.7170252799987793, 1.8253564834594727, 1.9336875677108765, 2.0420188903808594, 2.1503498554229736, 2.258681058883667]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 7.0, 3.0, 3.0, 15.0, 12.0, 15.0, 24.0, 24.0, 24.0, 36.0, 34.0, 37.0, 40.0, 45.0, 35.0, 40.0, 65.0, 39.0, 51.0, 49.0, 39.0, 46.0, 35.0, 37.0, 41.0, 23.0, 24.0, 23.0, 25.0, 16.0, 16.0, 13.0, 14.0, 7.0, 8.0, 5.0, 8.0, 7.0, 7.0, 3.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.859557032585144, -0.8319158554077148, -0.8042746186256409, -0.7766334414482117, -0.7489922046661377, -0.7213510274887085, -0.6937097907066345, -0.6660686135292053, -0.6384273767471313, -0.6107861995697021, -0.5831449627876282, -0.555503785610199, -0.527862548828125, -0.5002213716506958, -0.4725801348686218, -0.4449389576911926, -0.41729775071144104, -0.38965654373168945, -0.36201533675193787, -0.3343741297721863, -0.3067329227924347, -0.2790917158126831, -0.2514505386352539, -0.22380931675434113, -0.19616810977458954, -0.16852690279483795, -0.14088569581508636, -0.11324449628591537, -0.08560328930616379, -0.0579620897769928, -0.03032088279724121, -0.002679675817489624, 0.024961531162261963, 0.05260273814201355, 0.08024394512176514, 0.10788514465093613, 0.1355263590812683, 0.1631675511598587, 0.1908087581396103, 0.21844996511936188, 0.24609117209911346, 0.27373236417770386, 0.30137357115745544, 0.32901477813720703, 0.3566559851169586, 0.3842971920967102, 0.4119383990764618, 0.4395796060562134, 0.46722081303596497, 0.49486202001571655, 0.5225031971931458, 0.5501444339752197, 0.5777856111526489, 0.6054268479347229, 0.6330680251121521, 0.6607092618942261, 0.6883504390716553, 0.7159916162490845, 0.7436328530311584, 0.7712740302085876, 0.7989152669906616, 0.8265564441680908, 0.8541976809501648, 0.881838858127594, 0.909480094909668]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 3.0, 3.0, 7.0, 10.0, 8.0, 18.0, 19.0, 35.0, 58.0, 82.0, 137.0, 186.0, 299.0, 478.0, 772.0, 1288.0, 2130.0, 3608.0, 6255.0, 11213.0, 19946.0, 36734.0, 65339.0, 113779.0, 177597.0, 207945.0, 164974.0, 102954.0, 58348.0, 32616.0, 17997.0, 9926.0, 5672.0, 3188.0, 1858.0, 1131.0, 703.0, 419.0, 272.0, 176.0, 114.0, 96.0, 56.0, 45.0, 23.0, 13.0, 10.0, 7.0, 6.0, 5.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0633544921875, -0.06112384796142578, -0.05889320373535156, -0.056662559509277344, -0.054431915283203125, -0.052201271057128906, -0.04997062683105469, -0.04773998260498047, -0.04550933837890625, -0.04327869415283203, -0.04104804992675781, -0.038817405700683594, -0.036586761474609375, -0.034356117248535156, -0.03212547302246094, -0.02989482879638672, -0.0276641845703125, -0.02543354034423828, -0.023202896118164062, -0.020972251892089844, -0.018741607666015625, -0.016510963439941406, -0.014280319213867188, -0.012049674987792969, -0.00981903076171875, -0.007588386535644531, -0.0053577423095703125, -0.0031270980834960938, -0.000896453857421875, 0.0013341903686523438, 0.0035648345947265625, 0.005795478820800781, 0.008026123046875, 0.010256767272949219, 0.012487411499023438, 0.014718055725097656, 0.016948699951171875, 0.019179344177246094, 0.021409988403320312, 0.02364063262939453, 0.02587127685546875, 0.02810192108154297, 0.030332565307617188, 0.032563209533691406, 0.034793853759765625, 0.037024497985839844, 0.03925514221191406, 0.04148578643798828, 0.0437164306640625, 0.04594707489013672, 0.04817771911621094, 0.050408363342285156, 0.052639007568359375, 0.054869651794433594, 0.05710029602050781, 0.05933094024658203, 0.06156158447265625, 0.06379222869873047, 0.06602287292480469, 0.0682535171508789, 0.07048416137695312, 0.07271480560302734, 0.07494544982910156, 0.07717609405517578, 0.07940673828125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 5.0, 3.0, 6.0, 5.0, 5.0, 4.0, 16.0, 11.0, 18.0, 19.0, 31.0, 30.0, 29.0, 35.0, 36.0, 52.0, 40.0, 34.0, 60.0, 37.0, 46.0, 49.0, 59.0, 47.0, 34.0, 38.0, 21.0, 28.0, 31.0, 27.0, 30.0, 17.0, 18.0, 18.0, 11.0, 16.0, 8.0, 3.0, 5.0, 4.0, 3.0, 1.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0743408203125, -0.0721750259399414, -0.07000923156738281, -0.06784343719482422, -0.06567764282226562, -0.06351184844970703, -0.06134605407714844, -0.059180259704589844, -0.05701446533203125, -0.054848670959472656, -0.05268287658691406, -0.05051708221435547, -0.048351287841796875, -0.04618549346923828, -0.04401969909667969, -0.041853904724121094, -0.0396881103515625, -0.037522315979003906, -0.03535652160644531, -0.03319072723388672, -0.031024932861328125, -0.02885913848876953, -0.026693344116210938, -0.024527549743652344, -0.02236175537109375, -0.020195960998535156, -0.018030166625976562, -0.01586437225341797, -0.013698577880859375, -0.011532783508300781, -0.009366989135742188, -0.007201194763183594, -0.005035400390625, -0.0028696060180664062, -0.0007038116455078125, 0.0014619827270507812, 0.003627777099609375, 0.005793571472167969, 0.007959365844726562, 0.010125160217285156, 0.01229095458984375, 0.014456748962402344, 0.016622543334960938, 0.01878833770751953, 0.020954132080078125, 0.02311992645263672, 0.025285720825195312, 0.027451515197753906, 0.0296173095703125, 0.031783103942871094, 0.03394889831542969, 0.03611469268798828, 0.038280487060546875, 0.04044628143310547, 0.04261207580566406, 0.044777870178222656, 0.04694366455078125, 0.049109458923339844, 0.05127525329589844, 0.05344104766845703, 0.055606842041015625, 0.05777263641357422, 0.05993843078613281, 0.062104225158691406, 0.06427001953125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 7.0, 6.0, 14.0, 20.0, 30.0, 32.0, 48.0, 58.0, 105.0, 154.0, 259.0, 426.0, 782.0, 1628.0, 4515.0, 21986.0, 278960.0, 681338.0, 46606.0, 7038.0, 2185.0, 982.0, 507.0, 326.0, 200.0, 109.0, 73.0, 49.0, 34.0, 25.0, 14.0, 13.0, 7.0, 10.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.336669921875, -0.3265190124511719, -0.31636810302734375, -0.3062171936035156, -0.2960662841796875, -0.2859153747558594, -0.27576446533203125, -0.2656135559082031, -0.255462646484375, -0.24531173706054688, -0.23516082763671875, -0.22500991821289062, -0.2148590087890625, -0.20470809936523438, -0.19455718994140625, -0.18440628051757812, -0.17425537109375, -0.16410446166992188, -0.15395355224609375, -0.14380264282226562, -0.1336517333984375, -0.12350082397460938, -0.11334991455078125, -0.10319900512695312, -0.093048095703125, -0.08289718627929688, -0.07274627685546875, -0.06259536743164062, -0.0524444580078125, -0.042293548583984375, -0.03214263916015625, -0.021991729736328125, -0.0118408203125, -0.001689910888671875, 0.00846099853515625, 0.018611907958984375, 0.0287628173828125, 0.038913726806640625, 0.04906463623046875, 0.059215545654296875, 0.069366455078125, 0.07951736450195312, 0.08966827392578125, 0.09981918334960938, 0.1099700927734375, 0.12012100219726562, 0.13027191162109375, 0.14042282104492188, 0.15057373046875, 0.16072463989257812, 0.17087554931640625, 0.18102645874023438, 0.1911773681640625, 0.20132827758789062, 0.21147918701171875, 0.22163009643554688, 0.231781005859375, 0.24193191528320312, 0.25208282470703125, 0.2622337341308594, 0.2723846435546875, 0.2825355529785156, 0.29268646240234375, 0.3028373718261719, 0.31298828125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 8.0, 6.0, 12.0, 8.0, 16.0, 13.0, 19.0, 35.0, 35.0, 35.0, 35.0, 40.0, 58.0, 58.0, 60.0, 59.0, 65.0, 69.0, 51.0, 51.0, 51.0, 48.0, 32.0, 34.0, 22.0, 22.0, 15.0, 3.0, 10.0, 6.0, 8.0, 5.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.357421875, -0.344512939453125, -0.33160400390625, -0.318695068359375, -0.3057861328125, -0.292877197265625, -0.27996826171875, -0.267059326171875, -0.254150390625, -0.241241455078125, -0.22833251953125, -0.215423583984375, -0.2025146484375, -0.189605712890625, -0.17669677734375, -0.163787841796875, -0.15087890625, -0.137969970703125, -0.12506103515625, -0.112152099609375, -0.0992431640625, -0.086334228515625, -0.07342529296875, -0.060516357421875, -0.047607421875, -0.034698486328125, -0.02178955078125, -0.008880615234375, 0.0040283203125, 0.016937255859375, 0.02984619140625, 0.042755126953125, 0.0556640625, 0.068572998046875, 0.08148193359375, 0.094390869140625, 0.1072998046875, 0.120208740234375, 0.13311767578125, 0.146026611328125, 0.158935546875, 0.171844482421875, 0.18475341796875, 0.197662353515625, 0.2105712890625, 0.223480224609375, 0.23638916015625, 0.249298095703125, 0.26220703125, 0.275115966796875, 0.28802490234375, 0.300933837890625, 0.3138427734375, 0.326751708984375, 0.33966064453125, 0.352569580078125, 0.365478515625, 0.378387451171875, 0.39129638671875, 0.404205322265625, 0.4171142578125, 0.430023193359375, 0.44293212890625, 0.455841064453125, 0.46875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 10.0, 13.0, 17.0, 23.0, 51.0, 82.0, 145.0, 290.0, 487.0, 1036.0, 2340.0, 5841.0, 16701.0, 84687.0, 863884.0, 51103.0, 13141.0, 4828.0, 1968.0, 894.0, 449.0, 218.0, 127.0, 83.0, 50.0, 28.0, 18.0, 13.0, 8.0, 7.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19287109375, -0.1865253448486328, -0.18017959594726562, -0.17383384704589844, -0.16748809814453125, -0.16114234924316406, -0.15479660034179688, -0.1484508514404297, -0.1421051025390625, -0.1357593536376953, -0.12941360473632812, -0.12306785583496094, -0.11672210693359375, -0.11037635803222656, -0.10403060913085938, -0.09768486022949219, -0.091339111328125, -0.08499336242675781, -0.07864761352539062, -0.07230186462402344, -0.06595611572265625, -0.05961036682128906, -0.053264617919921875, -0.04691886901855469, -0.0405731201171875, -0.03422737121582031, -0.027881622314453125, -0.021535873413085938, -0.01519012451171875, -0.008844375610351562, -0.002498626708984375, 0.0038471221923828125, 0.01019287109375, 0.016538619995117188, 0.022884368896484375, 0.029230117797851562, 0.03557586669921875, 0.04192161560058594, 0.048267364501953125, 0.05461311340332031, 0.0609588623046875, 0.06730461120605469, 0.07365036010742188, 0.07999610900878906, 0.08634185791015625, 0.09268760681152344, 0.09903335571289062, 0.10537910461425781, 0.111724853515625, 0.11807060241699219, 0.12441635131835938, 0.13076210021972656, 0.13710784912109375, 0.14345359802246094, 0.14979934692382812, 0.1561450958251953, 0.1624908447265625, 0.1688365936279297, 0.17518234252929688, 0.18152809143066406, 0.18787384033203125, 0.19421958923339844, 0.20056533813476562, 0.2069110870361328, 0.2132568359375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 4.0, 3.0, 5.0, 8.0, 7.0, 8.0, 17.0, 18.0, 16.0, 56.0, 109.0, 271.0, 229.0, 101.0, 51.0, 26.0, 13.0, 9.0, 6.0, 7.0, 5.0, 4.0, 7.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.492303848266602e-05, -7.257610559463501e-05, -7.0229172706604e-05, -6.7882239818573e-05, -6.553530693054199e-05, -6.318837404251099e-05, -6.084144115447998e-05, -5.8494508266448975e-05, -5.614757537841797e-05, -5.380064249038696e-05, -5.145370960235596e-05, -4.910677671432495e-05, -4.6759843826293945e-05, -4.441291093826294e-05, -4.2065978050231934e-05, -3.971904516220093e-05, -3.737211227416992e-05, -3.5025179386138916e-05, -3.267824649810791e-05, -3.0331313610076904e-05, -2.79843807220459e-05, -2.5637447834014893e-05, -2.3290514945983887e-05, -2.094358205795288e-05, -1.8596649169921875e-05, -1.624971628189087e-05, -1.3902783393859863e-05, -1.1555850505828857e-05, -9.208917617797852e-06, -6.861984729766846e-06, -4.51505184173584e-06, -2.168118953704834e-06, 1.7881393432617188e-07, 2.5257468223571777e-06, 4.872679710388184e-06, 7.2196125984191895e-06, 9.566545486450195e-06, 1.1913478374481201e-05, 1.4260411262512207e-05, 1.6607344150543213e-05, 1.895427703857422e-05, 2.1301209926605225e-05, 2.364814281463623e-05, 2.5995075702667236e-05, 2.8342008590698242e-05, 3.068894147872925e-05, 3.3035874366760254e-05, 3.538280725479126e-05, 3.7729740142822266e-05, 4.007667303085327e-05, 4.242360591888428e-05, 4.477053880691528e-05, 4.711747169494629e-05, 4.9464404582977295e-05, 5.18113374710083e-05, 5.415827035903931e-05, 5.650520324707031e-05, 5.885213613510132e-05, 6.119906902313232e-05, 6.354600191116333e-05, 6.589293479919434e-05, 6.823986768722534e-05, 7.058680057525635e-05, 7.293373346328735e-05, 7.528066635131836e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 6.0, 5.0, 7.0, 8.0, 7.0, 12.0, 15.0, 35.0, 35.0, 81.0, 115.0, 186.0, 308.0, 511.0, 958.0, 1904.0, 4300.0, 10244.0, 28378.0, 301972.0, 643242.0, 34615.0, 12037.0, 4888.0, 2214.0, 1011.0, 599.0, 331.0, 181.0, 130.0, 70.0, 43.0, 33.0, 26.0, 15.0, 8.0, 4.0, 3.0, 1.0, 6.0, 2.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1751708984375, -0.1700305938720703, -0.16489028930664062, -0.15974998474121094, -0.15460968017578125, -0.14946937561035156, -0.14432907104492188, -0.1391887664794922, -0.1340484619140625, -0.1289081573486328, -0.12376785278320312, -0.11862754821777344, -0.11348724365234375, -0.10834693908691406, -0.10320663452148438, -0.09806632995605469, -0.092926025390625, -0.08778572082519531, -0.08264541625976562, -0.07750511169433594, -0.07236480712890625, -0.06722450256347656, -0.062084197998046875, -0.05694389343261719, -0.0518035888671875, -0.04666328430175781, -0.041522979736328125, -0.03638267517089844, -0.03124237060546875, -0.026102066040039062, -0.020961761474609375, -0.015821456909179688, -0.01068115234375, -0.0055408477783203125, -0.000400543212890625, 0.0047397613525390625, 0.00988006591796875, 0.015020370483398438, 0.020160675048828125, 0.025300979614257812, 0.0304412841796875, 0.03558158874511719, 0.040721893310546875, 0.04586219787597656, 0.05100250244140625, 0.05614280700683594, 0.061283111572265625, 0.06642341613769531, 0.071563720703125, 0.07670402526855469, 0.08184432983398438, 0.08698463439941406, 0.09212493896484375, 0.09726524353027344, 0.10240554809570312, 0.10754585266113281, 0.1126861572265625, 0.11782646179199219, 0.12296676635742188, 0.12810707092285156, 0.13324737548828125, 0.13838768005371094, 0.14352798461914062, 0.1486682891845703, 0.15380859375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 7.0, 3.0, 3.0, 4.0, 13.0, 8.0, 6.0, 16.0, 15.0, 29.0, 43.0, 48.0, 75.0, 93.0, 96.0, 109.0, 104.0, 80.0, 55.0, 41.0, 39.0, 19.0, 24.0, 12.0, 5.0, 8.0, 2.0, 6.0, 9.0, 3.0, 4.0, 1.0, 6.0, 3.0, 1.0, 3.0, 0.0, 2.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11639404296875, -0.11267948150634766, -0.10896492004394531, -0.10525035858154297, -0.10153579711914062, -0.09782123565673828, -0.09410667419433594, -0.0903921127319336, -0.08667755126953125, -0.0829629898071289, -0.07924842834472656, -0.07553386688232422, -0.07181930541992188, -0.06810474395751953, -0.06439018249511719, -0.060675621032714844, -0.0569610595703125, -0.053246498107910156, -0.04953193664550781, -0.04581737518310547, -0.042102813720703125, -0.03838825225830078, -0.03467369079589844, -0.030959129333496094, -0.02724456787109375, -0.023530006408691406, -0.019815444946289062, -0.01610088348388672, -0.012386322021484375, -0.008671760559082031, -0.0049571990966796875, -0.0012426376342773438, 0.002471923828125, 0.006186485290527344, 0.009901046752929688, 0.013615608215332031, 0.017330169677734375, 0.02104473114013672, 0.024759292602539062, 0.028473854064941406, 0.03218841552734375, 0.035902976989746094, 0.03961753845214844, 0.04333209991455078, 0.047046661376953125, 0.05076122283935547, 0.05447578430175781, 0.058190345764160156, 0.0619049072265625, 0.06561946868896484, 0.06933403015136719, 0.07304859161376953, 0.07676315307617188, 0.08047771453857422, 0.08419227600097656, 0.0879068374633789, 0.09162139892578125, 0.0953359603881836, 0.09905052185058594, 0.10276508331298828, 0.10647964477539062, 0.11019420623779297, 0.11390876770019531, 0.11762332916259766, 0.121337890625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 1.0, 6.0, 16.0, 35.0, 99.0, 199.0, 346.0, 160.0, 87.0, 35.0, 7.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.246280670166016, -4.114625930786133, -3.982970714569092, -3.851315975189209, -3.719660997390747, -3.588006019592285, -3.4563510417938232, -3.3246960639953613, -3.1930413246154785, -3.0613863468170166, -2.9297313690185547, -2.798076629638672, -2.66642165184021, -2.534766674041748, -2.403111696243286, -2.271456718444824, -2.1398017406463623, -2.0081467628479004, -1.876491904258728, -1.7448369264602661, -1.6131820678710938, -1.4815270900726318, -1.34987211227417, -1.218217134475708, -1.0865622758865356, -0.9549073576927185, -0.8232524394989014, -0.6915974617004395, -0.5599425435066223, -0.4282876253128052, -0.29663264751434326, -0.16497772932052612, -0.033322811126708984, 0.09833212196826935, 0.22998705506324768, 0.3616420030593872, 0.49329692125320435, 0.6249518394470215, 0.7566068172454834, 0.8882617354393005, 1.0199166536331177, 1.1515716314315796, 1.283226490020752, 1.4148814678192139, 1.5465364456176758, 1.6781913042068481, 1.80984628200531, 1.9415011405944824, 2.0731561183929443, 2.2048110961914062, 2.336466073989868, 2.46812105178833, 2.599775791168213, 2.731430768966675, 2.8630857467651367, 2.9947407245635986, 3.1263957023620605, 3.2580506801605225, 3.3897056579589844, 3.521360397338867, 3.653015375137329, 3.784670352935791, 3.916325330734253, 4.047980308532715, 4.179635047912598]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 10.0, 5.0, 13.0, 11.0, 20.0, 14.0, 19.0, 25.0, 21.0, 32.0, 25.0, 23.0, 38.0, 34.0, 44.0, 54.0, 72.0, 73.0, 84.0, 50.0, 32.0, 36.0, 31.0, 33.0, 24.0, 20.0, 26.0, 26.0, 24.0, 12.0, 14.0, 12.0, 15.0, 8.0, 4.0, 2.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7685835361480713, -1.717435359954834, -1.6662871837615967, -1.615139126777649, -1.5639909505844116, -1.5128427743911743, -1.4616947174072266, -1.4105465412139893, -1.359398365020752, -1.3082501888275146, -1.2571020126342773, -1.2059539556503296, -1.1548057794570923, -1.103657603263855, -1.0525095462799072, -1.00136137008667, -0.9502131938934326, -0.8990650177001953, -0.8479169011116028, -0.7967687845230103, -0.745620608329773, -0.6944724321365356, -0.6433243155479431, -0.5921761989593506, -0.5410280227661133, -0.48987987637519836, -0.43873172998428345, -0.38758358359336853, -0.3364354372024536, -0.2852872908115387, -0.23413914442062378, -0.18299099802970886, -0.13184285163879395, -0.08069470524787903, -0.02954655885696411, 0.021601587533950806, 0.07274973392486572, 0.12389788031578064, 0.17504602670669556, 0.22619417309761047, 0.2773423194885254, 0.3284904658794403, 0.3796386122703552, 0.43078675866127014, 0.48193490505218506, 0.5330830812454224, 0.5842311978340149, 0.6353793144226074, 0.6865274906158447, 0.737675666809082, 0.7888237833976746, 0.8399718999862671, 0.8911200761795044, 0.9422682523727417, 0.9934163689613342, 1.0445644855499268, 1.095712661743164, 1.1468608379364014, 1.1980090141296387, 1.2491570711135864, 1.3003052473068237, 1.351453423500061, 1.4026014804840088, 1.453749656677246, 1.5048978328704834]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 0.0, 3.0, 5.0, 9.0, 9.0, 6.0, 7.0, 19.0, 19.0, 30.0, 33.0, 59.0, 88.0, 133.0, 178.0, 312.0, 601.0, 1128.0, 2730.0, 7405.0, 25460.0, 137107.0, 1382752.0, 2313200.0, 263789.0, 41808.0, 10726.0, 3582.0, 1467.0, 677.0, 353.0, 184.0, 132.0, 73.0, 55.0, 48.0, 26.0, 25.0, 15.0, 12.0, 6.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.12310791015625, -0.11939430236816406, -0.11568069458007812, -0.11196708679199219, -0.10825347900390625, -0.10453987121582031, -0.10082626342773438, -0.09711265563964844, -0.0933990478515625, -0.08968544006347656, -0.08597183227539062, -0.08225822448730469, -0.07854461669921875, -0.07483100891113281, -0.07111740112304688, -0.06740379333496094, -0.063690185546875, -0.05997657775878906, -0.056262969970703125, -0.05254936218261719, -0.04883575439453125, -0.04512214660644531, -0.041408538818359375, -0.03769493103027344, -0.0339813232421875, -0.030267715454101562, -0.026554107666015625, -0.022840499877929688, -0.01912689208984375, -0.015413284301757812, -0.011699676513671875, -0.007986068725585938, -0.0042724609375, -0.0005588531494140625, 0.003154754638671875, 0.0068683624267578125, 0.01058197021484375, 0.014295578002929688, 0.018009185791015625, 0.021722793579101562, 0.0254364013671875, 0.029150009155273438, 0.032863616943359375, 0.03657722473144531, 0.04029083251953125, 0.04400444030761719, 0.047718048095703125, 0.05143165588378906, 0.055145263671875, 0.05885887145996094, 0.06257247924804688, 0.06628608703613281, 0.06999969482421875, 0.07371330261230469, 0.07742691040039062, 0.08114051818847656, 0.0848541259765625, 0.08856773376464844, 0.09228134155273438, 0.09599494934082031, 0.09970855712890625, 0.10342216491699219, 0.10713577270507812, 0.11084938049316406, 0.11456298828125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 8.0, 7.0, 9.0, 8.0, 12.0, 15.0, 19.0, 15.0, 24.0, 33.0, 48.0, 42.0, 51.0, 45.0, 43.0, 47.0, 52.0, 51.0, 51.0, 58.0, 43.0, 38.0, 38.0, 29.0, 38.0, 27.0, 30.0, 26.0, 17.0, 13.0, 11.0, 11.0, 8.0, 6.0, 4.0, 2.0, 5.0, 0.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08013916015625, -0.07779312133789062, -0.07544708251953125, -0.07310104370117188, -0.0707550048828125, -0.06840896606445312, -0.06606292724609375, -0.06371688842773438, -0.061370849609375, -0.059024810791015625, -0.05667877197265625, -0.054332733154296875, -0.0519866943359375, -0.049640655517578125, -0.04729461669921875, -0.044948577880859375, -0.0426025390625, -0.040256500244140625, -0.03791046142578125, -0.035564422607421875, -0.0332183837890625, -0.030872344970703125, -0.02852630615234375, -0.026180267333984375, -0.023834228515625, -0.021488189697265625, -0.01914215087890625, -0.016796112060546875, -0.0144500732421875, -0.012104034423828125, -0.00975799560546875, -0.007411956787109375, -0.00506591796875, -0.002719879150390625, -0.00037384033203125, 0.001972198486328125, 0.0043182373046875, 0.006664276123046875, 0.00901031494140625, 0.011356353759765625, 0.013702392578125, 0.016048431396484375, 0.01839447021484375, 0.020740509033203125, 0.0230865478515625, 0.025432586669921875, 0.02777862548828125, 0.030124664306640625, 0.032470703125, 0.034816741943359375, 0.03716278076171875, 0.039508819580078125, 0.0418548583984375, 0.044200897216796875, 0.04654693603515625, 0.048892974853515625, 0.051239013671875, 0.053585052490234375, 0.05593109130859375, 0.058277130126953125, 0.0606231689453125, 0.06296920776367188, 0.06531524658203125, 0.06766128540039062, 0.07000732421875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 6.0, 4.0, 7.0, 7.0, 13.0, 11.0, 22.0, 29.0, 32.0, 38.0, 32.0, 60.0, 85.0, 114.0, 140.0, 250.0, 913.0, 7358.0, 1588685.0, 2585673.0, 8954.0, 955.0, 283.0, 145.0, 101.0, 91.0, 49.0, 54.0, 44.0, 32.0, 29.0, 12.0, 13.0, 14.0, 7.0, 13.0, 2.0, 2.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.474365234375, -0.4568138122558594, -0.43926239013671875, -0.4217109680175781, -0.4041595458984375, -0.3866081237792969, -0.36905670166015625, -0.3515052795410156, -0.333953857421875, -0.3164024353027344, -0.29885101318359375, -0.2812995910644531, -0.2637481689453125, -0.24619674682617188, -0.22864532470703125, -0.21109390258789062, -0.19354248046875, -0.17599105834960938, -0.15843963623046875, -0.14088821411132812, -0.1233367919921875, -0.10578536987304688, -0.08823394775390625, -0.07068252563476562, -0.053131103515625, -0.035579681396484375, -0.01802825927734375, -0.000476837158203125, 0.0170745849609375, 0.034626007080078125, 0.05217742919921875, 0.06972885131835938, 0.0872802734375, 0.10483169555664062, 0.12238311767578125, 0.13993453979492188, 0.1574859619140625, 0.17503738403320312, 0.19258880615234375, 0.21014022827148438, 0.227691650390625, 0.24524307250976562, 0.26279449462890625, 0.2803459167480469, 0.2978973388671875, 0.3154487609863281, 0.33300018310546875, 0.3505516052246094, 0.36810302734375, 0.3856544494628906, 0.40320587158203125, 0.4207572937011719, 0.4383087158203125, 0.4558601379394531, 0.47341156005859375, 0.4909629821777344, 0.508514404296875, 0.5260658264160156, 0.5436172485351562, 0.5611686706542969, 0.5787200927734375, 0.5962715148925781, 0.6138229370117188, 0.6313743591308594, 0.64892578125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 5.0, 7.0, 10.0, 11.0, 17.0, 28.0, 38.0, 62.0, 74.0, 153.0, 275.0, 569.0, 856.0, 792.0, 516.0, 267.0, 149.0, 74.0, 47.0, 37.0, 33.0, 16.0, 12.0, 7.0, 6.0, 3.0, 6.0, 4.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.267822265625, -0.260955810546875, -0.25408935546875, -0.247222900390625, -0.2403564453125, -0.233489990234375, -0.22662353515625, -0.219757080078125, -0.212890625, -0.206024169921875, -0.19915771484375, -0.192291259765625, -0.1854248046875, -0.178558349609375, -0.17169189453125, -0.164825439453125, -0.157958984375, -0.151092529296875, -0.14422607421875, -0.137359619140625, -0.1304931640625, -0.123626708984375, -0.11676025390625, -0.109893798828125, -0.10302734375, -0.096160888671875, -0.08929443359375, -0.082427978515625, -0.0755615234375, -0.068695068359375, -0.06182861328125, -0.054962158203125, -0.048095703125, -0.041229248046875, -0.03436279296875, -0.027496337890625, -0.0206298828125, -0.013763427734375, -0.00689697265625, -3.0517578125e-05, 0.0068359375, 0.013702392578125, 0.02056884765625, 0.027435302734375, 0.0343017578125, 0.041168212890625, 0.04803466796875, 0.054901123046875, 0.061767578125, 0.068634033203125, 0.07550048828125, 0.082366943359375, 0.0892333984375, 0.096099853515625, 0.10296630859375, 0.109832763671875, 0.11669921875, 0.123565673828125, 0.13043212890625, 0.137298583984375, 0.1441650390625, 0.151031494140625, 0.15789794921875, 0.164764404296875, 0.171630859375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 3.0, 3.0, 8.0, 7.0, 23.0, 31.0, 54.0, 125.0, 202.0, 217.0, 158.0, 75.0, 41.0, 14.0, 12.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.735196590423584, -3.634678602218628, -3.534160852432251, -3.433642864227295, -3.333125114440918, -3.232607126235962, -3.132089138031006, -3.031571388244629, -2.931053638458252, -2.830535650253296, -2.730017900466919, -2.629499912261963, -2.528982162475586, -2.42846417427063, -2.327946186065674, -2.227428436279297, -2.126910448074341, -2.0263924598693848, -1.9258747100830078, -1.8253567218780518, -1.7248389720916748, -1.6243209838867188, -1.5238031148910522, -1.4232852458953857, -1.3227673768997192, -1.2222495079040527, -1.1217316389083862, -1.0212137699127197, -0.9206958413124084, -0.8201779723167419, -0.7196600437164307, -0.6191421747207642, -0.5186243057250977, -0.41810643672943115, -0.31758853793144226, -0.21707063913345337, -0.11655277013778687, -0.01603490114212036, 0.08448302745819092, 0.18500089645385742, 0.2855187654495239, 0.38603663444519043, 0.4865545332431793, 0.5870724320411682, 0.6875903010368347, 0.7881081700325012, 0.8886260986328125, 0.989143967628479, 1.0896618366241455, 1.190179705619812, 1.2906975746154785, 1.3912155628204346, 1.4917333126068115, 1.5922513008117676, 1.692769169807434, 1.7932870388031006, 1.893804907798767, 1.9943227767944336, 2.0948407649993896, 2.1953585147857666, 2.2958765029907227, 2.3963942527770996, 2.4969122409820557, 2.5974302291870117, 2.6979479789733887]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 4.0, 6.0, 11.0, 13.0, 21.0, 22.0, 36.0, 33.0, 40.0, 48.0, 35.0, 53.0, 70.0, 66.0, 58.0, 56.0, 60.0, 50.0, 59.0, 41.0, 37.0, 29.0, 41.0, 28.0, 19.0, 13.0, 18.0, 7.0, 4.0, 8.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9858115315437317, -0.953815221786499, -0.9218189120292664, -0.8898226022720337, -0.857826292514801, -0.8258299827575684, -0.7938336133956909, -0.761837363243103, -0.7298409938812256, -0.6978446841239929, -0.6658483743667603, -0.6338520646095276, -0.6018557548522949, -0.5698594450950623, -0.5378631353378296, -0.5058667659759521, -0.47387051582336426, -0.4418742060661316, -0.4098778963088989, -0.37788158655166626, -0.3458852767944336, -0.3138889670372009, -0.2818926274776459, -0.2498963177204132, -0.21790000796318054, -0.18590369820594788, -0.1539073884487152, -0.12191106379032135, -0.08991475403308868, -0.05791844427585602, -0.025922119617462158, 0.006074190139770508, 0.03807055950164795, 0.07006686925888062, 0.10206318646669388, 0.13405950367450714, 0.1660558134317398, 0.19805212318897247, 0.23004844784736633, 0.262044757604599, 0.29404106736183167, 0.32603737711906433, 0.358033686876297, 0.39003002643585205, 0.4220263361930847, 0.4540226459503174, 0.48601895570755005, 0.5180152654647827, 0.5500115752220154, 0.582007884979248, 0.6140041947364807, 0.6460005044937134, 0.677996814250946, 0.7099931240081787, 0.7419894933700562, 0.773985743522644, 0.8059821128845215, 0.8379784226417542, 0.8699747323989868, 0.9019710421562195, 0.9339673519134521, 0.9659636616706848, 0.9979599714279175, 1.029956340789795, 1.0619525909423828]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 0.0, 4.0, 2.0, 7.0, 5.0, 6.0, 10.0, 21.0, 26.0, 26.0, 46.0, 58.0, 96.0, 168.0, 224.0, 336.0, 498.0, 867.0, 1326.0, 2323.0, 4253.0, 8089.0, 16674.0, 37824.0, 97000.0, 264250.0, 356582.0, 152741.0, 56988.0, 23992.0, 11031.0, 5470.0, 3030.0, 1706.0, 1017.0, 616.0, 450.0, 249.0, 177.0, 107.0, 79.0, 47.0, 49.0, 34.0, 17.0, 13.0, 7.0, 7.0, 7.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.1536865234375, -0.14860153198242188, -0.14351654052734375, -0.13843154907226562, -0.1333465576171875, -0.12826156616210938, -0.12317657470703125, -0.11809158325195312, -0.113006591796875, -0.10792160034179688, -0.10283660888671875, -0.09775161743164062, -0.0926666259765625, -0.08758163452148438, -0.08249664306640625, -0.07741165161132812, -0.07232666015625, -0.06724166870117188, -0.06215667724609375, -0.057071685791015625, -0.0519866943359375, -0.046901702880859375, -0.04181671142578125, -0.036731719970703125, -0.031646728515625, -0.026561737060546875, -0.02147674560546875, -0.016391754150390625, -0.0113067626953125, -0.006221771240234375, -0.00113677978515625, 0.003948211669921875, 0.009033203125, 0.014118194580078125, 0.01920318603515625, 0.024288177490234375, 0.0293731689453125, 0.034458160400390625, 0.03954315185546875, 0.044628143310546875, 0.049713134765625, 0.054798126220703125, 0.05988311767578125, 0.06496810913085938, 0.0700531005859375, 0.07513809204101562, 0.08022308349609375, 0.08530807495117188, 0.09039306640625, 0.09547805786132812, 0.10056304931640625, 0.10564804077148438, 0.1107330322265625, 0.11581802368164062, 0.12090301513671875, 0.12598800659179688, 0.131072998046875, 0.13615798950195312, 0.14124298095703125, 0.14632797241210938, 0.1514129638671875, 0.15649795532226562, 0.16158294677734375, 0.16666793823242188, 0.1717529296875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 5.0, 8.0, 8.0, 8.0, 18.0, 15.0, 14.0, 16.0, 26.0, 22.0, 33.0, 36.0, 39.0, 42.0, 54.0, 37.0, 60.0, 52.0, 52.0, 34.0, 53.0, 49.0, 36.0, 38.0, 40.0, 21.0, 27.0, 29.0, 28.0, 13.0, 14.0, 13.0, 12.0, 7.0, 10.0, 9.0, 4.0, 5.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.0831298828125, -0.08083152770996094, -0.07853317260742188, -0.07623481750488281, -0.07393646240234375, -0.07163810729980469, -0.06933975219726562, -0.06704139709472656, -0.0647430419921875, -0.06244468688964844, -0.060146331787109375, -0.05784797668457031, -0.05554962158203125, -0.05325126647949219, -0.050952911376953125, -0.04865455627441406, -0.046356201171875, -0.04405784606933594, -0.041759490966796875, -0.03946113586425781, -0.03716278076171875, -0.03486442565917969, -0.032566070556640625, -0.030267715454101562, -0.0279693603515625, -0.025671005249023438, -0.023372650146484375, -0.021074295043945312, -0.01877593994140625, -0.016477584838867188, -0.014179229736328125, -0.011880874633789062, -0.00958251953125, -0.0072841644287109375, -0.004985809326171875, -0.0026874542236328125, -0.00038909912109375, 0.0019092559814453125, 0.004207611083984375, 0.0065059661865234375, 0.0088043212890625, 0.011102676391601562, 0.013401031494140625, 0.015699386596679688, 0.01799774169921875, 0.020296096801757812, 0.022594451904296875, 0.024892807006835938, 0.027191162109375, 0.029489517211914062, 0.031787872314453125, 0.03408622741699219, 0.03638458251953125, 0.03868293762207031, 0.040981292724609375, 0.04327964782714844, 0.0455780029296875, 0.04787635803222656, 0.050174713134765625, 0.05247306823730469, 0.05477142333984375, 0.05706977844238281, 0.059368133544921875, 0.06166648864746094, 0.06396484375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 4.0, 6.0, 5.0, 10.0, 15.0, 15.0, 18.0, 25.0, 33.0, 69.0, 99.0, 149.0, 286.0, 514.0, 1121.0, 3317.0, 15103.0, 241706.0, 751172.0, 27101.0, 4838.0, 1583.0, 594.0, 292.0, 142.0, 117.0, 53.0, 42.0, 30.0, 24.0, 16.0, 17.0, 14.0, 3.0, 4.0, 6.0, 5.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.66015625, -0.639617919921875, -0.61907958984375, -0.598541259765625, -0.5780029296875, -0.557464599609375, -0.53692626953125, -0.516387939453125, -0.495849609375, -0.475311279296875, -0.45477294921875, -0.434234619140625, -0.4136962890625, -0.393157958984375, -0.37261962890625, -0.352081298828125, -0.33154296875, -0.311004638671875, -0.29046630859375, -0.269927978515625, -0.2493896484375, -0.228851318359375, -0.20831298828125, -0.187774658203125, -0.167236328125, -0.146697998046875, -0.12615966796875, -0.105621337890625, -0.0850830078125, -0.064544677734375, -0.04400634765625, -0.023468017578125, -0.0029296875, 0.017608642578125, 0.03814697265625, 0.058685302734375, 0.0792236328125, 0.099761962890625, 0.12030029296875, 0.140838623046875, 0.161376953125, 0.181915283203125, 0.20245361328125, 0.222991943359375, 0.2435302734375, 0.264068603515625, 0.28460693359375, 0.305145263671875, 0.32568359375, 0.346221923828125, 0.36676025390625, 0.387298583984375, 0.4078369140625, 0.428375244140625, 0.44891357421875, 0.469451904296875, 0.489990234375, 0.510528564453125, 0.53106689453125, 0.551605224609375, 0.5721435546875, 0.592681884765625, 0.61322021484375, 0.633758544921875, 0.654296875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 7.0, 4.0, 6.0, 9.0, 18.0, 22.0, 22.0, 31.0, 29.0, 35.0, 49.0, 51.0, 43.0, 53.0, 44.0, 48.0, 43.0, 61.0, 56.0, 35.0, 49.0, 52.0, 37.0, 32.0, 32.0, 24.0, 25.0, 20.0, 12.0, 10.0, 16.0, 4.0, 6.0, 7.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.302490234375, -0.29277801513671875, -0.2830657958984375, -0.27335357666015625, -0.263641357421875, -0.25392913818359375, -0.2442169189453125, -0.23450469970703125, -0.22479248046875, -0.21508026123046875, -0.2053680419921875, -0.19565582275390625, -0.185943603515625, -0.17623138427734375, -0.1665191650390625, -0.15680694580078125, -0.1470947265625, -0.13738250732421875, -0.1276702880859375, -0.11795806884765625, -0.108245849609375, -0.09853363037109375, -0.0888214111328125, -0.07910919189453125, -0.06939697265625, -0.05968475341796875, -0.0499725341796875, -0.04026031494140625, -0.030548095703125, -0.02083587646484375, -0.0111236572265625, -0.00141143798828125, 0.00830078125, 0.01801300048828125, 0.0277252197265625, 0.03743743896484375, 0.047149658203125, 0.05686187744140625, 0.0665740966796875, 0.07628631591796875, 0.08599853515625, 0.09571075439453125, 0.1054229736328125, 0.11513519287109375, 0.124847412109375, 0.13455963134765625, 0.1442718505859375, 0.15398406982421875, 0.1636962890625, 0.17340850830078125, 0.1831207275390625, 0.19283294677734375, 0.202545166015625, 0.21225738525390625, 0.2219696044921875, 0.23168182373046875, 0.24139404296875, 0.25110626220703125, 0.2608184814453125, 0.27053070068359375, 0.280242919921875, 0.28995513916015625, 0.2996673583984375, 0.30937957763671875, 0.319091796875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 6.0, 11.0, 23.0, 24.0, 38.0, 59.0, 96.0, 122.0, 193.0, 349.0, 563.0, 1004.0, 1897.0, 3793.0, 8646.0, 22741.0, 118407.0, 782521.0, 75253.0, 18398.0, 7340.0, 3233.0, 1650.0, 842.0, 537.0, 292.0, 178.0, 128.0, 75.0, 39.0, 30.0, 28.0, 9.0, 10.0, 6.0, 5.0, 5.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22607421875, -0.21930503845214844, -0.21253585815429688, -0.2057666778564453, -0.19899749755859375, -0.1922283172607422, -0.18545913696289062, -0.17868995666503906, -0.1719207763671875, -0.16515159606933594, -0.15838241577148438, -0.1516132354736328, -0.14484405517578125, -0.1380748748779297, -0.13130569458007812, -0.12453651428222656, -0.117767333984375, -0.11099815368652344, -0.10422897338867188, -0.09745979309082031, -0.09069061279296875, -0.08392143249511719, -0.07715225219726562, -0.07038307189941406, -0.0636138916015625, -0.05684471130371094, -0.050075531005859375, -0.04330635070800781, -0.03653717041015625, -0.029767990112304688, -0.022998809814453125, -0.016229629516601562, -0.00946044921875, -0.0026912689208984375, 0.004077911376953125, 0.010847091674804688, 0.01761627197265625, 0.024385452270507812, 0.031154632568359375, 0.03792381286621094, 0.0446929931640625, 0.05146217346191406, 0.058231353759765625, 0.06500053405761719, 0.07176971435546875, 0.07853889465332031, 0.08530807495117188, 0.09207725524902344, 0.098846435546875, 0.10561561584472656, 0.11238479614257812, 0.11915397644042969, 0.12592315673828125, 0.1326923370361328, 0.13946151733398438, 0.14623069763183594, 0.1529998779296875, 0.15976905822753906, 0.16653823852539062, 0.1733074188232422, 0.18007659912109375, 0.1868457794189453, 0.19361495971679688, 0.20038414001464844, 0.2071533203125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 6.0, 4.0, 8.0, 7.0, 17.0, 18.0, 21.0, 48.0, 122.0, 269.0, 255.0, 81.0, 46.0, 24.0, 14.0, 17.0, 4.0, 11.0, 5.0, 6.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.0001430511474609375, -0.0001391703262925148, -0.0001352895051240921, -0.0001314086839556694, -0.0001275278627872467, -0.000123647041618824, -0.0001197662204504013, -0.00011588539928197861, -0.00011200457811355591, -0.00010812375694513321, -0.00010424293577671051, -0.00010036211460828781, -9.648129343986511e-05, -9.260047227144241e-05, -8.871965110301971e-05, -8.483882993459702e-05, -8.095800876617432e-05, -7.707718759775162e-05, -7.319636642932892e-05, -6.931554526090622e-05, -6.543472409248352e-05, -6.155390292406082e-05, -5.767308175563812e-05, -5.3792260587215424e-05, -4.9911439418792725e-05, -4.6030618250370026e-05, -4.214979708194733e-05, -3.826897591352463e-05, -3.438815474510193e-05, -3.050733357667923e-05, -2.662651240825653e-05, -2.2745691239833832e-05, -1.8864870071411133e-05, -1.4984048902988434e-05, -1.1103227734565735e-05, -7.222406566143036e-06, -3.341585397720337e-06, 5.392357707023621e-07, 4.420056939125061e-06, 8.30087810754776e-06, 1.2181699275970459e-05, 1.6062520444393158e-05, 1.9943341612815857e-05, 2.3824162781238556e-05, 2.7704983949661255e-05, 3.1585805118083954e-05, 3.546662628650665e-05, 3.934744745492935e-05, 4.322826862335205e-05, 4.710908979177475e-05, 5.098991096019745e-05, 5.487073212862015e-05, 5.875155329704285e-05, 6.263237446546555e-05, 6.651319563388824e-05, 7.039401680231094e-05, 7.427483797073364e-05, 7.815565913915634e-05, 8.203648030757904e-05, 8.591730147600174e-05, 8.979812264442444e-05, 9.367894381284714e-05, 9.755976498126984e-05, 0.00010144058614969254, 0.00010532140731811523]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 9.0, 8.0, 12.0, 26.0, 34.0, 51.0, 95.0, 181.0, 353.0, 885.0, 2664.0, 12362.0, 134874.0, 853854.0, 34799.0, 5679.0, 1478.0, 569.0, 255.0, 133.0, 78.0, 50.0, 34.0, 22.0, 21.0, 9.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.3623046875, -0.3517303466796875, -0.341156005859375, -0.3305816650390625, -0.32000732421875, -0.3094329833984375, -0.298858642578125, -0.2882843017578125, -0.2777099609375, -0.2671356201171875, -0.256561279296875, -0.2459869384765625, -0.23541259765625, -0.2248382568359375, -0.214263916015625, -0.2036895751953125, -0.193115234375, -0.1825408935546875, -0.171966552734375, -0.1613922119140625, -0.15081787109375, -0.1402435302734375, -0.129669189453125, -0.1190948486328125, -0.1085205078125, -0.0979461669921875, -0.087371826171875, -0.0767974853515625, -0.06622314453125, -0.0556488037109375, -0.045074462890625, -0.0345001220703125, -0.02392578125, -0.0133514404296875, -0.002777099609375, 0.0077972412109375, 0.01837158203125, 0.0289459228515625, 0.039520263671875, 0.0500946044921875, 0.0606689453125, 0.0712432861328125, 0.081817626953125, 0.0923919677734375, 0.10296630859375, 0.1135406494140625, 0.124114990234375, 0.1346893310546875, 0.145263671875, 0.1558380126953125, 0.166412353515625, 0.1769866943359375, 0.18756103515625, 0.1981353759765625, 0.208709716796875, 0.2192840576171875, 0.2298583984375, 0.2404327392578125, 0.251007080078125, 0.2615814208984375, 0.27215576171875, 0.2827301025390625, 0.293304443359375, 0.3038787841796875, 0.314453125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 6.0, 9.0, 2.0, 5.0, 16.0, 17.0, 19.0, 46.0, 82.0, 111.0, 145.0, 168.0, 130.0, 79.0, 50.0, 43.0, 22.0, 18.0, 12.0, 5.0, 3.0, 6.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.21533203125, -0.2074432373046875, -0.199554443359375, -0.1916656494140625, -0.18377685546875, -0.1758880615234375, -0.167999267578125, -0.1601104736328125, -0.1522216796875, -0.1443328857421875, -0.136444091796875, -0.1285552978515625, -0.12066650390625, -0.1127777099609375, -0.104888916015625, -0.0970001220703125, -0.089111328125, -0.0812225341796875, -0.073333740234375, -0.0654449462890625, -0.05755615234375, -0.0496673583984375, -0.041778564453125, -0.0338897705078125, -0.0260009765625, -0.0181121826171875, -0.010223388671875, -0.0023345947265625, 0.00555419921875, 0.0134429931640625, 0.021331787109375, 0.0292205810546875, 0.037109375, 0.0449981689453125, 0.052886962890625, 0.0607757568359375, 0.06866455078125, 0.0765533447265625, 0.084442138671875, 0.0923309326171875, 0.1002197265625, 0.1081085205078125, 0.115997314453125, 0.1238861083984375, 0.13177490234375, 0.1396636962890625, 0.147552490234375, 0.1554412841796875, 0.163330078125, 0.1712188720703125, 0.179107666015625, 0.1869964599609375, 0.19488525390625, 0.2027740478515625, 0.210662841796875, 0.2185516357421875, 0.2264404296875, 0.2343292236328125, 0.242218017578125, 0.2501068115234375, 0.25799560546875, 0.2658843994140625, 0.273773193359375, 0.2816619873046875, 0.28955078125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 2.0, 12.0, 8.0, 22.0, 74.0, 100.0, 222.0, 256.0, 109.0, 80.0, 41.0, 30.0, 10.0, 13.0, 3.0, 3.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5035598278045654, -3.374413013458252, -3.2452664375305176, -3.116119623184204, -2.9869730472564697, -2.8578262329101562, -2.728679656982422, -2.5995328426361084, -2.470386028289795, -2.3412392139434814, -2.212092638015747, -2.0829458236694336, -1.9537992477416992, -1.8246524333953857, -1.6955057382583618, -1.566359043121338, -1.4372124671936035, -1.3080657720565796, -1.1789190769195557, -1.0497722625732422, -0.920625627040863, -0.7914789319038391, -0.6623321771621704, -0.5331854820251465, -0.40403878688812256, -0.27489209175109863, -0.14574536681175232, -0.016598641872406006, 0.11254805326461792, 0.24169474840164185, 0.37084150314331055, 0.4999881982803345, 0.6291351318359375, 0.7582818269729614, 0.8874285221099854, 1.0165753364562988, 1.1457219123840332, 1.2748687267303467, 1.4040154218673706, 1.5331621170043945, 1.6623088121414185, 1.7914555072784424, 1.9206022024154663, 2.0497488975524902, 2.1788957118988037, 2.308042287826538, 2.4371891021728516, 2.566335678100586, 2.6954824924468994, 2.824629306793213, 2.9537758827209473, 3.0829226970672607, 3.212069272994995, 3.3412160873413086, 3.470362663269043, 3.5995094776153564, 3.72865629196167, 3.8578031063079834, 3.9869496822357178, 4.116096496582031, 4.245243072509766, 4.3743896484375, 4.503536701202393, 4.632683277130127, 4.761829853057861]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 5.0, 9.0, 6.0, 9.0, 11.0, 13.0, 12.0, 11.0, 19.0, 15.0, 33.0, 27.0, 21.0, 30.0, 39.0, 31.0, 36.0, 49.0, 74.0, 77.0, 66.0, 58.0, 39.0, 30.0, 24.0, 28.0, 26.0, 33.0, 21.0, 19.0, 23.0, 14.0, 14.0, 17.0, 15.0, 13.0, 5.0, 8.0, 4.0, 5.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 3.0], "bins": [-1.3352550268173218, -1.2987278699874878, -1.2622008323669434, -1.2256736755371094, -1.1891465187072754, -1.1526193618774414, -1.116092324256897, -1.079565167427063, -1.0430381298065186, -1.0065109729766846, -0.9699838757514954, -0.9334567785263062, -0.8969296216964722, -0.860402524471283, -0.8238754272460938, -0.7873482704162598, -0.7508211135864258, -0.7142940163612366, -0.6777668595314026, -0.6412397623062134, -0.6047126054763794, -0.5681855082511902, -0.531658411026001, -0.4951312839984894, -0.4586041569709778, -0.4220770299434662, -0.3855499029159546, -0.3490228056907654, -0.3124956786632538, -0.2759685516357422, -0.23944143950939178, -0.20291432738304138, -0.16638720035552979, -0.1298600733280182, -0.09333296120166779, -0.056805841624736786, -0.020278722047805786, 0.01624840497970581, 0.05277551710605621, 0.08930262923240662, 0.1258297562599182, 0.1623568832874298, 0.1988839954137802, 0.23541110754013062, 0.2719382345676422, 0.3084653615951538, 0.344992458820343, 0.3815195858478546, 0.4180467128753662, 0.4545738399028778, 0.4911009669303894, 0.5276280641555786, 0.5641552209854126, 0.6006823182106018, 0.637209415435791, 0.673736572265625, 0.7102636694908142, 0.7467907667160034, 0.7833179235458374, 0.8198450207710266, 0.8563721179962158, 0.8928992748260498, 0.929426372051239, 0.9659534692764282, 1.0024806261062622]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 2.0, 9.0, 8.0, 8.0, 9.0, 24.0, 28.0, 30.0, 51.0, 58.0, 127.0, 200.0, 306.0, 562.0, 1133.0, 2219.0, 4623.0, 11679.0, 35243.0, 177665.0, 1974516.0, 1765451.0, 165069.0, 34445.0, 11531.0, 4749.0, 2116.0, 1061.0, 569.0, 291.0, 175.0, 103.0, 65.0, 37.0, 36.0, 29.0, 12.0, 12.0, 8.0, 7.0, 5.0, 6.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.12841796875, -0.1236572265625, -0.118896484375, -0.1141357421875, -0.109375, -0.1046142578125, -0.099853515625, -0.0950927734375, -0.09033203125, -0.0855712890625, -0.080810546875, -0.0760498046875, -0.0712890625, -0.0665283203125, -0.061767578125, -0.0570068359375, -0.05224609375, -0.0474853515625, -0.042724609375, -0.0379638671875, -0.033203125, -0.0284423828125, -0.023681640625, -0.0189208984375, -0.01416015625, -0.0093994140625, -0.004638671875, 0.0001220703125, 0.0048828125, 0.0096435546875, 0.014404296875, 0.0191650390625, 0.02392578125, 0.0286865234375, 0.033447265625, 0.0382080078125, 0.04296875, 0.0477294921875, 0.052490234375, 0.0572509765625, 0.06201171875, 0.0667724609375, 0.071533203125, 0.0762939453125, 0.0810546875, 0.0858154296875, 0.090576171875, 0.0953369140625, 0.10009765625, 0.1048583984375, 0.109619140625, 0.1143798828125, 0.119140625, 0.1239013671875, 0.128662109375, 0.1334228515625, 0.13818359375, 0.1429443359375, 0.147705078125, 0.1524658203125, 0.1572265625, 0.1619873046875, 0.166748046875, 0.1715087890625, 0.17626953125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 5.0, 3.0, 5.0, 10.0, 12.0, 20.0, 15.0, 19.0, 16.0, 28.0, 32.0, 28.0, 36.0, 40.0, 49.0, 59.0, 56.0, 58.0, 50.0, 58.0, 54.0, 45.0, 41.0, 49.0, 42.0, 26.0, 32.0, 32.0, 21.0, 18.0, 6.0, 12.0, 11.0, 3.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08648681640625, -0.08394908905029297, -0.08141136169433594, -0.0788736343383789, -0.07633590698242188, -0.07379817962646484, -0.07126045227050781, -0.06872272491455078, -0.06618499755859375, -0.06364727020263672, -0.06110954284667969, -0.058571815490722656, -0.056034088134765625, -0.053496360778808594, -0.05095863342285156, -0.04842090606689453, -0.0458831787109375, -0.04334545135498047, -0.04080772399902344, -0.038269996643066406, -0.035732269287109375, -0.033194541931152344, -0.030656814575195312, -0.02811908721923828, -0.02558135986328125, -0.02304363250732422, -0.020505905151367188, -0.017968177795410156, -0.015430450439453125, -0.012892723083496094, -0.010354995727539062, -0.007817268371582031, -0.005279541015625, -0.0027418136596679688, -0.0002040863037109375, 0.0023336410522460938, 0.004871368408203125, 0.007409095764160156, 0.009946823120117188, 0.012484550476074219, 0.01502227783203125, 0.01756000518798828, 0.020097732543945312, 0.022635459899902344, 0.025173187255859375, 0.027710914611816406, 0.030248641967773438, 0.03278636932373047, 0.0353240966796875, 0.03786182403564453, 0.04039955139160156, 0.042937278747558594, 0.045475006103515625, 0.048012733459472656, 0.05055046081542969, 0.05308818817138672, 0.05562591552734375, 0.05816364288330078, 0.06070137023925781, 0.06323909759521484, 0.06577682495117188, 0.0683145523071289, 0.07085227966308594, 0.07339000701904297, 0.075927734375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 9.0, 6.0, 16.0, 25.0, 21.0, 19.0, 39.0, 50.0, 83.0, 104.0, 153.0, 189.0, 334.0, 723.0, 3337.0, 84016.0, 4064993.0, 35723.0, 2431.0, 788.0, 378.0, 250.0, 163.0, 109.0, 72.0, 54.0, 51.0, 34.0, 24.0, 21.0, 17.0, 12.0, 8.0, 6.0, 4.0, 2.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.744140625, -0.7211761474609375, -0.698211669921875, -0.6752471923828125, -0.65228271484375, -0.6293182373046875, -0.606353759765625, -0.5833892822265625, -0.5604248046875, -0.5374603271484375, -0.514495849609375, -0.4915313720703125, -0.46856689453125, -0.4456024169921875, -0.422637939453125, -0.3996734619140625, -0.376708984375, -0.3537445068359375, -0.330780029296875, -0.3078155517578125, -0.28485107421875, -0.2618865966796875, -0.238922119140625, -0.2159576416015625, -0.1929931640625, -0.1700286865234375, -0.147064208984375, -0.1240997314453125, -0.10113525390625, -0.0781707763671875, -0.055206298828125, -0.0322418212890625, -0.00927734375, 0.0136871337890625, 0.036651611328125, 0.0596160888671875, 0.08258056640625, 0.1055450439453125, 0.128509521484375, 0.1514739990234375, 0.1744384765625, 0.1974029541015625, 0.220367431640625, 0.2433319091796875, 0.26629638671875, 0.2892608642578125, 0.312225341796875, 0.3351898193359375, 0.358154296875, 0.3811187744140625, 0.404083251953125, 0.4270477294921875, 0.45001220703125, 0.4729766845703125, 0.495941162109375, 0.5189056396484375, 0.5418701171875, 0.5648345947265625, 0.587799072265625, 0.6107635498046875, 0.63372802734375, 0.6566925048828125, 0.679656982421875, 0.7026214599609375, 0.7255859375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 12.0, 25.0, 41.0, 109.0, 336.0, 1199.0, 1582.0, 481.0, 170.0, 63.0, 39.0, 11.0, 8.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4306640625, -0.4128265380859375, -0.394989013671875, -0.3771514892578125, -0.35931396484375, -0.3414764404296875, -0.323638916015625, -0.3058013916015625, -0.2879638671875, -0.2701263427734375, -0.252288818359375, -0.2344512939453125, -0.21661376953125, -0.1987762451171875, -0.180938720703125, -0.1631011962890625, -0.145263671875, -0.1274261474609375, -0.109588623046875, -0.0917510986328125, -0.07391357421875, -0.0560760498046875, -0.038238525390625, -0.0204010009765625, -0.0025634765625, 0.0152740478515625, 0.033111572265625, 0.0509490966796875, 0.06878662109375, 0.0866241455078125, 0.104461669921875, 0.1222991943359375, 0.14013671875, 0.1579742431640625, 0.175811767578125, 0.1936492919921875, 0.21148681640625, 0.2293243408203125, 0.247161865234375, 0.2649993896484375, 0.2828369140625, 0.3006744384765625, 0.318511962890625, 0.3363494873046875, 0.35418701171875, 0.3720245361328125, 0.389862060546875, 0.4076995849609375, 0.425537109375, 0.4433746337890625, 0.461212158203125, 0.4790496826171875, 0.49688720703125, 0.5147247314453125, 0.532562255859375, 0.5503997802734375, 0.5682373046875, 0.5860748291015625, 0.603912353515625, 0.6217498779296875, 0.63958740234375, 0.6574249267578125, 0.675262451171875, 0.6930999755859375, 0.7109375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 3.0, 5.0, 9.0, 13.0, 29.0, 66.0, 162.0, 267.0, 244.0, 112.0, 40.0, 22.0, 11.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.190310478210449, -4.0334672927856445, -3.876624345779419, -3.7197813987731934, -3.5629382133483887, -3.406095027923584, -3.2492520809173584, -3.092409133911133, -2.935565948486328, -2.7787227630615234, -2.621879816055298, -2.4650368690490723, -2.3081936836242676, -2.151350498199463, -1.9945075511932373, -1.8376644849777222, -1.680821418762207, -1.523978352546692, -1.3671352863311768, -1.2102922201156616, -1.0534491539001465, -0.8966060876846313, -0.7397630214691162, -0.5829199552536011, -0.42607688903808594, -0.2692338228225708, -0.11239075660705566, 0.04445230960845947, 0.2012953758239746, 0.35813844203948975, 0.5149815082550049, 0.67182457447052, 0.8286676406860352, 0.9855107069015503, 1.1423537731170654, 1.2991968393325806, 1.4560399055480957, 1.6128829717636108, 1.769726037979126, 1.9265691041946411, 2.0834121704101562, 2.240255355834961, 2.3970983028411865, 2.553941249847412, 2.710784435272217, 2.8676276206970215, 3.024470567703247, 3.1813135147094727, 3.3381567001342773, 3.494999885559082, 3.6518428325653076, 3.808685779571533, 3.965528964996338, 4.122372150421143, 4.279214859008789, 4.436058044433594, 4.592901229858398, 4.749744415283203, 4.906587600708008, 5.063430309295654, 5.220273494720459, 5.377116680145264, 5.53395938873291, 5.690802574157715, 5.8476457595825195]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 7.0, 5.0, 4.0, 6.0, 8.0, 16.0, 12.0, 21.0, 25.0, 34.0, 31.0, 30.0, 50.0, 56.0, 52.0, 56.0, 43.0, 59.0, 70.0, 60.0, 47.0, 60.0, 48.0, 42.0, 24.0, 27.0, 20.0, 22.0, 14.0, 13.0, 10.0, 13.0, 7.0, 3.0, 8.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6395113468170166, -1.5903328657150269, -1.541154384613037, -1.4919759035110474, -1.4427974224090576, -1.3936189413070679, -1.3444404602050781, -1.2952619791030884, -1.2460834980010986, -1.1969050168991089, -1.1477265357971191, -1.0985480546951294, -1.0493695735931396, -1.00019109249115, -0.9510126113891602, -0.9018341302871704, -0.8526556491851807, -0.8034771680831909, -0.7542986869812012, -0.7051202058792114, -0.6559417247772217, -0.6067632436752319, -0.5575847625732422, -0.5084062814712524, -0.4592278003692627, -0.41004931926727295, -0.3608708381652832, -0.31169235706329346, -0.2625138759613037, -0.21333539485931396, -0.16415691375732422, -0.11497843265533447, -0.06579983234405518, -0.01662135124206543, 0.032557129859924316, 0.08173561096191406, 0.1309140920639038, 0.18009257316589355, 0.2292710542678833, 0.27844953536987305, 0.3276280164718628, 0.37680649757385254, 0.4259849786758423, 0.47516345977783203, 0.5243419408798218, 0.5735204219818115, 0.6226989030838013, 0.671877384185791, 0.7210558652877808, 0.7702343463897705, 0.8194128274917603, 0.86859130859375, 0.9177697896957397, 0.9669482707977295, 1.0161267518997192, 1.065305233001709, 1.1144837141036987, 1.1636621952056885, 1.2128406763076782, 1.262019157409668, 1.3111976385116577, 1.3603761196136475, 1.4095546007156372, 1.458733081817627, 1.5079115629196167]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 11.0, 22.0, 25.0, 39.0, 53.0, 91.0, 144.0, 205.0, 313.0, 557.0, 921.0, 1711.0, 3566.0, 7363.0, 16578.0, 42279.0, 118562.0, 296826.0, 329048.0, 142848.0, 50774.0, 19699.0, 8345.0, 3984.0, 1973.0, 1075.0, 586.0, 339.0, 232.0, 109.0, 95.0, 66.0, 46.0, 25.0, 20.0, 10.0, 4.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1571044921875, -0.15108299255371094, -0.14506149291992188, -0.1390399932861328, -0.13301849365234375, -0.1269969940185547, -0.12097549438476562, -0.11495399475097656, -0.1089324951171875, -0.10291099548339844, -0.09688949584960938, -0.09086799621582031, -0.08484649658203125, -0.07882499694824219, -0.07280349731445312, -0.06678199768066406, -0.060760498046875, -0.05473899841308594, -0.048717498779296875, -0.04269599914550781, -0.03667449951171875, -0.030652999877929688, -0.024631500244140625, -0.018610000610351562, -0.0125885009765625, -0.0065670013427734375, -0.000545501708984375, 0.0054759979248046875, 0.01149749755859375, 0.017518997192382812, 0.023540496826171875, 0.029561996459960938, 0.03558349609375, 0.04160499572753906, 0.047626495361328125, 0.05364799499511719, 0.05966949462890625, 0.06569099426269531, 0.07171249389648438, 0.07773399353027344, 0.0837554931640625, 0.08977699279785156, 0.09579849243164062, 0.10181999206542969, 0.10784149169921875, 0.11386299133300781, 0.11988449096679688, 0.12590599060058594, 0.131927490234375, 0.13794898986816406, 0.14397048950195312, 0.1499919891357422, 0.15601348876953125, 0.1620349884033203, 0.16805648803710938, 0.17407798767089844, 0.1800994873046875, 0.18612098693847656, 0.19214248657226562, 0.1981639862060547, 0.20418548583984375, 0.2102069854736328, 0.21622848510742188, 0.22224998474121094, 0.228271484375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 5.0, 2.0, 0.0, 4.0, 4.0, 1.0, 3.0, 4.0, 6.0, 4.0, 3.0, 6.0, 11.0, 6.0, 8.0, 12.0, 12.0, 18.0, 19.0, 20.0, 24.0, 44.0, 31.0, 33.0, 38.0, 32.0, 36.0, 43.0, 43.0, 42.0, 43.0, 43.0, 39.0, 31.0, 39.0, 40.0, 39.0, 28.0, 21.0, 32.0, 22.0, 17.0, 16.0, 13.0, 16.0, 19.0, 10.0, 4.0, 8.0, 6.0, 1.0, 1.0, 4.0, 3.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0], "bins": [-0.0872802734375, -0.0847015380859375, -0.082122802734375, -0.0795440673828125, -0.07696533203125, -0.0743865966796875, -0.071807861328125, -0.0692291259765625, -0.066650390625, -0.0640716552734375, -0.061492919921875, -0.0589141845703125, -0.05633544921875, -0.0537567138671875, -0.051177978515625, -0.0485992431640625, -0.0460205078125, -0.0434417724609375, -0.040863037109375, -0.0382843017578125, -0.03570556640625, -0.0331268310546875, -0.030548095703125, -0.0279693603515625, -0.025390625, -0.0228118896484375, -0.020233154296875, -0.0176544189453125, -0.01507568359375, -0.0124969482421875, -0.009918212890625, -0.0073394775390625, -0.0047607421875, -0.0021820068359375, 0.000396728515625, 0.0029754638671875, 0.00555419921875, 0.0081329345703125, 0.010711669921875, 0.0132904052734375, 0.015869140625, 0.0184478759765625, 0.021026611328125, 0.0236053466796875, 0.02618408203125, 0.0287628173828125, 0.031341552734375, 0.0339202880859375, 0.0364990234375, 0.0390777587890625, 0.041656494140625, 0.0442352294921875, 0.04681396484375, 0.0493927001953125, 0.051971435546875, 0.0545501708984375, 0.05712890625, 0.0597076416015625, 0.062286376953125, 0.0648651123046875, 0.06744384765625, 0.0700225830078125, 0.072601318359375, 0.0751800537109375, 0.0777587890625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 6.0, 14.0, 34.0, 37.0, 54.0, 147.0, 327.0, 713.0, 1747.0, 6135.0, 36435.0, 678990.0, 295040.0, 22026.0, 4345.0, 1455.0, 562.0, 223.0, 135.0, 47.0, 29.0, 28.0, 11.0, 5.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59326171875, -0.5740509033203125, -0.554840087890625, -0.5356292724609375, -0.51641845703125, -0.4972076416015625, -0.477996826171875, -0.4587860107421875, -0.4395751953125, -0.4203643798828125, -0.401153564453125, -0.3819427490234375, -0.36273193359375, -0.3435211181640625, -0.324310302734375, -0.3050994873046875, -0.285888671875, -0.2666778564453125, -0.247467041015625, -0.2282562255859375, -0.20904541015625, -0.1898345947265625, -0.170623779296875, -0.1514129638671875, -0.1322021484375, -0.1129913330078125, -0.093780517578125, -0.0745697021484375, -0.05535888671875, -0.0361480712890625, -0.016937255859375, 0.0022735595703125, 0.021484375, 0.0406951904296875, 0.059906005859375, 0.0791168212890625, 0.09832763671875, 0.1175384521484375, 0.136749267578125, 0.1559600830078125, 0.1751708984375, 0.1943817138671875, 0.213592529296875, 0.2328033447265625, 0.25201416015625, 0.2712249755859375, 0.290435791015625, 0.3096466064453125, 0.328857421875, 0.3480682373046875, 0.367279052734375, 0.3864898681640625, 0.40570068359375, 0.4249114990234375, 0.444122314453125, 0.4633331298828125, 0.4825439453125, 0.5017547607421875, 0.520965576171875, 0.5401763916015625, 0.55938720703125, 0.5785980224609375, 0.597808837890625, 0.6170196533203125, 0.63623046875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 8.0, 4.0, 9.0, 8.0, 9.0, 13.0, 19.0, 14.0, 13.0, 18.0, 35.0, 45.0, 48.0, 62.0, 65.0, 70.0, 57.0, 66.0, 62.0, 50.0, 58.0, 56.0, 51.0, 33.0, 22.0, 29.0, 22.0, 9.0, 13.0, 10.0, 9.0, 7.0, 3.0, 5.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.462158203125, -0.4453620910644531, -0.42856597900390625, -0.4117698669433594, -0.3949737548828125, -0.3781776428222656, -0.36138153076171875, -0.3445854187011719, -0.327789306640625, -0.3109931945800781, -0.29419708251953125, -0.2774009704589844, -0.2606048583984375, -0.24380874633789062, -0.22701263427734375, -0.21021652221679688, -0.19342041015625, -0.17662429809570312, -0.15982818603515625, -0.14303207397460938, -0.1262359619140625, -0.10943984985351562, -0.09264373779296875, -0.07584762573242188, -0.059051513671875, -0.042255401611328125, -0.02545928955078125, -0.008663177490234375, 0.0081329345703125, 0.024929046630859375, 0.04172515869140625, 0.058521270751953125, 0.0753173828125, 0.09211349487304688, 0.10890960693359375, 0.12570571899414062, 0.1425018310546875, 0.15929794311523438, 0.17609405517578125, 0.19289016723632812, 0.209686279296875, 0.22648239135742188, 0.24327850341796875, 0.2600746154785156, 0.2768707275390625, 0.2936668395996094, 0.31046295166015625, 0.3272590637207031, 0.34405517578125, 0.3608512878417969, 0.37764739990234375, 0.3944435119628906, 0.4112396240234375, 0.4280357360839844, 0.44483184814453125, 0.4616279602050781, 0.478424072265625, 0.4952201843261719, 0.5120162963867188, 0.5288124084472656, 0.5456085205078125, 0.5624046325683594, 0.5792007446289062, 0.5959968566894531, 0.61279296875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 3.0, 2.0, 9.0, 8.0, 16.0, 16.0, 34.0, 30.0, 52.0, 78.0, 133.0, 187.0, 329.0, 515.0, 954.0, 1762.0, 3480.0, 7816.0, 19647.0, 60009.0, 282029.0, 551141.0, 78045.0, 24220.0, 9286.0, 4145.0, 1931.0, 1088.0, 609.0, 370.0, 198.0, 127.0, 88.0, 54.0, 46.0, 37.0, 20.0, 15.0, 9.0, 7.0, 2.0, 7.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.1707763671875, -0.1656169891357422, -0.16045761108398438, -0.15529823303222656, -0.15013885498046875, -0.14497947692871094, -0.13982009887695312, -0.1346607208251953, -0.1295013427734375, -0.12434196472167969, -0.11918258666992188, -0.11402320861816406, -0.10886383056640625, -0.10370445251464844, -0.09854507446289062, -0.09338569641113281, -0.088226318359375, -0.08306694030761719, -0.07790756225585938, -0.07274818420410156, -0.06758880615234375, -0.06242942810058594, -0.057270050048828125, -0.05211067199707031, -0.0469512939453125, -0.04179191589355469, -0.036632537841796875, -0.03147315979003906, -0.02631378173828125, -0.021154403686523438, -0.015995025634765625, -0.010835647583007812, -0.00567626953125, -0.0005168914794921875, 0.004642486572265625, 0.009801864624023438, 0.01496124267578125, 0.020120620727539062, 0.025279998779296875, 0.030439376831054688, 0.0355987548828125, 0.04075813293457031, 0.045917510986328125, 0.05107688903808594, 0.05623626708984375, 0.06139564514160156, 0.06655502319335938, 0.07171440124511719, 0.076873779296875, 0.08203315734863281, 0.08719253540039062, 0.09235191345214844, 0.09751129150390625, 0.10267066955566406, 0.10783004760742188, 0.11298942565917969, 0.1181488037109375, 0.12330818176269531, 0.12846755981445312, 0.13362693786621094, 0.13878631591796875, 0.14394569396972656, 0.14910507202148438, 0.1542644500732422, 0.159423828125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 8.0, 5.0, 8.0, 8.0, 9.0, 8.0, 10.0, 24.0, 24.0, 36.0, 50.0, 69.0, 96.0, 116.0, 128.0, 109.0, 79.0, 57.0, 39.0, 29.0, 20.0, 14.0, 16.0, 9.0, 8.0, 4.0, 3.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.830692291259766e-05, -6.611272692680359e-05, -6.391853094100952e-05, -6.172433495521545e-05, -5.953013896942139e-05, -5.733594298362732e-05, -5.514174699783325e-05, -5.2947551012039185e-05, -5.075335502624512e-05, -4.855915904045105e-05, -4.636496305465698e-05, -4.4170767068862915e-05, -4.197657108306885e-05, -3.978237509727478e-05, -3.758817911148071e-05, -3.5393983125686646e-05, -3.319978713989258e-05, -3.100559115409851e-05, -2.8811395168304443e-05, -2.6617199182510376e-05, -2.442300319671631e-05, -2.222880721092224e-05, -2.0034611225128174e-05, -1.7840415239334106e-05, -1.564621925354004e-05, -1.3452023267745972e-05, -1.1257827281951904e-05, -9.063631296157837e-06, -6.8694353103637695e-06, -4.675239324569702e-06, -2.4810433387756348e-06, -2.868473529815674e-07, 1.9073486328125e-06, 4.101544618606567e-06, 6.295740604400635e-06, 8.489936590194702e-06, 1.068413257598877e-05, 1.2878328561782837e-05, 1.5072524547576904e-05, 1.726672053337097e-05, 1.946091651916504e-05, 2.1655112504959106e-05, 2.3849308490753174e-05, 2.604350447654724e-05, 2.823770046234131e-05, 3.0431896448135376e-05, 3.262609243392944e-05, 3.482028841972351e-05, 3.701448440551758e-05, 3.9208680391311646e-05, 4.140287637710571e-05, 4.359707236289978e-05, 4.579126834869385e-05, 4.7985464334487915e-05, 5.017966032028198e-05, 5.237385630607605e-05, 5.456805229187012e-05, 5.6762248277664185e-05, 5.895644426345825e-05, 6.115064024925232e-05, 6.334483623504639e-05, 6.553903222084045e-05, 6.773322820663452e-05, 6.992742419242859e-05, 7.212162017822266e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 12.0, 13.0, 17.0, 23.0, 55.0, 72.0, 123.0, 201.0, 385.0, 715.0, 1574.0, 3631.0, 9990.0, 33069.0, 144300.0, 661879.0, 143335.0, 32193.0, 10069.0, 3719.0, 1544.0, 759.0, 345.0, 183.0, 124.0, 73.0, 53.0, 28.0, 26.0, 12.0, 6.0, 8.0, 4.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1663818359375, -0.16054344177246094, -0.15470504760742188, -0.1488666534423828, -0.14302825927734375, -0.1371898651123047, -0.13135147094726562, -0.12551307678222656, -0.1196746826171875, -0.11383628845214844, -0.10799789428710938, -0.10215950012207031, -0.09632110595703125, -0.09048271179199219, -0.08464431762695312, -0.07880592346191406, -0.072967529296875, -0.06712913513183594, -0.061290740966796875, -0.05545234680175781, -0.04961395263671875, -0.04377555847167969, -0.037937164306640625, -0.03209877014160156, -0.0262603759765625, -0.020421981811523438, -0.014583587646484375, -0.008745193481445312, -0.00290679931640625, 0.0029315948486328125, 0.008769989013671875, 0.014608383178710938, 0.02044677734375, 0.026285171508789062, 0.032123565673828125, 0.03796195983886719, 0.04380035400390625, 0.04963874816894531, 0.055477142333984375, 0.06131553649902344, 0.0671539306640625, 0.07299232482910156, 0.07883071899414062, 0.08466911315917969, 0.09050750732421875, 0.09634590148925781, 0.10218429565429688, 0.10802268981933594, 0.113861083984375, 0.11969947814941406, 0.12553787231445312, 0.1313762664794922, 0.13721466064453125, 0.1430530548095703, 0.14889144897460938, 0.15472984313964844, 0.1605682373046875, 0.16640663146972656, 0.17224502563476562, 0.1780834197998047, 0.18392181396484375, 0.1897602081298828, 0.19559860229492188, 0.20143699645996094, 0.207275390625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 7.0, 5.0, 10.0, 4.0, 8.0, 7.0, 14.0, 12.0, 18.0, 26.0, 33.0, 42.0, 48.0, 53.0, 92.0, 100.0, 113.0, 80.0, 68.0, 54.0, 47.0, 41.0, 22.0, 26.0, 22.0, 16.0, 12.0, 8.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.186279296875, -0.1808300018310547, -0.17538070678710938, -0.16993141174316406, -0.16448211669921875, -0.15903282165527344, -0.15358352661132812, -0.1481342315673828, -0.1426849365234375, -0.1372356414794922, -0.13178634643554688, -0.12633705139160156, -0.12088775634765625, -0.11543846130371094, -0.10998916625976562, -0.10453987121582031, -0.099090576171875, -0.09364128112792969, -0.08819198608398438, -0.08274269104003906, -0.07729339599609375, -0.07184410095214844, -0.06639480590820312, -0.06094551086425781, -0.0554962158203125, -0.05004692077636719, -0.044597625732421875, -0.03914833068847656, -0.03369903564453125, -0.028249740600585938, -0.022800445556640625, -0.017351150512695312, -0.01190185546875, -0.0064525604248046875, -0.001003265380859375, 0.0044460296630859375, 0.00989532470703125, 0.015344619750976562, 0.020793914794921875, 0.026243209838867188, 0.0316925048828125, 0.03714179992675781, 0.042591094970703125, 0.04804039001464844, 0.05348968505859375, 0.05893898010253906, 0.06438827514648438, 0.06983757019042969, 0.075286865234375, 0.08073616027832031, 0.08618545532226562, 0.09163475036621094, 0.09708404541015625, 0.10253334045410156, 0.10798263549804688, 0.11343193054199219, 0.1188812255859375, 0.12433052062988281, 0.12977981567382812, 0.13522911071777344, 0.14067840576171875, 0.14612770080566406, 0.15157699584960938, 0.1570262908935547, 0.1624755859375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 9.0, 22.0, 22.0, 72.0, 133.0, 293.0, 273.0, 100.0, 45.0, 17.0, 13.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.506662368774414, -9.323845863342285, -9.141029357910156, -8.958213806152344, -8.775397300720215, -8.592580795288086, -8.409764289855957, -8.226947784423828, -8.044132232666016, -7.861315727233887, -7.678499698638916, -7.495683193206787, -7.312867164611816, -7.1300506591796875, -6.947234153747559, -6.764418125152588, -6.581601142883301, -6.398784637451172, -6.215968608856201, -6.033152103424072, -5.850336074829102, -5.667519569396973, -5.484703063964844, -5.301887035369873, -5.119071006774902, -4.936254501342773, -4.753438472747803, -4.570621967315674, -4.387805938720703, -4.204989433288574, -4.022172927856445, -3.8393568992614746, -3.6565403938293457, -3.473724126815796, -3.290907859802246, -3.108091354370117, -2.9252750873565674, -2.7424588203430176, -2.5596425533294678, -2.376826286315918, -2.194009780883789, -2.0111935138702393, -1.8283771276474, -1.64556086063385, -1.4627444744110107, -1.279928207397461, -1.0971119403839111, -0.9142955541610718, -0.7314794063568115, -0.5486630797386169, -0.36584678292274475, -0.18303048610687256, -0.00021415948867797852, 0.1826021671295166, 0.3654184341430664, 0.5482348203659058, 0.7310510873794556, 0.9138674139976501, 1.0966837406158447, 1.2795000076293945, 1.4623162746429443, 1.6451326608657837, 1.8279489278793335, 2.010765314102173, 2.1935815811157227]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 7.0, 15.0, 3.0, 6.0, 10.0, 12.0, 12.0, 11.0, 23.0, 15.0, 18.0, 27.0, 27.0, 29.0, 36.0, 46.0, 40.0, 44.0, 94.0, 102.0, 77.0, 58.0, 44.0, 34.0, 34.0, 27.0, 24.0, 19.0, 18.0, 21.0, 18.0, 12.0, 14.0, 3.0, 3.0, 7.0, 3.0, 1.0, 6.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.229391574859619, -2.156015634536743, -2.082639694213867, -2.009263753890991, -1.9358878135681152, -1.8625118732452393, -1.7891359329223633, -1.7157599925994873, -1.6423840522766113, -1.5690081119537354, -1.4956321716308594, -1.4222562313079834, -1.3488802909851074, -1.2755043506622314, -1.2021284103393555, -1.1287524700164795, -1.055376648902893, -0.9820007085800171, -0.9086247682571411, -0.8352488279342651, -0.7618728876113892, -0.6884969472885132, -0.615121066570282, -0.541745126247406, -0.46836918592453003, -0.39499324560165405, -0.3216173052787781, -0.2482413947582245, -0.1748654544353485, -0.10148951411247253, -0.028113603591918945, 0.04526233673095703, 0.11863827705383301, 0.19201421737670898, 0.26539015769958496, 0.33876606822013855, 0.4121420085430145, 0.4855179488658905, 0.5588938593864441, 0.6322697997093201, 0.705645740032196, 0.779021680355072, 0.852397620677948, 0.9257735013961792, 0.9991494417190552, 1.0725253820419312, 1.1459013223648071, 1.219277262687683, 1.292653203010559, 1.366029143333435, 1.439405083656311, 1.512781023979187, 1.586156964302063, 1.659532904624939, 1.7329087257385254, 1.8062846660614014, 1.8796606063842773, 1.9530365467071533, 2.0264124870300293, 2.0997884273529053, 2.1731643676757812, 2.2465403079986572, 2.319916248321533, 2.393292188644409, 2.466668128967285]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 5.0, 3.0, 8.0, 13.0, 15.0, 22.0, 45.0, 62.0, 109.0, 159.0, 229.0, 416.0, 626.0, 1127.0, 2003.0, 3982.0, 8446.0, 21104.0, 72434.0, 515749.0, 2701538.0, 724299.0, 97517.0, 25140.0, 9751.0, 4401.0, 2167.0, 1191.0, 679.0, 400.0, 236.0, 120.0, 101.0, 61.0, 42.0, 36.0, 14.0, 8.0, 7.0, 8.0, 8.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1351318359375, -0.12963294982910156, -0.12413406372070312, -0.11863517761230469, -0.11313629150390625, -0.10763740539550781, -0.10213851928710938, -0.09663963317871094, -0.0911407470703125, -0.08564186096191406, -0.08014297485351562, -0.07464408874511719, -0.06914520263671875, -0.06364631652832031, -0.058147430419921875, -0.05264854431152344, -0.047149658203125, -0.04165077209472656, -0.036151885986328125, -0.030652999877929688, -0.02515411376953125, -0.019655227661132812, -0.014156341552734375, -0.008657455444335938, -0.0031585693359375, 0.0023403167724609375, 0.007839202880859375, 0.013338088989257812, 0.01883697509765625, 0.024335861206054688, 0.029834747314453125, 0.03533363342285156, 0.04083251953125, 0.04633140563964844, 0.051830291748046875, 0.05732917785644531, 0.06282806396484375, 0.06832695007324219, 0.07382583618164062, 0.07932472229003906, 0.0848236083984375, 0.09032249450683594, 0.09582138061523438, 0.10132026672363281, 0.10681915283203125, 0.11231803894042969, 0.11781692504882812, 0.12331581115722656, 0.128814697265625, 0.13431358337402344, 0.13981246948242188, 0.1453113555908203, 0.15081024169921875, 0.1563091278076172, 0.16180801391601562, 0.16730690002441406, 0.1728057861328125, 0.17830467224121094, 0.18380355834960938, 0.1893024444580078, 0.19480133056640625, 0.2003002166748047, 0.20579910278320312, 0.21129798889160156, 0.216796875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 7.0, 4.0, 3.0, 7.0, 8.0, 10.0, 8.0, 10.0, 15.0, 16.0, 24.0, 28.0, 28.0, 43.0, 36.0, 38.0, 64.0, 51.0, 55.0, 67.0, 54.0, 45.0, 42.0, 60.0, 53.0, 41.0, 36.0, 32.0, 22.0, 25.0, 18.0, 15.0, 14.0, 5.0, 7.0, 3.0, 1.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.1282958984375, -0.12468624114990234, -0.12107658386230469, -0.11746692657470703, -0.11385726928710938, -0.11024761199951172, -0.10663795471191406, -0.1030282974243164, -0.09941864013671875, -0.0958089828491211, -0.09219932556152344, -0.08858966827392578, -0.08498001098632812, -0.08137035369873047, -0.07776069641113281, -0.07415103912353516, -0.0705413818359375, -0.06693172454833984, -0.06332206726074219, -0.05971240997314453, -0.056102752685546875, -0.05249309539794922, -0.04888343811035156, -0.045273780822753906, -0.04166412353515625, -0.038054466247558594, -0.03444480895996094, -0.03083515167236328, -0.027225494384765625, -0.02361583709716797, -0.020006179809570312, -0.016396522521972656, -0.012786865234375, -0.009177207946777344, -0.0055675506591796875, -0.0019578933715820312, 0.001651763916015625, 0.005261421203613281, 0.008871078491210938, 0.012480735778808594, 0.01609039306640625, 0.019700050354003906, 0.023309707641601562, 0.02691936492919922, 0.030529022216796875, 0.03413867950439453, 0.03774833679199219, 0.041357994079589844, 0.0449676513671875, 0.048577308654785156, 0.05218696594238281, 0.05579662322998047, 0.059406280517578125, 0.06301593780517578, 0.06662559509277344, 0.0702352523803711, 0.07384490966796875, 0.0774545669555664, 0.08106422424316406, 0.08467388153076172, 0.08828353881835938, 0.09189319610595703, 0.09550285339355469, 0.09911251068115234, 0.10272216796875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 6.0, 7.0, 27.0, 50.0, 99.0, 206.0, 467.0, 1663.0, 36054.0, 4110738.0, 42155.0, 1899.0, 472.0, 235.0, 103.0, 51.0, 31.0, 9.0, 10.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.115234375, -1.0786895751953125, -1.042144775390625, -1.0055999755859375, -0.96905517578125, -0.9325103759765625, -0.895965576171875, -0.8594207763671875, -0.8228759765625, -0.7863311767578125, -0.749786376953125, -0.7132415771484375, -0.67669677734375, -0.6401519775390625, -0.603607177734375, -0.5670623779296875, -0.530517578125, -0.4939727783203125, -0.457427978515625, -0.4208831787109375, -0.38433837890625, -0.3477935791015625, -0.311248779296875, -0.2747039794921875, -0.2381591796875, -0.2016143798828125, -0.165069580078125, -0.1285247802734375, -0.09197998046875, -0.0554351806640625, -0.018890380859375, 0.0176544189453125, 0.05419921875, 0.0907440185546875, 0.127288818359375, 0.1638336181640625, 0.20037841796875, 0.2369232177734375, 0.273468017578125, 0.3100128173828125, 0.3465576171875, 0.3831024169921875, 0.419647216796875, 0.4561920166015625, 0.49273681640625, 0.5292816162109375, 0.565826416015625, 0.6023712158203125, 0.638916015625, 0.6754608154296875, 0.712005615234375, 0.7485504150390625, 0.78509521484375, 0.8216400146484375, 0.858184814453125, 0.8947296142578125, 0.9312744140625, 0.9678192138671875, 1.004364013671875, 1.0409088134765625, 1.07745361328125, 1.1139984130859375, 1.150543212890625, 1.1870880126953125, 1.2236328125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 9.0, 10.0, 14.0, 13.0, 46.0, 74.0, 147.0, 321.0, 895.0, 1362.0, 704.0, 232.0, 117.0, 46.0, 33.0, 21.0, 17.0, 8.0, 6.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3408203125, -0.32318115234375, -0.3055419921875, -0.28790283203125, -0.270263671875, -0.25262451171875, -0.2349853515625, -0.21734619140625, -0.19970703125, -0.18206787109375, -0.1644287109375, -0.14678955078125, -0.129150390625, -0.11151123046875, -0.0938720703125, -0.07623291015625, -0.05859375, -0.04095458984375, -0.0233154296875, -0.00567626953125, 0.011962890625, 0.02960205078125, 0.0472412109375, 0.06488037109375, 0.08251953125, 0.10015869140625, 0.1177978515625, 0.13543701171875, 0.153076171875, 0.17071533203125, 0.1883544921875, 0.20599365234375, 0.2236328125, 0.24127197265625, 0.2589111328125, 0.27655029296875, 0.294189453125, 0.31182861328125, 0.3294677734375, 0.34710693359375, 0.36474609375, 0.38238525390625, 0.4000244140625, 0.41766357421875, 0.435302734375, 0.45294189453125, 0.4705810546875, 0.48822021484375, 0.505859375, 0.52349853515625, 0.5411376953125, 0.55877685546875, 0.576416015625, 0.59405517578125, 0.6116943359375, 0.62933349609375, 0.64697265625, 0.66461181640625, 0.6822509765625, 0.69989013671875, 0.717529296875, 0.73516845703125, 0.7528076171875, 0.77044677734375, 0.7880859375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 6.0, 15.0, 31.0, 113.0, 303.0, 325.0, 144.0, 54.0, 12.0, 7.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.330854415893555, -5.099521636962891, -4.868188858032227, -4.6368560791015625, -4.405523300170898, -4.174190521240234, -3.942857503890991, -3.711524724960327, -3.480191946029663, -3.248859167098999, -3.017526388168335, -2.786193370819092, -2.5548605918884277, -2.3235278129577637, -2.0921950340270996, -1.8608622550964355, -1.6295294761657715, -1.3981966972351074, -1.1668639183044434, -0.9355310201644897, -0.7041982412338257, -0.4728654623031616, -0.241532564163208, -0.010199785232543945, 0.22113299369812012, 0.45246580243110657, 0.683798611164093, 0.9151314496994019, 1.146464228630066, 1.37779700756073, 1.6091299057006836, 1.8404626846313477, 2.0717954635620117, 2.303128242492676, 2.53446102142334, 2.765793800354004, 2.997126579284668, 3.228459358215332, 3.459792375564575, 3.6911251544952393, 3.9224579334259033, 4.1537909507751465, 4.3851237297058105, 4.616456508636475, 4.847789287567139, 5.079122066497803, 5.310454845428467, 5.541787624359131, 5.773120403289795, 6.004453182220459, 6.235785961151123, 6.467118740081787, 6.698451519012451, 6.929784297943115, 7.1611175537109375, 7.392450332641602, 7.623783111572266, 7.85511589050293, 8.086448669433594, 8.317781448364258, 8.549114227294922, 8.780447006225586, 9.01177978515625, 9.243112564086914, 9.474445343017578]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 3.0, 9.0, 15.0, 9.0, 18.0, 20.0, 22.0, 18.0, 26.0, 30.0, 32.0, 21.0, 49.0, 35.0, 39.0, 39.0, 41.0, 44.0, 52.0, 41.0, 42.0, 36.0, 30.0, 44.0, 30.0, 35.0, 42.0, 30.0, 19.0, 24.0, 23.0, 12.0, 16.0, 14.0, 8.0, 7.0, 9.0, 5.0, 5.0, 3.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.5967812538146973, -1.5522418022155762, -1.5077024698257446, -1.4631630182266235, -1.418623685836792, -1.374084234237671, -1.3295447826385498, -1.2850053310394287, -1.2404659986495972, -1.195926547050476, -1.1513872146606445, -1.1068477630615234, -1.0623083114624023, -1.0177689790725708, -0.9732295274734497, -0.9286901354789734, -0.8841507434844971, -0.8396113514900208, -0.7950719594955444, -0.7505325078964233, -0.705993115901947, -0.6614537239074707, -0.6169142723083496, -0.5723748803138733, -0.527835488319397, -0.48329609632492065, -0.43875667452812195, -0.39421725273132324, -0.3496778607368469, -0.3051384687423706, -0.2605990469455719, -0.2160596251487732, -0.17152035236358643, -0.1269809454679489, -0.0824415385723114, -0.03790213167667389, 0.006637275218963623, 0.051176682114601135, 0.09571608901023865, 0.14025551080703735, 0.18479490280151367, 0.22933430969715118, 0.2738737165927887, 0.3184131383895874, 0.3629525303840637, 0.40749192237854004, 0.45203134417533875, 0.49657076597213745, 0.5411101579666138, 0.5856495499610901, 0.6301889419555664, 0.6747283935546875, 0.7192677855491638, 0.7638071775436401, 0.8083466291427612, 0.8528860211372375, 0.8974254131317139, 0.9419648051261902, 0.9865041971206665, 1.0310436487197876, 1.0755829811096191, 1.1201224327087402, 1.1646618843078613, 1.2092013359069824, 1.253740668296814]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 2.0, 12.0, 17.0, 35.0, 49.0, 80.0, 118.0, 183.0, 297.0, 470.0, 726.0, 1243.0, 2306.0, 4080.0, 7861.0, 15336.0, 31552.0, 66481.0, 140028.0, 255316.0, 253884.0, 138860.0, 65442.0, 31369.0, 15318.0, 7758.0, 4122.0, 2310.0, 1247.0, 794.0, 464.0, 305.0, 193.0, 109.0, 75.0, 32.0, 33.0, 22.0, 14.0, 8.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.1629638671875, -0.15855884552001953, -0.15415382385253906, -0.1497488021850586, -0.14534378051757812, -0.14093875885009766, -0.1365337371826172, -0.13212871551513672, -0.12772369384765625, -0.12331867218017578, -0.11891365051269531, -0.11450862884521484, -0.11010360717773438, -0.1056985855102539, -0.10129356384277344, -0.09688854217529297, -0.0924835205078125, -0.08807849884033203, -0.08367347717285156, -0.0792684555053711, -0.07486343383789062, -0.07045841217041016, -0.06605339050292969, -0.06164836883544922, -0.05724334716796875, -0.05283832550048828, -0.04843330383300781, -0.044028282165527344, -0.039623260498046875, -0.035218238830566406, -0.030813217163085938, -0.02640819549560547, -0.022003173828125, -0.01759815216064453, -0.013193130493164062, -0.008788108825683594, -0.004383087158203125, 2.193450927734375e-05, 0.0044269561767578125, 0.008831977844238281, 0.01323699951171875, 0.01764202117919922, 0.022047042846679688, 0.026452064514160156, 0.030857086181640625, 0.035262107849121094, 0.03966712951660156, 0.04407215118408203, 0.0484771728515625, 0.05288219451904297, 0.05728721618652344, 0.061692237854003906, 0.06609725952148438, 0.07050228118896484, 0.07490730285644531, 0.07931232452392578, 0.08371734619140625, 0.08812236785888672, 0.09252738952636719, 0.09693241119384766, 0.10133743286132812, 0.1057424545288086, 0.11014747619628906, 0.11455249786376953, 0.11895751953125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 2.0, 1.0, 8.0, 4.0, 7.0, 7.0, 9.0, 8.0, 10.0, 13.0, 18.0, 21.0, 16.0, 31.0, 36.0, 43.0, 36.0, 40.0, 54.0, 41.0, 39.0, 60.0, 50.0, 48.0, 43.0, 42.0, 44.0, 42.0, 35.0, 38.0, 27.0, 25.0, 21.0, 17.0, 14.0, 15.0, 10.0, 8.0, 7.0, 7.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10272216796875, -0.09927082061767578, -0.09581947326660156, -0.09236812591552734, -0.08891677856445312, -0.0854654312133789, -0.08201408386230469, -0.07856273651123047, -0.07511138916015625, -0.07166004180908203, -0.06820869445800781, -0.0647573471069336, -0.061305999755859375, -0.057854652404785156, -0.05440330505371094, -0.05095195770263672, -0.0475006103515625, -0.04404926300048828, -0.04059791564941406, -0.037146568298339844, -0.033695220947265625, -0.030243873596191406, -0.026792526245117188, -0.02334117889404297, -0.01988983154296875, -0.01643848419189453, -0.012987136840820312, -0.009535789489746094, -0.006084442138671875, -0.0026330947875976562, 0.0008182525634765625, 0.004269599914550781, 0.007720947265625, 0.011172294616699219, 0.014623641967773438, 0.018074989318847656, 0.021526336669921875, 0.024977684020996094, 0.028429031372070312, 0.03188037872314453, 0.03533172607421875, 0.03878307342529297, 0.04223442077636719, 0.045685768127441406, 0.049137115478515625, 0.052588462829589844, 0.05603981018066406, 0.05949115753173828, 0.0629425048828125, 0.06639385223388672, 0.06984519958496094, 0.07329654693603516, 0.07674789428710938, 0.0801992416381836, 0.08365058898925781, 0.08710193634033203, 0.09055328369140625, 0.09400463104248047, 0.09745597839355469, 0.1009073257446289, 0.10435867309570312, 0.10781002044677734, 0.11126136779785156, 0.11471271514892578, 0.1181640625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 8.0, 16.0, 12.0, 25.0, 38.0, 56.0, 96.0, 153.0, 298.0, 584.0, 1346.0, 5590.0, 51167.0, 816805.0, 156794.0, 11501.0, 2278.0, 800.0, 420.0, 212.0, 145.0, 80.0, 44.0, 29.0, 20.0, 12.0, 7.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5625, -0.5435562133789062, -0.5246124267578125, -0.5056686401367188, -0.486724853515625, -0.46778106689453125, -0.4488372802734375, -0.42989349365234375, -0.41094970703125, -0.39200592041015625, -0.3730621337890625, -0.35411834716796875, -0.335174560546875, -0.31623077392578125, -0.2972869873046875, -0.27834320068359375, -0.2593994140625, -0.24045562744140625, -0.2215118408203125, -0.20256805419921875, -0.183624267578125, -0.16468048095703125, -0.1457366943359375, -0.12679290771484375, -0.10784912109375, -0.08890533447265625, -0.0699615478515625, -0.05101776123046875, -0.032073974609375, -0.01313018798828125, 0.0058135986328125, 0.02475738525390625, 0.043701171875, 0.06264495849609375, 0.0815887451171875, 0.10053253173828125, 0.119476318359375, 0.13842010498046875, 0.1573638916015625, 0.17630767822265625, 0.19525146484375, 0.21419525146484375, 0.2331390380859375, 0.25208282470703125, 0.271026611328125, 0.28997039794921875, 0.3089141845703125, 0.32785797119140625, 0.3468017578125, 0.36574554443359375, 0.3846893310546875, 0.40363311767578125, 0.422576904296875, 0.44152069091796875, 0.4604644775390625, 0.47940826416015625, 0.49835205078125, 0.5172958374023438, 0.5362396240234375, 0.5551834106445312, 0.574127197265625, 0.5930709838867188, 0.6120147705078125, 0.6309585571289062, 0.64990234375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 3.0, 9.0, 2.0, 10.0, 13.0, 11.0, 22.0, 13.0, 27.0, 19.0, 33.0, 49.0, 40.0, 37.0, 44.0, 34.0, 49.0, 53.0, 44.0, 61.0, 53.0, 52.0, 40.0, 42.0, 34.0, 29.0, 31.0, 27.0, 23.0, 21.0, 18.0, 10.0, 5.0, 9.0, 6.0, 8.0, 7.0, 3.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.388916015625, -0.3754005432128906, -0.36188507080078125, -0.3483695983886719, -0.3348541259765625, -0.3213386535644531, -0.30782318115234375, -0.2943077087402344, -0.280792236328125, -0.2672767639160156, -0.25376129150390625, -0.24024581909179688, -0.2267303466796875, -0.21321487426757812, -0.19969940185546875, -0.18618392944335938, -0.17266845703125, -0.15915298461914062, -0.14563751220703125, -0.13212203979492188, -0.1186065673828125, -0.10509109497070312, -0.09157562255859375, -0.07806015014648438, -0.064544677734375, -0.051029205322265625, -0.03751373291015625, -0.023998260498046875, -0.0104827880859375, 0.003032684326171875, 0.01654815673828125, 0.030063629150390625, 0.0435791015625, 0.057094573974609375, 0.07061004638671875, 0.08412551879882812, 0.0976409912109375, 0.11115646362304688, 0.12467193603515625, 0.13818740844726562, 0.151702880859375, 0.16521835327148438, 0.17873382568359375, 0.19224929809570312, 0.2057647705078125, 0.21928024291992188, 0.23279571533203125, 0.24631118774414062, 0.25982666015625, 0.2733421325683594, 0.28685760498046875, 0.3003730773925781, 0.3138885498046875, 0.3274040222167969, 0.34091949462890625, 0.3544349670410156, 0.367950439453125, 0.3814659118652344, 0.39498138427734375, 0.4084968566894531, 0.4220123291015625, 0.4355278015136719, 0.44904327392578125, 0.4625587463378906, 0.47607421875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 5.0, 3.0, 4.0, 6.0, 2.0, 14.0, 15.0, 16.0, 21.0, 22.0, 39.0, 54.0, 103.0, 159.0, 254.0, 470.0, 928.0, 2261.0, 5734.0, 17160.0, 64421.0, 600292.0, 282868.0, 50800.0, 14046.0, 4838.0, 1952.0, 921.0, 488.0, 213.0, 141.0, 114.0, 52.0, 35.0, 27.0, 21.0, 9.0, 17.0, 7.0, 9.0, 2.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.1658935546875, -0.16069602966308594, -0.15549850463867188, -0.1503009796142578, -0.14510345458984375, -0.1399059295654297, -0.13470840454101562, -0.12951087951660156, -0.1243133544921875, -0.11911582946777344, -0.11391830444335938, -0.10872077941894531, -0.10352325439453125, -0.09832572937011719, -0.09312820434570312, -0.08793067932128906, -0.082733154296875, -0.07753562927246094, -0.07233810424804688, -0.06714057922363281, -0.06194305419921875, -0.05674552917480469, -0.051548004150390625, -0.04635047912597656, -0.0411529541015625, -0.03595542907714844, -0.030757904052734375, -0.025560379028320312, -0.02036285400390625, -0.015165328979492188, -0.009967803955078125, -0.0047702789306640625, 0.00042724609375, 0.0056247711181640625, 0.010822296142578125, 0.016019821166992188, 0.02121734619140625, 0.026414871215820312, 0.031612396240234375, 0.03680992126464844, 0.0420074462890625, 0.04720497131347656, 0.052402496337890625, 0.05760002136230469, 0.06279754638671875, 0.06799507141113281, 0.07319259643554688, 0.07839012145996094, 0.083587646484375, 0.08878517150878906, 0.09398269653320312, 0.09918022155761719, 0.10437774658203125, 0.10957527160644531, 0.11477279663085938, 0.11997032165527344, 0.1251678466796875, 0.13036537170410156, 0.13556289672851562, 0.1407604217529297, 0.14595794677734375, 0.1511554718017578, 0.15635299682617188, 0.16155052185058594, 0.166748046875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 5.0, 5.0, 5.0, 5.0, 6.0, 11.0, 7.0, 9.0, 17.0, 24.0, 23.0, 25.0, 45.0, 67.0, 90.0, 105.0, 141.0, 90.0, 81.0, 46.0, 50.0, 46.0, 24.0, 16.0, 19.0, 10.0, 5.0, 8.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.543231964111328e-05, -5.371123552322388e-05, -5.199015140533447e-05, -5.026906728744507e-05, -4.8547983169555664e-05, -4.682689905166626e-05, -4.5105814933776855e-05, -4.338473081588745e-05, -4.166364669799805e-05, -3.994256258010864e-05, -3.822147846221924e-05, -3.6500394344329834e-05, -3.477931022644043e-05, -3.3058226108551025e-05, -3.133714199066162e-05, -2.9616057872772217e-05, -2.7894973754882812e-05, -2.6173889636993408e-05, -2.4452805519104004e-05, -2.27317214012146e-05, -2.1010637283325195e-05, -1.928955316543579e-05, -1.7568469047546387e-05, -1.5847384929656982e-05, -1.4126300811767578e-05, -1.2405216693878174e-05, -1.068413257598877e-05, -8.963048458099365e-06, -7.241964340209961e-06, -5.520880222320557e-06, -3.7997961044311523e-06, -2.078711986541748e-06, -3.5762786865234375e-07, 1.3634562492370605e-06, 3.084540367126465e-06, 4.805624485015869e-06, 6.5267086029052734e-06, 8.247792720794678e-06, 9.968876838684082e-06, 1.1689960956573486e-05, 1.341104507446289e-05, 1.5132129192352295e-05, 1.68532133102417e-05, 1.8574297428131104e-05, 2.0295381546020508e-05, 2.2016465663909912e-05, 2.3737549781799316e-05, 2.545863389968872e-05, 2.7179718017578125e-05, 2.890080213546753e-05, 3.0621886253356934e-05, 3.234297037124634e-05, 3.406405448913574e-05, 3.5785138607025146e-05, 3.750622272491455e-05, 3.9227306842803955e-05, 4.094839096069336e-05, 4.2669475078582764e-05, 4.439055919647217e-05, 4.611164331436157e-05, 4.7832727432250977e-05, 4.955381155014038e-05, 5.1274895668029785e-05, 5.299597978591919e-05, 5.4717063903808594e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 4.0, 5.0, 7.0, 4.0, 15.0, 20.0, 23.0, 50.0, 43.0, 82.0, 143.0, 222.0, 400.0, 815.0, 1881.0, 5130.0, 16049.0, 61455.0, 535718.0, 344333.0, 58214.0, 15286.0, 5015.0, 1843.0, 795.0, 404.0, 215.0, 142.0, 69.0, 46.0, 46.0, 31.0, 20.0, 13.0, 5.0, 7.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.191162109375, -0.18599319458007812, -0.18082427978515625, -0.17565536499023438, -0.1704864501953125, -0.16531753540039062, -0.16014862060546875, -0.15497970581054688, -0.149810791015625, -0.14464187622070312, -0.13947296142578125, -0.13430404663085938, -0.1291351318359375, -0.12396621704101562, -0.11879730224609375, -0.11362838745117188, -0.10845947265625, -0.10329055786132812, -0.09812164306640625, -0.09295272827148438, -0.0877838134765625, -0.08261489868164062, -0.07744598388671875, -0.07227706909179688, -0.067108154296875, -0.061939239501953125, -0.05677032470703125, -0.051601409912109375, -0.0464324951171875, -0.041263580322265625, -0.03609466552734375, -0.030925750732421875, -0.0257568359375, -0.020587921142578125, -0.01541900634765625, -0.010250091552734375, -0.0050811767578125, 8.7738037109375e-05, 0.00525665283203125, 0.010425567626953125, 0.015594482421875, 0.020763397216796875, 0.02593231201171875, 0.031101226806640625, 0.0362701416015625, 0.041439056396484375, 0.04660797119140625, 0.051776885986328125, 0.05694580078125, 0.062114715576171875, 0.06728363037109375, 0.07245254516601562, 0.0776214599609375, 0.08279037475585938, 0.08795928955078125, 0.09312820434570312, 0.098297119140625, 0.10346603393554688, 0.10863494873046875, 0.11380386352539062, 0.1189727783203125, 0.12414169311523438, 0.12931060791015625, 0.13447952270507812, 0.1396484375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 2.0, 4.0, 4.0, 10.0, 3.0, 12.0, 15.0, 13.0, 13.0, 19.0, 28.0, 20.0, 37.0, 40.0, 50.0, 56.0, 70.0, 73.0, 78.0, 76.0, 64.0, 50.0, 35.0, 36.0, 35.0, 29.0, 16.0, 18.0, 12.0, 11.0, 15.0, 3.0, 9.0, 9.0, 4.0, 3.0, 7.0, 1.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.11663818359375, -0.1131439208984375, -0.109649658203125, -0.1061553955078125, -0.1026611328125, -0.0991668701171875, -0.095672607421875, -0.0921783447265625, -0.08868408203125, -0.0851898193359375, -0.081695556640625, -0.0782012939453125, -0.07470703125, -0.0712127685546875, -0.067718505859375, -0.0642242431640625, -0.06072998046875, -0.0572357177734375, -0.053741455078125, -0.0502471923828125, -0.0467529296875, -0.0432586669921875, -0.039764404296875, -0.0362701416015625, -0.03277587890625, -0.0292816162109375, -0.025787353515625, -0.0222930908203125, -0.018798828125, -0.0153045654296875, -0.011810302734375, -0.0083160400390625, -0.00482177734375, -0.0013275146484375, 0.002166748046875, 0.0056610107421875, 0.0091552734375, 0.0126495361328125, 0.016143798828125, 0.0196380615234375, 0.02313232421875, 0.0266265869140625, 0.030120849609375, 0.0336151123046875, 0.037109375, 0.0406036376953125, 0.044097900390625, 0.0475921630859375, 0.05108642578125, 0.0545806884765625, 0.058074951171875, 0.0615692138671875, 0.0650634765625, 0.0685577392578125, 0.072052001953125, 0.0755462646484375, 0.07904052734375, 0.0825347900390625, 0.086029052734375, 0.0895233154296875, 0.093017578125, 0.0965118408203125, 0.100006103515625, 0.1035003662109375, 0.10699462890625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 26.0, 58.0, 181.0, 439.0, 197.0, 68.0, 21.0, 4.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.385429859161377, -7.177134037017822, -6.968838691711426, -6.760542869567871, -6.552247047424316, -6.343951225280762, -6.135655879974365, -5.9273600578308105, -5.719064712524414, -5.510768890380859, -5.302473545074463, -5.094177722930908, -4.8858819007873535, -4.677586555480957, -4.469290733337402, -4.260994911193848, -4.052699089050293, -3.8444035053253174, -3.6361076831817627, -3.427812099456787, -3.2195162773132324, -3.011220693588257, -2.8029251098632812, -2.5946292877197266, -2.386333703994751, -2.1780381202697754, -1.9697422981262207, -1.7614467144012451, -1.55315101146698, -1.3448553085327148, -1.1365597248077393, -0.9282640218734741, -0.719968318939209, -0.5116726160049438, -0.3033769726753235, -0.09508132934570312, 0.11321437358856201, 0.32151007652282715, 0.5298056602478027, 0.7381013631820679, 0.946397066116333, 1.1546927690505981, 1.3629884719848633, 1.5712840557098389, 1.779579758644104, 1.9878754615783691, 2.1961710453033447, 2.4044666290283203, 2.612762451171875, 2.8210580348968506, 3.0293538570404053, 3.237649440765381, 3.4459452629089355, 3.654240846633911, 3.8625364303588867, 4.070832252502441, 4.279128074645996, 4.487423896789551, 4.695719242095947, 4.904015064239502, 5.112310886383057, 5.320606231689453, 5.528902053833008, 5.7371978759765625, 5.945493221282959]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 6.0, 6.0, 9.0, 7.0, 9.0, 19.0, 19.0, 27.0, 28.0, 25.0, 37.0, 30.0, 26.0, 42.0, 52.0, 123.0, 112.0, 87.0, 47.0, 31.0, 48.0, 31.0, 22.0, 30.0, 26.0, 17.0, 21.0, 12.0, 8.0, 8.0, 6.0, 7.0, 4.0, 6.0, 2.0, 1.0, 7.0, 4.0, 0.0, 1.0], "bins": [-2.5819363594055176, -2.517704486846924, -2.453472375869751, -2.3892405033111572, -2.3250086307525635, -2.2607765197753906, -2.196544647216797, -2.132312774658203, -2.0680806636810303, -2.0038487911224365, -1.9396167993545532, -1.87538480758667, -1.8111528158187866, -1.7469208240509033, -1.6826889514923096, -1.6184569597244263, -1.5542250871658325, -1.4899930953979492, -1.4257612228393555, -1.3615292310714722, -1.2972972393035889, -1.2330653667449951, -1.1688333749771118, -1.1046013832092285, -1.0403695106506348, -0.9761375784873962, -0.9119055867195129, -0.8476736545562744, -0.7834416627883911, -0.7192097306251526, -0.6549777984619141, -0.5907458066940308, -0.5265136957168579, -0.462281733751297, -0.3980497717857361, -0.33381783962249756, -0.26958587765693665, -0.20535391569137573, -0.1411219835281372, -0.0768900215625763, -0.01265805959701538, 0.051573894917964935, 0.11580584943294525, 0.18003779649734497, 0.24426975846290588, 0.3085017204284668, 0.3727336525917053, 0.43696561455726624, 0.5011975765228271, 0.5654295086860657, 0.629661500453949, 0.6938934326171875, 0.7581254243850708, 0.8223573565483093, 0.8865892887115479, 0.9508212804794312, 1.0150532722473145, 1.0792852640151978, 1.1435171365737915, 1.2077491283416748, 1.271981120109558, 1.3362131118774414, 1.4004449844360352, 1.4646769762039185, 1.5289088487625122]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 7.0, 8.0, 10.0, 9.0, 10.0, 17.0, 40.0, 31.0, 62.0, 87.0, 137.0, 242.0, 378.0, 644.0, 1144.0, 2350.0, 4978.0, 12175.0, 35094.0, 155429.0, 1285458.0, 2271652.0, 332697.0, 59519.0, 18170.0, 7116.0, 3226.0, 1551.0, 802.0, 488.0, 266.0, 152.0, 94.0, 64.0, 45.0, 36.0, 21.0, 20.0, 18.0, 10.0, 2.0, 7.0, 1.0, 5.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.208740234375, -0.2026348114013672, -0.19652938842773438, -0.19042396545410156, -0.18431854248046875, -0.17821311950683594, -0.17210769653320312, -0.1660022735595703, -0.1598968505859375, -0.1537914276123047, -0.14768600463867188, -0.14158058166503906, -0.13547515869140625, -0.12936973571777344, -0.12326431274414062, -0.11715888977050781, -0.111053466796875, -0.10494804382324219, -0.09884262084960938, -0.09273719787597656, -0.08663177490234375, -0.08052635192871094, -0.07442092895507812, -0.06831550598144531, -0.0622100830078125, -0.05610466003417969, -0.049999237060546875, -0.04389381408691406, -0.03778839111328125, -0.03168296813964844, -0.025577545166015625, -0.019472122192382812, -0.01336669921875, -0.0072612762451171875, -0.001155853271484375, 0.0049495697021484375, 0.01105499267578125, 0.017160415649414062, 0.023265838623046875, 0.029371261596679688, 0.0354766845703125, 0.04158210754394531, 0.047687530517578125, 0.05379295349121094, 0.05989837646484375, 0.06600379943847656, 0.07210922241210938, 0.07821464538574219, 0.084320068359375, 0.09042549133300781, 0.09653091430664062, 0.10263633728027344, 0.10874176025390625, 0.11484718322753906, 0.12095260620117188, 0.1270580291748047, 0.1331634521484375, 0.1392688751220703, 0.14537429809570312, 0.15147972106933594, 0.15758514404296875, 0.16369056701660156, 0.16979598999023438, 0.1759014129638672, 0.1820068359375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 7.0, 8.0, 7.0, 11.0, 23.0, 15.0, 30.0, 23.0, 23.0, 35.0, 27.0, 39.0, 42.0, 49.0, 63.0, 48.0, 48.0, 54.0, 35.0, 49.0, 55.0, 43.0, 47.0, 36.0, 34.0, 29.0, 29.0, 22.0, 18.0, 12.0, 12.0, 12.0, 4.0, 3.0, 4.0, 0.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1322021484375, -0.12861347198486328, -0.12502479553222656, -0.12143611907958984, -0.11784744262695312, -0.1142587661743164, -0.11067008972167969, -0.10708141326904297, -0.10349273681640625, -0.09990406036376953, -0.09631538391113281, -0.0927267074584961, -0.08913803100585938, -0.08554935455322266, -0.08196067810058594, -0.07837200164794922, -0.0747833251953125, -0.07119464874267578, -0.06760597229003906, -0.06401729583740234, -0.060428619384765625, -0.056839942932128906, -0.05325126647949219, -0.04966259002685547, -0.04607391357421875, -0.04248523712158203, -0.03889656066894531, -0.035307884216308594, -0.031719207763671875, -0.028130531311035156, -0.024541854858398438, -0.02095317840576172, -0.017364501953125, -0.013775825500488281, -0.010187149047851562, -0.006598472595214844, -0.003009796142578125, 0.0005788803100585938, 0.0041675567626953125, 0.007756233215332031, 0.01134490966796875, 0.014933586120605469, 0.018522262573242188, 0.022110939025878906, 0.025699615478515625, 0.029288291931152344, 0.03287696838378906, 0.03646564483642578, 0.0400543212890625, 0.04364299774169922, 0.04723167419433594, 0.050820350646972656, 0.054409027099609375, 0.057997703552246094, 0.06158638000488281, 0.06517505645751953, 0.06876373291015625, 0.07235240936279297, 0.07594108581542969, 0.0795297622680664, 0.08311843872070312, 0.08670711517333984, 0.09029579162597656, 0.09388446807861328, 0.09747314453125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 6.0, 9.0, 11.0, 14.0, 24.0, 21.0, 28.0, 33.0, 56.0, 66.0, 100.0, 134.0, 193.0, 286.0, 453.0, 817.0, 2183.0, 6690.0, 36391.0, 645059.0, 3388530.0, 93705.0, 13189.0, 3316.0, 1222.0, 594.0, 355.0, 218.0, 159.0, 110.0, 80.0, 51.0, 49.0, 47.0, 22.0, 17.0, 16.0, 9.0, 4.0, 2.0, 4.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.494140625, -0.4788017272949219, -0.46346282958984375, -0.4481239318847656, -0.4327850341796875, -0.4174461364746094, -0.40210723876953125, -0.3867683410644531, -0.371429443359375, -0.3560905456542969, -0.34075164794921875, -0.3254127502441406, -0.3100738525390625, -0.2947349548339844, -0.27939605712890625, -0.2640571594238281, -0.24871826171875, -0.23337936401367188, -0.21804046630859375, -0.20270156860351562, -0.1873626708984375, -0.17202377319335938, -0.15668487548828125, -0.14134597778320312, -0.126007080078125, -0.11066818237304688, -0.09532928466796875, -0.07999038696289062, -0.0646514892578125, -0.049312591552734375, -0.03397369384765625, -0.018634796142578125, -0.0032958984375, 0.012042999267578125, 0.02738189697265625, 0.042720794677734375, 0.0580596923828125, 0.07339859008789062, 0.08873748779296875, 0.10407638549804688, 0.119415283203125, 0.13475418090820312, 0.15009307861328125, 0.16543197631835938, 0.1807708740234375, 0.19610977172851562, 0.21144866943359375, 0.22678756713867188, 0.24212646484375, 0.2574653625488281, 0.27280426025390625, 0.2881431579589844, 0.3034820556640625, 0.3188209533691406, 0.33415985107421875, 0.3494987487792969, 0.364837646484375, 0.3801765441894531, 0.39551544189453125, 0.4108543395996094, 0.4261932373046875, 0.4415321350097656, 0.45687103271484375, 0.4722099304199219, 0.487548828125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 5.0, 6.0, 10.0, 16.0, 19.0, 17.0, 38.0, 27.0, 47.0, 75.0, 127.0, 208.0, 377.0, 653.0, 816.0, 617.0, 389.0, 211.0, 116.0, 70.0, 61.0, 35.0, 29.0, 18.0, 11.0, 24.0, 11.0, 4.0, 11.0, 7.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.375244140625, -0.3636627197265625, -0.352081298828125, -0.3404998779296875, -0.32891845703125, -0.3173370361328125, -0.305755615234375, -0.2941741943359375, -0.2825927734375, -0.2710113525390625, -0.259429931640625, -0.2478485107421875, -0.23626708984375, -0.2246856689453125, -0.213104248046875, -0.2015228271484375, -0.18994140625, -0.1783599853515625, -0.166778564453125, -0.1551971435546875, -0.14361572265625, -0.1320343017578125, -0.120452880859375, -0.1088714599609375, -0.0972900390625, -0.0857086181640625, -0.074127197265625, -0.0625457763671875, -0.05096435546875, -0.0393829345703125, -0.027801513671875, -0.0162200927734375, -0.004638671875, 0.0069427490234375, 0.018524169921875, 0.0301055908203125, 0.04168701171875, 0.0532684326171875, 0.064849853515625, 0.0764312744140625, 0.0880126953125, 0.0995941162109375, 0.111175537109375, 0.1227569580078125, 0.13433837890625, 0.1459197998046875, 0.157501220703125, 0.1690826416015625, 0.1806640625, 0.1922454833984375, 0.203826904296875, 0.2154083251953125, 0.22698974609375, 0.2385711669921875, 0.250152587890625, 0.2617340087890625, 0.2733154296875, 0.2848968505859375, 0.296478271484375, 0.3080596923828125, 0.31964111328125, 0.3312225341796875, 0.342803955078125, 0.3543853759765625, 0.365966796875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 7.0, 3.0, 4.0, 5.0, 7.0, 9.0, 12.0, 16.0, 31.0, 38.0, 55.0, 56.0, 75.0, 87.0, 104.0, 107.0, 86.0, 85.0, 48.0, 40.0, 29.0, 26.0, 13.0, 15.0, 8.0, 7.0, 6.0, 3.0, 5.0, 4.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.9248285293579102, -1.8579356670379639, -1.7910428047180176, -1.7241499423980713, -1.657257080078125, -1.5903642177581787, -1.5234713554382324, -1.4565784931182861, -1.3896856307983398, -1.3227927684783936, -1.2558999061584473, -1.189007043838501, -1.1221141815185547, -1.0552213191986084, -0.9883284568786621, -0.9214355945587158, -0.8545427322387695, -0.7876498699188232, -0.720757007598877, -0.6538641452789307, -0.5869712829589844, -0.5200784206390381, -0.4531855583190918, -0.3862926959991455, -0.3193998336791992, -0.25250697135925293, -0.18561410903930664, -0.11872124671936035, -0.05182838439941406, 0.015064477920532227, 0.08195734024047852, 0.1488502025604248, 0.2157430648803711, 0.2826359272003174, 0.34952878952026367, 0.41642165184020996, 0.48331451416015625, 0.5502073764801025, 0.6171002388000488, 0.6839931011199951, 0.7508859634399414, 0.8177788257598877, 0.884671688079834, 0.9515645503997803, 1.0184574127197266, 1.0853502750396729, 1.1522431373596191, 1.2191359996795654, 1.2860288619995117, 1.352921724319458, 1.4198145866394043, 1.4867074489593506, 1.5536003112792969, 1.6204931735992432, 1.6873860359191895, 1.7542788982391357, 1.821171760559082, 1.8880646228790283, 1.9549574851989746, 2.021850347518921, 2.088743209838867, 2.1556360721588135, 2.2225289344787598, 2.289421796798706, 2.3563146591186523]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 9.0, 8.0, 10.0, 10.0, 10.0, 14.0, 7.0, 19.0, 20.0, 22.0, 18.0, 19.0, 33.0, 43.0, 45.0, 43.0, 43.0, 66.0, 43.0, 35.0, 29.0, 39.0, 47.0, 47.0, 53.0, 42.0, 26.0, 34.0, 32.0, 19.0, 27.0, 14.0, 6.0, 16.0, 13.0, 8.0, 7.0, 6.0, 2.0, 6.0, 3.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.4452383518218994, -1.3960517644882202, -1.3468650579452515, -1.2976784706115723, -1.2484917640686035, -1.1993051767349243, -1.1501185894012451, -1.1009318828582764, -1.0517452955245972, -1.002558708190918, -0.9533720016479492, -0.90418541431427, -0.854998767375946, -0.8058121204376221, -0.7566254734992981, -0.7074388265609741, -0.6582521796226501, -0.6090655326843262, -0.5598788857460022, -0.5106922388076782, -0.461505651473999, -0.41231900453567505, -0.3631323575973511, -0.3139457404613495, -0.2647590935230255, -0.21557246148586273, -0.16638582944869995, -0.11719918251037598, -0.0680125504732132, -0.018825918436050415, 0.03036072850227356, 0.07954734563827515, 0.12873399257659912, 0.1779206246137619, 0.22710725665092468, 0.27629390358924866, 0.32548052072525024, 0.3746671676635742, 0.4238538146018982, 0.4730404317378998, 0.5222270488739014, 0.5714136958122253, 0.6206003427505493, 0.6697869300842285, 0.7189735770225525, 0.7681602239608765, 0.8173468708992004, 0.8665335178375244, 0.9157201647758484, 0.9649068117141724, 1.0140933990478516, 1.0632801055908203, 1.1124666929244995, 1.1616532802581787, 1.2108399868011475, 1.2600265741348267, 1.3092132806777954, 1.3583998680114746, 1.4075865745544434, 1.4567731618881226, 1.5059598684310913, 1.5551464557647705, 1.6043331623077393, 1.6535197496414185, 1.7027063369750977]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 10.0, 8.0, 13.0, 22.0, 33.0, 39.0, 55.0, 104.0, 152.0, 254.0, 355.0, 558.0, 875.0, 1360.0, 2296.0, 3639.0, 6249.0, 10898.0, 19990.0, 38392.0, 76343.0, 158275.0, 271769.0, 224658.0, 112795.0, 54991.0, 28151.0, 14992.0, 8561.0, 4821.0, 2922.0, 1822.0, 1136.0, 716.0, 436.0, 298.0, 178.0, 137.0, 68.0, 65.0, 46.0, 22.0, 19.0, 14.0, 10.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.16748046875, -0.16220855712890625, -0.1569366455078125, -0.15166473388671875, -0.146392822265625, -0.14112091064453125, -0.1358489990234375, -0.13057708740234375, -0.12530517578125, -0.12003326416015625, -0.1147613525390625, -0.10948944091796875, -0.104217529296875, -0.09894561767578125, -0.0936737060546875, -0.08840179443359375, -0.0831298828125, -0.07785797119140625, -0.0725860595703125, -0.06731414794921875, -0.062042236328125, -0.05677032470703125, -0.0514984130859375, -0.04622650146484375, -0.04095458984375, -0.03568267822265625, -0.0304107666015625, -0.02513885498046875, -0.019866943359375, -0.01459503173828125, -0.0093231201171875, -0.00405120849609375, 0.001220703125, 0.00649261474609375, 0.0117645263671875, 0.01703643798828125, 0.022308349609375, 0.02758026123046875, 0.0328521728515625, 0.03812408447265625, 0.04339599609375, 0.04866790771484375, 0.0539398193359375, 0.05921173095703125, 0.064483642578125, 0.06975555419921875, 0.0750274658203125, 0.08029937744140625, 0.0855712890625, 0.09084320068359375, 0.0961151123046875, 0.10138702392578125, 0.106658935546875, 0.11193084716796875, 0.1172027587890625, 0.12247467041015625, 0.12774658203125, 0.13301849365234375, 0.1382904052734375, 0.14356231689453125, 0.148834228515625, 0.15410614013671875, 0.1593780517578125, 0.16464996337890625, 0.169921875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 1.0, 7.0, 6.0, 6.0, 7.0, 10.0, 14.0, 16.0, 15.0, 21.0, 16.0, 30.0, 30.0, 30.0, 37.0, 41.0, 56.0, 54.0, 39.0, 43.0, 53.0, 46.0, 46.0, 47.0, 40.0, 35.0, 36.0, 41.0, 26.0, 25.0, 35.0, 14.0, 11.0, 16.0, 15.0, 9.0, 5.0, 5.0, 7.0, 3.0, 4.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.130615234375, -0.12669754028320312, -0.12277984619140625, -0.11886215209960938, -0.1149444580078125, -0.11102676391601562, -0.10710906982421875, -0.10319137573242188, -0.099273681640625, -0.09535598754882812, -0.09143829345703125, -0.08752059936523438, -0.0836029052734375, -0.07968521118164062, -0.07576751708984375, -0.07184982299804688, -0.06793212890625, -0.06401443481445312, -0.06009674072265625, -0.056179046630859375, -0.0522613525390625, -0.048343658447265625, -0.04442596435546875, -0.040508270263671875, -0.036590576171875, -0.032672882080078125, -0.02875518798828125, -0.024837493896484375, -0.0209197998046875, -0.017002105712890625, -0.01308441162109375, -0.009166717529296875, -0.0052490234375, -0.001331329345703125, 0.00258636474609375, 0.006504058837890625, 0.0104217529296875, 0.014339447021484375, 0.01825714111328125, 0.022174835205078125, 0.026092529296875, 0.030010223388671875, 0.03392791748046875, 0.037845611572265625, 0.0417633056640625, 0.045680999755859375, 0.04959869384765625, 0.053516387939453125, 0.05743408203125, 0.061351776123046875, 0.06526947021484375, 0.06918716430664062, 0.0731048583984375, 0.07702255249023438, 0.08094024658203125, 0.08485794067382812, 0.088775634765625, 0.09269332885742188, 0.09661102294921875, 0.10052871704101562, 0.1044464111328125, 0.10836410522460938, 0.11228179931640625, 0.11619949340820312, 0.1201171875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 6.0, 6.0, 12.0, 18.0, 32.0, 66.0, 81.0, 128.0, 201.0, 435.0, 917.0, 2468.0, 14113.0, 354960.0, 655397.0, 15212.0, 2538.0, 975.0, 420.0, 236.0, 133.0, 68.0, 41.0, 42.0, 12.0, 11.0, 8.0, 8.0, 7.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8447265625, -0.8191452026367188, -0.7935638427734375, -0.7679824829101562, -0.742401123046875, -0.7168197631835938, -0.6912384033203125, -0.6656570434570312, -0.64007568359375, -0.6144943237304688, -0.5889129638671875, -0.5633316040039062, -0.537750244140625, -0.5121688842773438, -0.4865875244140625, -0.46100616455078125, -0.4354248046875, -0.40984344482421875, -0.3842620849609375, -0.35868072509765625, -0.333099365234375, -0.30751800537109375, -0.2819366455078125, -0.25635528564453125, -0.23077392578125, -0.20519256591796875, -0.1796112060546875, -0.15402984619140625, -0.128448486328125, -0.10286712646484375, -0.0772857666015625, -0.05170440673828125, -0.026123046875, -0.00054168701171875, 0.0250396728515625, 0.05062103271484375, 0.076202392578125, 0.10178375244140625, 0.1273651123046875, 0.15294647216796875, 0.17852783203125, 0.20410919189453125, 0.2296905517578125, 0.25527191162109375, 0.280853271484375, 0.30643463134765625, 0.3320159912109375, 0.35759735107421875, 0.3831787109375, 0.40876007080078125, 0.4343414306640625, 0.45992279052734375, 0.485504150390625, 0.5110855102539062, 0.5366668701171875, 0.5622482299804688, 0.58782958984375, 0.6134109497070312, 0.6389923095703125, 0.6645736694335938, 0.690155029296875, 0.7157363891601562, 0.7413177490234375, 0.7668991088867188, 0.79248046875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 4.0, 9.0, 9.0, 10.0, 5.0, 7.0, 13.0, 27.0, 13.0, 26.0, 26.0, 24.0, 29.0, 41.0, 28.0, 51.0, 37.0, 46.0, 60.0, 50.0, 55.0, 39.0, 48.0, 39.0, 36.0, 44.0, 42.0, 23.0, 32.0, 19.0, 23.0, 17.0, 5.0, 12.0, 9.0, 4.0, 8.0, 10.0, 8.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.4755859375, -0.4607734680175781, -0.44596099853515625, -0.4311485290527344, -0.4163360595703125, -0.4015235900878906, -0.38671112060546875, -0.3718986511230469, -0.357086181640625, -0.3422737121582031, -0.32746124267578125, -0.3126487731933594, -0.2978363037109375, -0.2830238342285156, -0.26821136474609375, -0.2533988952636719, -0.23858642578125, -0.22377395629882812, -0.20896148681640625, -0.19414901733398438, -0.1793365478515625, -0.16452407836914062, -0.14971160888671875, -0.13489913940429688, -0.120086669921875, -0.10527420043945312, -0.09046173095703125, -0.07564926147460938, -0.0608367919921875, -0.046024322509765625, -0.03121185302734375, -0.016399383544921875, -0.0015869140625, 0.013225555419921875, 0.02803802490234375, 0.042850494384765625, 0.0576629638671875, 0.07247543334960938, 0.08728790283203125, 0.10210037231445312, 0.116912841796875, 0.13172531127929688, 0.14653778076171875, 0.16135025024414062, 0.1761627197265625, 0.19097518920898438, 0.20578765869140625, 0.22060012817382812, 0.23541259765625, 0.2502250671386719, 0.26503753662109375, 0.2798500061035156, 0.2946624755859375, 0.3094749450683594, 0.32428741455078125, 0.3390998840332031, 0.353912353515625, 0.3687248229980469, 0.38353729248046875, 0.3983497619628906, 0.4131622314453125, 0.4279747009277344, 0.44278717041015625, 0.4575996398925781, 0.472412109375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 5.0, 10.0, 10.0, 16.0, 19.0, 26.0, 31.0, 42.0, 76.0, 110.0, 175.0, 252.0, 500.0, 863.0, 1779.0, 4073.0, 11737.0, 47825.0, 653345.0, 272757.0, 37894.0, 10039.0, 3569.0, 1483.0, 752.0, 403.0, 261.0, 161.0, 106.0, 75.0, 48.0, 38.0, 25.0, 19.0, 12.0, 11.0, 4.0, 0.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1866455078125, -0.18040847778320312, -0.17417144775390625, -0.16793441772460938, -0.1616973876953125, -0.15546035766601562, -0.14922332763671875, -0.14298629760742188, -0.136749267578125, -0.13051223754882812, -0.12427520751953125, -0.11803817749023438, -0.1118011474609375, -0.10556411743164062, -0.09932708740234375, -0.09309005737304688, -0.08685302734375, -0.08061599731445312, -0.07437896728515625, -0.06814193725585938, -0.0619049072265625, -0.055667877197265625, -0.04943084716796875, -0.043193817138671875, -0.036956787109375, -0.030719757080078125, -0.02448272705078125, -0.018245697021484375, -0.0120086669921875, -0.005771636962890625, 0.00046539306640625, 0.006702423095703125, 0.012939453125, 0.019176483154296875, 0.02541351318359375, 0.031650543212890625, 0.0378875732421875, 0.044124603271484375, 0.05036163330078125, 0.056598663330078125, 0.062835693359375, 0.06907272338867188, 0.07530975341796875, 0.08154678344726562, 0.0877838134765625, 0.09402084350585938, 0.10025787353515625, 0.10649490356445312, 0.11273193359375, 0.11896896362304688, 0.12520599365234375, 0.13144302368164062, 0.1376800537109375, 0.14391708374023438, 0.15015411376953125, 0.15639114379882812, 0.162628173828125, 0.16886520385742188, 0.17510223388671875, 0.18133926391601562, 0.1875762939453125, 0.19381332397460938, 0.20005035400390625, 0.20628738403320312, 0.2125244140625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 5.0, 5.0, 2.0, 6.0, 3.0, 4.0, 5.0, 15.0, 11.0, 14.0, 21.0, 27.0, 31.0, 63.0, 66.0, 106.0, 135.0, 143.0, 95.0, 68.0, 49.0, 32.0, 21.0, 11.0, 16.0, 9.0, 7.0, 6.0, 6.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.00010824203491210938, -0.00010538846254348755, -0.00010253489017486572, -9.96813178062439e-05, -9.682774543762207e-05, -9.397417306900024e-05, -9.112060070037842e-05, -8.826702833175659e-05, -8.541345596313477e-05, -8.255988359451294e-05, -7.970631122589111e-05, -7.685273885726929e-05, -7.399916648864746e-05, -7.114559412002563e-05, -6.829202175140381e-05, -6.543844938278198e-05, -6.258487701416016e-05, -5.973130464553833e-05, -5.6877732276916504e-05, -5.402415990829468e-05, -5.117058753967285e-05, -4.8317015171051025e-05, -4.54634428024292e-05, -4.260987043380737e-05, -3.975629806518555e-05, -3.690272569656372e-05, -3.4049153327941895e-05, -3.119558095932007e-05, -2.8342008590698242e-05, -2.5488436222076416e-05, -2.263486385345459e-05, -1.9781291484832764e-05, -1.6927719116210938e-05, -1.4074146747589111e-05, -1.1220574378967285e-05, -8.367002010345459e-06, -5.513429641723633e-06, -2.6598572731018066e-06, 1.9371509552001953e-07, 3.0472874641418457e-06, 5.900859832763672e-06, 8.754432201385498e-06, 1.1608004570007324e-05, 1.446157693862915e-05, 1.7315149307250977e-05, 2.0168721675872803e-05, 2.302229404449463e-05, 2.5875866413116455e-05, 2.872943878173828e-05, 3.158301115036011e-05, 3.4436583518981934e-05, 3.729015588760376e-05, 4.0143728256225586e-05, 4.299730062484741e-05, 4.585087299346924e-05, 4.8704445362091064e-05, 5.155801773071289e-05, 5.441159009933472e-05, 5.726516246795654e-05, 6.011873483657837e-05, 6.29723072052002e-05, 6.582587957382202e-05, 6.867945194244385e-05, 7.153302431106567e-05, 7.43865966796875e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 3.0, 4.0, 5.0, 10.0, 10.0, 19.0, 28.0, 23.0, 45.0, 58.0, 90.0, 152.0, 227.0, 409.0, 715.0, 1521.0, 3344.0, 9768.0, 41417.0, 304467.0, 620112.0, 47960.0, 11131.0, 3643.0, 1528.0, 703.0, 436.0, 233.0, 133.0, 117.0, 63.0, 53.0, 35.0, 21.0, 21.0, 14.0, 10.0, 10.0, 5.0, 3.0, 1.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.190185546875, -0.1845989227294922, -0.17901229858398438, -0.17342567443847656, -0.16783905029296875, -0.16225242614746094, -0.15666580200195312, -0.1510791778564453, -0.1454925537109375, -0.1399059295654297, -0.13431930541992188, -0.12873268127441406, -0.12314605712890625, -0.11755943298339844, -0.11197280883789062, -0.10638618469238281, -0.100799560546875, -0.09521293640136719, -0.08962631225585938, -0.08403968811035156, -0.07845306396484375, -0.07286643981933594, -0.06727981567382812, -0.06169319152832031, -0.0561065673828125, -0.05051994323730469, -0.044933319091796875, -0.03934669494628906, -0.03376007080078125, -0.028173446655273438, -0.022586822509765625, -0.017000198364257812, -0.01141357421875, -0.0058269500732421875, -0.000240325927734375, 0.0053462982177734375, 0.01093292236328125, 0.016519546508789062, 0.022106170654296875, 0.027692794799804688, 0.0332794189453125, 0.03886604309082031, 0.044452667236328125, 0.05003929138183594, 0.05562591552734375, 0.06121253967285156, 0.06679916381835938, 0.07238578796386719, 0.077972412109375, 0.08355903625488281, 0.08914566040039062, 0.09473228454589844, 0.10031890869140625, 0.10590553283691406, 0.11149215698242188, 0.11707878112792969, 0.1226654052734375, 0.1282520294189453, 0.13383865356445312, 0.13942527770996094, 0.14501190185546875, 0.15059852600097656, 0.15618515014648438, 0.1617717742919922, 0.1673583984375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 0.0, 5.0, 8.0, 3.0, 6.0, 8.0, 11.0, 17.0, 24.0, 39.0, 39.0, 64.0, 64.0, 94.0, 115.0, 127.0, 89.0, 62.0, 48.0, 44.0, 33.0, 26.0, 13.0, 17.0, 11.0, 9.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.180419921875, -0.17522811889648438, -0.17003631591796875, -0.16484451293945312, -0.1596527099609375, -0.15446090698242188, -0.14926910400390625, -0.14407730102539062, -0.138885498046875, -0.13369369506835938, -0.12850189208984375, -0.12331008911132812, -0.1181182861328125, -0.11292648315429688, -0.10773468017578125, -0.10254287719726562, -0.09735107421875, -0.09215927124023438, -0.08696746826171875, -0.08177566528320312, -0.0765838623046875, -0.07139205932617188, -0.06620025634765625, -0.061008453369140625, -0.055816650390625, -0.050624847412109375, -0.04543304443359375, -0.040241241455078125, -0.0350494384765625, -0.029857635498046875, -0.02466583251953125, -0.019474029541015625, -0.0142822265625, -0.009090423583984375, -0.00389862060546875, 0.001293182373046875, 0.0064849853515625, 0.011676788330078125, 0.01686859130859375, 0.022060394287109375, 0.027252197265625, 0.032444000244140625, 0.03763580322265625, 0.042827606201171875, 0.0480194091796875, 0.053211212158203125, 0.05840301513671875, 0.06359481811523438, 0.06878662109375, 0.07397842407226562, 0.07917022705078125, 0.08436203002929688, 0.0895538330078125, 0.09474563598632812, 0.09993743896484375, 0.10512924194335938, 0.110321044921875, 0.11551284790039062, 0.12070465087890625, 0.12589645385742188, 0.1310882568359375, 0.13628005981445312, 0.14147186279296875, 0.14666366577148438, 0.15185546875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 9.0, 3.0, 3.0, 5.0, 10.0, 12.0, 31.0, 44.0, 92.0, 149.0, 389.0, 129.0, 64.0, 33.0, 16.0, 8.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.377230167388916, -5.225335597991943, -5.073441028594971, -4.921546459197998, -4.769651412963867, -4.6177568435668945, -4.465862274169922, -4.313967704772949, -4.162073135375977, -4.010178565979004, -3.8582839965820312, -3.7063891887664795, -3.554494619369507, -3.402600049972534, -3.2507052421569824, -3.0988106727600098, -2.946916103363037, -2.7950215339660645, -2.643126964569092, -2.49123215675354, -2.3393375873565674, -2.1874430179595947, -2.035548210144043, -1.8836536407470703, -1.7317590713500977, -1.579864501953125, -1.4279698133468628, -1.2760751247406006, -1.124180555343628, -0.9722859263420105, -0.8203912973403931, -0.6684966087341309, -0.5166025161743164, -0.364707887172699, -0.21281325817108154, -0.06091862916946411, 0.09097599983215332, 0.24287062883377075, 0.3947652578353882, 0.5466599464416504, 0.698554515838623, 0.8504491448402405, 1.002343773841858, 1.1542384624481201, 1.3061330318450928, 1.4580276012420654, 1.6099222898483276, 1.7618169784545898, 1.9137115478515625, 2.065606117248535, 2.217500686645508, 2.3693954944610596, 2.5212900638580322, 2.673184633255005, 2.8250794410705566, 2.9769740104675293, 3.128868579864502, 3.2807631492614746, 3.4326577186584473, 3.584552526473999, 3.7364470958709717, 3.8883416652679443, 4.040236473083496, 4.192131042480469, 4.344025611877441]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 5.0, 9.0, 6.0, 6.0, 13.0, 6.0, 8.0, 15.0, 15.0, 21.0, 14.0, 14.0, 29.0, 22.0, 30.0, 28.0, 27.0, 38.0, 79.0, 119.0, 120.0, 55.0, 33.0, 29.0, 30.0, 24.0, 19.0, 17.0, 17.0, 23.0, 15.0, 19.0, 15.0, 13.0, 13.0, 9.0, 8.0, 7.0, 3.0, 4.0, 4.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0], "bins": [-1.6989660263061523, -1.6455979347229004, -1.5922298431396484, -1.5388617515563965, -1.4854936599731445, -1.4321255683898926, -1.3787574768066406, -1.3253892660140991, -1.2720211744308472, -1.2186530828475952, -1.1652849912643433, -1.1119168996810913, -1.0585488080978394, -1.0051805973052979, -0.9518125653266907, -0.898444414138794, -0.8450763821601868, -0.7917082905769348, -0.7383401989936829, -0.6849720478057861, -0.6316039562225342, -0.5782358646392822, -0.5248677730560303, -0.47149965167045593, -0.418131560087204, -0.364763468503952, -0.3113953471183777, -0.25802725553512573, -0.20465914905071259, -0.15129104256629944, -0.09792295098304749, -0.044554829597473145, 0.008813261985778809, 0.06218136474490166, 0.1155494675040245, 0.16891756653785706, 0.2222856730222702, 0.27565377950668335, 0.3290218710899353, 0.38238999247550964, 0.4357580840587616, 0.48912617564201355, 0.5424942970275879, 0.5958623886108398, 0.6492304801940918, 0.7025985717773438, 0.7559666633605957, 0.8093348145484924, 0.8627029061317444, 0.9160709977149963, 0.9694390892982483, 1.022807240486145, 1.076175332069397, 1.129543423652649, 1.1829115152359009, 1.2362796068191528, 1.2896476984024048, 1.3430157899856567, 1.3963838815689087, 1.4497519731521606, 1.5031200647354126, 1.556488275527954, 1.609856367111206, 1.663224458694458, 1.71659255027771]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 1.0, 3.0, 8.0, 10.0, 9.0, 11.0, 29.0, 36.0, 61.0, 76.0, 114.0, 180.0, 301.0, 471.0, 799.0, 1390.0, 2586.0, 4982.0, 10777.0, 25950.0, 77301.0, 332413.0, 1615830.0, 1643095.0, 348134.0, 80668.0, 26844.0, 10883.0, 5085.0, 2689.0, 1429.0, 810.0, 493.0, 293.0, 170.0, 121.0, 72.0, 56.0, 30.0, 21.0, 15.0, 14.0, 9.0, 4.0, 3.0, 6.0, 1.0, 0.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.2310791015625, -0.22407913208007812, -0.21707916259765625, -0.21007919311523438, -0.2030792236328125, -0.19607925415039062, -0.18907928466796875, -0.18207931518554688, -0.175079345703125, -0.16807937622070312, -0.16107940673828125, -0.15407943725585938, -0.1470794677734375, -0.14007949829101562, -0.13307952880859375, -0.12607955932617188, -0.11907958984375, -0.11207962036132812, -0.10507965087890625, -0.09807968139648438, -0.0910797119140625, -0.08407974243164062, -0.07707977294921875, -0.07007980346679688, -0.063079833984375, -0.056079864501953125, -0.04907989501953125, -0.042079925537109375, -0.0350799560546875, -0.028079986572265625, -0.02108001708984375, -0.014080047607421875, -0.007080078125, -8.0108642578125e-05, 0.00691986083984375, 0.013919830322265625, 0.0209197998046875, 0.027919769287109375, 0.03491973876953125, 0.041919708251953125, 0.048919677734375, 0.055919647216796875, 0.06291961669921875, 0.06991958618164062, 0.0769195556640625, 0.08391952514648438, 0.09091949462890625, 0.09791946411132812, 0.10491943359375, 0.11191940307617188, 0.11891937255859375, 0.12591934204101562, 0.1329193115234375, 0.13991928100585938, 0.14691925048828125, 0.15391921997070312, 0.160919189453125, 0.16791915893554688, 0.17491912841796875, 0.18191909790039062, 0.1889190673828125, 0.19591903686523438, 0.20291900634765625, 0.20991897583007812, 0.2169189453125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 1.0, 3.0, 4.0, 3.0, 7.0, 5.0, 9.0, 9.0, 16.0, 11.0, 23.0, 10.0, 19.0, 30.0, 19.0, 32.0, 32.0, 37.0, 52.0, 49.0, 34.0, 45.0, 47.0, 39.0, 43.0, 51.0, 46.0, 36.0, 37.0, 35.0, 34.0, 36.0, 28.0, 27.0, 21.0, 14.0, 12.0, 12.0, 8.0, 11.0, 8.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.11566162109375, -0.11236381530761719, -0.10906600952148438, -0.10576820373535156, -0.10247039794921875, -0.09917259216308594, -0.09587478637695312, -0.09257698059082031, -0.0892791748046875, -0.08598136901855469, -0.08268356323242188, -0.07938575744628906, -0.07608795166015625, -0.07279014587402344, -0.06949234008789062, -0.06619453430175781, -0.062896728515625, -0.05959892272949219, -0.056301116943359375, -0.05300331115722656, -0.04970550537109375, -0.04640769958496094, -0.043109893798828125, -0.03981208801269531, -0.0365142822265625, -0.03321647644042969, -0.029918670654296875, -0.026620864868164062, -0.02332305908203125, -0.020025253295898438, -0.016727447509765625, -0.013429641723632812, -0.0101318359375, -0.0068340301513671875, -0.003536224365234375, -0.0002384185791015625, 0.00305938720703125, 0.0063571929931640625, 0.009654998779296875, 0.012952804565429688, 0.0162506103515625, 0.019548416137695312, 0.022846221923828125, 0.026144027709960938, 0.02944183349609375, 0.03273963928222656, 0.036037445068359375, 0.03933525085449219, 0.042633056640625, 0.04593086242675781, 0.049228668212890625, 0.05252647399902344, 0.05582427978515625, 0.05912208557128906, 0.062419891357421875, 0.06571769714355469, 0.0690155029296875, 0.07231330871582031, 0.07561111450195312, 0.07890892028808594, 0.08220672607421875, 0.08550453186035156, 0.08880233764648438, 0.09210014343261719, 0.09539794921875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 8.0, 6.0, 9.0, 16.0, 50.0, 150.0, 488.0, 3265.0, 4095718.0, 92723.0, 1420.0, 291.0, 95.0, 35.0, 9.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.974609375, -2.8748779296875, -2.775146484375, -2.6754150390625, -2.57568359375, -2.4759521484375, -2.376220703125, -2.2764892578125, -2.1767578125, -2.0770263671875, -1.977294921875, -1.8775634765625, -1.77783203125, -1.6781005859375, -1.578369140625, -1.4786376953125, -1.37890625, -1.2791748046875, -1.179443359375, -1.0797119140625, -0.97998046875, -0.8802490234375, -0.780517578125, -0.6807861328125, -0.5810546875, -0.4813232421875, -0.381591796875, -0.2818603515625, -0.18212890625, -0.0823974609375, 0.017333984375, 0.1170654296875, 0.216796875, 0.3165283203125, 0.416259765625, 0.5159912109375, 0.61572265625, 0.7154541015625, 0.815185546875, 0.9149169921875, 1.0146484375, 1.1143798828125, 1.214111328125, 1.3138427734375, 1.41357421875, 1.5133056640625, 1.613037109375, 1.7127685546875, 1.8125, 1.9122314453125, 2.011962890625, 2.1116943359375, 2.21142578125, 2.3111572265625, 2.410888671875, 2.5106201171875, 2.6103515625, 2.7100830078125, 2.809814453125, 2.9095458984375, 3.00927734375, 3.1090087890625, 3.208740234375, 3.3084716796875, 3.408203125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 9.0, 27.0, 76.0, 164.0, 419.0, 1117.0, 1403.0, 515.0, 217.0, 64.0, 32.0, 20.0, 8.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6328125, -1.5899658203125, -1.547119140625, -1.5042724609375, -1.46142578125, -1.4185791015625, -1.375732421875, -1.3328857421875, -1.2900390625, -1.2471923828125, -1.204345703125, -1.1614990234375, -1.11865234375, -1.0758056640625, -1.032958984375, -0.9901123046875, -0.947265625, -0.9044189453125, -0.861572265625, -0.8187255859375, -0.77587890625, -0.7330322265625, -0.690185546875, -0.6473388671875, -0.6044921875, -0.5616455078125, -0.518798828125, -0.4759521484375, -0.43310546875, -0.3902587890625, -0.347412109375, -0.3045654296875, -0.26171875, -0.2188720703125, -0.176025390625, -0.1331787109375, -0.09033203125, -0.0474853515625, -0.004638671875, 0.0382080078125, 0.0810546875, 0.1239013671875, 0.166748046875, 0.2095947265625, 0.25244140625, 0.2952880859375, 0.338134765625, 0.3809814453125, 0.423828125, 0.4666748046875, 0.509521484375, 0.5523681640625, 0.59521484375, 0.6380615234375, 0.680908203125, 0.7237548828125, 0.7666015625, 0.8094482421875, 0.852294921875, 0.8951416015625, 0.93798828125, 0.9808349609375, 1.023681640625, 1.0665283203125, 1.109375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 5.0, 12.0, 24.0, 66.0, 284.0, 373.0, 156.0, 55.0, 20.0, 7.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.826801300048828, -20.357345581054688, -19.88789176940918, -19.41843605041504, -18.94898223876953, -18.47952651977539, -18.01007080078125, -17.540616989135742, -17.0711612701416, -16.60170555114746, -16.132251739501953, -15.662796020507812, -15.193341255187988, -14.723886489868164, -14.25443172454834, -13.784976959228516, -13.315522193908691, -12.846067428588867, -12.376612663269043, -11.907157897949219, -11.437702178955078, -10.968247413635254, -10.49879264831543, -10.029337882995605, -9.559883117675781, -9.090428352355957, -8.620973587036133, -8.151517868041992, -7.682063102722168, -7.212608337402344, -6.7431535720825195, -6.273698806762695, -5.804244041442871, -5.334789276123047, -4.8653340339660645, -4.39587926864624, -3.926424264907837, -3.4569692611694336, -2.9875144958496094, -2.518059492111206, -2.0486044883728027, -1.5791494846343994, -1.1096946001052856, -0.6402397155761719, -0.17078471183776855, 0.29867029190063477, 0.768125057220459, 1.2375800609588623, 1.7070350646972656, 2.176490068435669, 2.6459450721740723, 3.1153998374938965, 3.5848548412323, 4.054309844970703, 4.523764610290527, 4.993219375610352, 5.462674617767334, 5.932129383087158, 6.401584625244141, 6.871039390563965, 7.340494155883789, 7.8099493980407715, 8.279403686523438, 8.748859405517578, 9.218314170837402]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 7.0, 9.0, 13.0, 23.0, 26.0, 49.0, 47.0, 60.0, 74.0, 73.0, 123.0, 116.0, 87.0, 59.0, 61.0, 42.0, 38.0, 27.0, 17.0, 9.0, 17.0, 6.0, 4.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5703020095825195, -6.390491962432861, -6.210681438446045, -6.030871391296387, -5.8510613441467285, -5.67125129699707, -5.491440773010254, -5.311630725860596, -5.1318206787109375, -4.952010631561279, -4.772200107574463, -4.592390060424805, -4.4125800132751465, -4.232769966125488, -4.052959442138672, -3.8731493949890137, -3.6933391094207764, -3.513528823852539, -3.333718776702881, -3.1539084911346436, -2.9740984439849854, -2.794288158416748, -2.61447811126709, -2.4346678256988525, -2.2548575401306152, -2.075047254562378, -1.8952372074127197, -1.7154269218444824, -1.5356168746948242, -1.355806589126587, -1.1759964227676392, -0.9961862564086914, -0.8163762092590332, -0.6365660429000854, -0.4567558467388153, -0.27694565057754517, -0.09713548421859741, 0.08267468214035034, 0.26248490810394287, 0.4422950744628906, 0.6221052408218384, 0.8019154071807861, 0.9817255735397339, 1.1615357398986816, 1.341346025466919, 1.5211560726165771, 1.7009663581848145, 1.8807765245437622, 2.06058669090271, 2.2403969764709473, 2.4202070236206055, 2.6000173091888428, 2.779827356338501, 2.9596376419067383, 3.1394476890563965, 3.319257974624634, 3.499068260192871, 3.6788785457611084, 3.8586885929107666, 4.038498878479004, 4.218308925628662, 4.39811897277832, 4.577929496765137, 4.757739543914795, 4.937549591064453]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 4.0, 6.0, 7.0, 9.0, 9.0, 16.0, 29.0, 53.0, 67.0, 99.0, 182.0, 335.0, 631.0, 1322.0, 3124.0, 7955.0, 25235.0, 109732.0, 630626.0, 207893.0, 41470.0, 11899.0, 4179.0, 1805.0, 776.0, 412.0, 237.0, 169.0, 100.0, 53.0, 25.0, 27.0, 21.0, 15.0, 10.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.440185546875, -0.42784881591796875, -0.4155120849609375, -0.40317535400390625, -0.390838623046875, -0.37850189208984375, -0.3661651611328125, -0.35382843017578125, -0.34149169921875, -0.32915496826171875, -0.3168182373046875, -0.30448150634765625, -0.292144775390625, -0.27980804443359375, -0.2674713134765625, -0.25513458251953125, -0.2427978515625, -0.23046112060546875, -0.2181243896484375, -0.20578765869140625, -0.193450927734375, -0.18111419677734375, -0.1687774658203125, -0.15644073486328125, -0.14410400390625, -0.13176727294921875, -0.1194305419921875, -0.10709381103515625, -0.094757080078125, -0.08242034912109375, -0.0700836181640625, -0.05774688720703125, -0.04541015625, -0.03307342529296875, -0.0207366943359375, -0.00839996337890625, 0.003936767578125, 0.01627349853515625, 0.0286102294921875, 0.04094696044921875, 0.05328369140625, 0.06562042236328125, 0.0779571533203125, 0.09029388427734375, 0.102630615234375, 0.11496734619140625, 0.1273040771484375, 0.13964080810546875, 0.1519775390625, 0.16431427001953125, 0.1766510009765625, 0.18898773193359375, 0.201324462890625, 0.21366119384765625, 0.2259979248046875, 0.23833465576171875, 0.25067138671875, 0.26300811767578125, 0.2753448486328125, 0.28768157958984375, 0.300018310546875, 0.31235504150390625, 0.3246917724609375, 0.33702850341796875, 0.349365234375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 7.0, 10.0, 15.0, 21.0, 37.0, 30.0, 52.0, 53.0, 63.0, 73.0, 90.0, 89.0, 90.0, 82.0, 71.0, 61.0, 46.0, 30.0, 26.0, 12.0, 9.0, 13.0, 6.0, 7.0, 5.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.381591796875, -0.3721351623535156, -0.36267852783203125, -0.3532218933105469, -0.3437652587890625, -0.3343086242675781, -0.32485198974609375, -0.3153953552246094, -0.305938720703125, -0.2964820861816406, -0.28702545166015625, -0.2775688171386719, -0.2681121826171875, -0.2586555480957031, -0.24919891357421875, -0.23974227905273438, -0.23028564453125, -0.22082901000976562, -0.21137237548828125, -0.20191574096679688, -0.1924591064453125, -0.18300247192382812, -0.17354583740234375, -0.16408920288085938, -0.154632568359375, -0.14517593383789062, -0.13571929931640625, -0.12626266479492188, -0.1168060302734375, -0.10734939575195312, -0.09789276123046875, -0.08843612670898438, -0.0789794921875, -0.06952285766601562, -0.06006622314453125, -0.050609588623046875, -0.0411529541015625, -0.031696319580078125, -0.02223968505859375, -0.012783050537109375, -0.003326416015625, 0.006130218505859375, 0.01558685302734375, 0.025043487548828125, 0.0345001220703125, 0.043956756591796875, 0.05341339111328125, 0.06287002563476562, 0.07232666015625, 0.08178329467773438, 0.09123992919921875, 0.10069656372070312, 0.1101531982421875, 0.11960983276367188, 0.12906646728515625, 0.13852310180664062, 0.147979736328125, 0.15743637084960938, 0.16689300537109375, 0.17634963989257812, 0.1858062744140625, 0.19526290893554688, 0.20471954345703125, 0.21417617797851562, 0.2236328125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 5.0, 2.0, 1.0, 2.0, 7.0, 11.0, 7.0, 11.0, 16.0, 27.0, 43.0, 39.0, 66.0, 97.0, 144.0, 199.0, 370.0, 659.0, 1381.0, 4158.0, 23916.0, 831063.0, 167201.0, 13792.0, 2897.0, 1104.0, 516.0, 283.0, 175.0, 104.0, 74.0, 45.0, 45.0, 19.0, 14.0, 13.0, 12.0, 10.0, 13.0, 4.0, 3.0, 6.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.61083984375, -0.592254638671875, -0.57366943359375, -0.555084228515625, -0.5364990234375, -0.517913818359375, -0.49932861328125, -0.480743408203125, -0.462158203125, -0.443572998046875, -0.42498779296875, -0.406402587890625, -0.3878173828125, -0.369232177734375, -0.35064697265625, -0.332061767578125, -0.3134765625, -0.294891357421875, -0.27630615234375, -0.257720947265625, -0.2391357421875, -0.220550537109375, -0.20196533203125, -0.183380126953125, -0.164794921875, -0.146209716796875, -0.12762451171875, -0.109039306640625, -0.0904541015625, -0.071868896484375, -0.05328369140625, -0.034698486328125, -0.01611328125, 0.002471923828125, 0.02105712890625, 0.039642333984375, 0.0582275390625, 0.076812744140625, 0.09539794921875, 0.113983154296875, 0.132568359375, 0.151153564453125, 0.16973876953125, 0.188323974609375, 0.2069091796875, 0.225494384765625, 0.24407958984375, 0.262664794921875, 0.28125, 0.299835205078125, 0.31842041015625, 0.337005615234375, 0.3555908203125, 0.374176025390625, 0.39276123046875, 0.411346435546875, 0.429931640625, 0.448516845703125, 0.46710205078125, 0.485687255859375, 0.5042724609375, 0.522857666015625, 0.54144287109375, 0.560028076171875, 0.57861328125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 5.0, 3.0, 8.0, 7.0, 8.0, 10.0, 12.0, 20.0, 28.0, 26.0, 28.0, 33.0, 43.0, 54.0, 59.0, 90.0, 89.0, 92.0, 75.0, 73.0, 44.0, 36.0, 28.0, 35.0, 22.0, 18.0, 14.0, 10.0, 11.0, 4.0, 6.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.044921875, -1.0139999389648438, -0.9830780029296875, -0.9521560668945312, -0.921234130859375, -0.8903121948242188, -0.8593902587890625, -0.8284683227539062, -0.79754638671875, -0.7666244506835938, -0.7357025146484375, -0.7047805786132812, -0.673858642578125, -0.6429367065429688, -0.6120147705078125, -0.5810928344726562, -0.5501708984375, -0.5192489624023438, -0.4883270263671875, -0.45740509033203125, -0.426483154296875, -0.39556121826171875, -0.3646392822265625, -0.33371734619140625, -0.30279541015625, -0.27187347412109375, -0.2409515380859375, -0.21002960205078125, -0.179107666015625, -0.14818572998046875, -0.1172637939453125, -0.08634185791015625, -0.055419921875, -0.02449798583984375, 0.0064239501953125, 0.03734588623046875, 0.068267822265625, 0.09918975830078125, 0.1301116943359375, 0.16103363037109375, 0.19195556640625, 0.22287750244140625, 0.2537994384765625, 0.28472137451171875, 0.315643310546875, 0.34656524658203125, 0.3774871826171875, 0.40840911865234375, 0.4393310546875, 0.47025299072265625, 0.5011749267578125, 0.5320968627929688, 0.563018798828125, 0.5939407348632812, 0.6248626708984375, 0.6557846069335938, 0.68670654296875, 0.7176284790039062, 0.7485504150390625, 0.7794723510742188, 0.810394287109375, 0.8413162231445312, 0.8722381591796875, 0.9031600952148438, 0.93408203125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 4.0, 6.0, 1.0, 5.0, 5.0, 11.0, 9.0, 11.0, 19.0, 26.0, 42.0, 71.0, 117.0, 237.0, 494.0, 1102.0, 3282.0, 13319.0, 130405.0, 866691.0, 24722.0, 4988.0, 1646.0, 633.0, 279.0, 148.0, 93.0, 55.0, 43.0, 20.0, 25.0, 8.0, 3.0, 6.0, 4.0, 5.0, 7.0, 3.0, 1.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.154541015625, -0.14941978454589844, -0.14429855346679688, -0.1391773223876953, -0.13405609130859375, -0.1289348602294922, -0.12381362915039062, -0.11869239807128906, -0.1135711669921875, -0.10844993591308594, -0.10332870483398438, -0.09820747375488281, -0.09308624267578125, -0.08796501159667969, -0.08284378051757812, -0.07772254943847656, -0.072601318359375, -0.06748008728027344, -0.062358856201171875, -0.05723762512207031, -0.05211639404296875, -0.04699516296386719, -0.041873931884765625, -0.03675270080566406, -0.0316314697265625, -0.026510238647460938, -0.021389007568359375, -0.016267776489257812, -0.01114654541015625, -0.0060253143310546875, -0.000904083251953125, 0.0042171478271484375, 0.00933837890625, 0.014459609985351562, 0.019580841064453125, 0.024702072143554688, 0.02982330322265625, 0.03494453430175781, 0.040065765380859375, 0.04518699645996094, 0.0503082275390625, 0.05542945861816406, 0.060550689697265625, 0.06567192077636719, 0.07079315185546875, 0.07591438293457031, 0.08103561401367188, 0.08615684509277344, 0.091278076171875, 0.09639930725097656, 0.10152053833007812, 0.10664176940917969, 0.11176300048828125, 0.11688423156738281, 0.12200546264648438, 0.12712669372558594, 0.1322479248046875, 0.13736915588378906, 0.14249038696289062, 0.1476116180419922, 0.15273284912109375, 0.1578540802001953, 0.16297531127929688, 0.16809654235839844, 0.1732177734375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 3.0, 8.0, 6.0, 11.0, 6.0, 12.0, 19.0, 27.0, 35.0, 55.0, 100.0, 183.0, 202.0, 111.0, 77.0, 42.0, 27.0, 16.0, 7.0, 5.0, 7.0, 8.0, 6.0, 2.0, 7.0, 5.0, 3.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.796287536621094e-05, -7.602013647556305e-05, -7.407739758491516e-05, -7.213465869426727e-05, -7.019191980361938e-05, -6.82491809129715e-05, -6.630644202232361e-05, -6.436370313167572e-05, -6.242096424102783e-05, -6.0478225350379944e-05, -5.8535486459732056e-05, -5.659274756908417e-05, -5.465000867843628e-05, -5.270726978778839e-05, -5.07645308971405e-05, -4.8821792006492615e-05, -4.6879053115844727e-05, -4.493631422519684e-05, -4.299357533454895e-05, -4.105083644390106e-05, -3.9108097553253174e-05, -3.7165358662605286e-05, -3.52226197719574e-05, -3.327988088130951e-05, -3.133714199066162e-05, -2.9394403100013733e-05, -2.7451664209365845e-05, -2.5508925318717957e-05, -2.356618642807007e-05, -2.162344753742218e-05, -1.9680708646774292e-05, -1.7737969756126404e-05, -1.5795230865478516e-05, -1.3852491974830627e-05, -1.190975308418274e-05, -9.967014193534851e-06, -8.024275302886963e-06, -6.081536412239075e-06, -4.1387975215911865e-06, -2.1960586309432983e-06, -2.5331974029541016e-07, 1.689419150352478e-06, 3.632158041000366e-06, 5.574896931648254e-06, 7.517635822296143e-06, 9.46037471294403e-06, 1.1403113603591919e-05, 1.3345852494239807e-05, 1.5288591384887695e-05, 1.7231330275535583e-05, 1.917406916618347e-05, 2.111680805683136e-05, 2.3059546947479248e-05, 2.5002285838127136e-05, 2.6945024728775024e-05, 2.8887763619422913e-05, 3.08305025100708e-05, 3.277324140071869e-05, 3.471598029136658e-05, 3.6658719182014465e-05, 3.8601458072662354e-05, 4.054419696331024e-05, 4.248693585395813e-05, 4.442967474460602e-05, 4.6372413635253906e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 3.0, 7.0, 9.0, 18.0, 21.0, 31.0, 42.0, 93.0, 126.0, 259.0, 453.0, 947.0, 2076.0, 4988.0, 15497.0, 80974.0, 868933.0, 54024.0, 12340.0, 4272.0, 1707.0, 791.0, 400.0, 225.0, 117.0, 70.0, 50.0, 28.0, 25.0, 12.0, 10.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0933837890625, -0.08984756469726562, -0.08631134033203125, -0.08277511596679688, -0.0792388916015625, -0.07570266723632812, -0.07216644287109375, -0.06863021850585938, -0.065093994140625, -0.061557769775390625, -0.05802154541015625, -0.054485321044921875, -0.0509490966796875, -0.047412872314453125, -0.04387664794921875, -0.040340423583984375, -0.03680419921875, -0.033267974853515625, -0.02973175048828125, -0.026195526123046875, -0.0226593017578125, -0.019123077392578125, -0.01558685302734375, -0.012050628662109375, -0.008514404296875, -0.004978179931640625, -0.00144195556640625, 0.002094268798828125, 0.0056304931640625, 0.009166717529296875, 0.01270294189453125, 0.016239166259765625, 0.019775390625, 0.023311614990234375, 0.02684783935546875, 0.030384063720703125, 0.0339202880859375, 0.037456512451171875, 0.04099273681640625, 0.044528961181640625, 0.048065185546875, 0.051601409912109375, 0.05513763427734375, 0.058673858642578125, 0.0622100830078125, 0.06574630737304688, 0.06928253173828125, 0.07281875610351562, 0.07635498046875, 0.07989120483398438, 0.08342742919921875, 0.08696365356445312, 0.0904998779296875, 0.09403610229492188, 0.09757232666015625, 0.10110855102539062, 0.104644775390625, 0.10818099975585938, 0.11171722412109375, 0.11525344848632812, 0.1187896728515625, 0.12232589721679688, 0.12586212158203125, 0.12939834594726562, 0.1329345703125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 6.0, 5.0, 6.0, 10.0, 10.0, 10.0, 13.0, 20.0, 20.0, 39.0, 46.0, 71.0, 118.0, 139.0, 122.0, 118.0, 72.0, 50.0, 27.0, 19.0, 12.0, 18.0, 9.0, 13.0, 4.0, 8.0, 5.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1019287109375, -0.09814262390136719, -0.09435653686523438, -0.09057044982910156, -0.08678436279296875, -0.08299827575683594, -0.07921218872070312, -0.07542610168457031, -0.0716400146484375, -0.06785392761230469, -0.06406784057617188, -0.06028175354003906, -0.05649566650390625, -0.05270957946777344, -0.048923492431640625, -0.04513740539550781, -0.041351318359375, -0.03756523132324219, -0.033779144287109375, -0.029993057250976562, -0.02620697021484375, -0.022420883178710938, -0.018634796142578125, -0.014848709106445312, -0.0110626220703125, -0.0072765350341796875, -0.003490447998046875, 0.0002956390380859375, 0.00408172607421875, 0.007867813110351562, 0.011653900146484375, 0.015439987182617188, 0.01922607421875, 0.023012161254882812, 0.026798248291015625, 0.030584335327148438, 0.03437042236328125, 0.03815650939941406, 0.041942596435546875, 0.04572868347167969, 0.0495147705078125, 0.05330085754394531, 0.057086944580078125, 0.06087303161621094, 0.06465911865234375, 0.06844520568847656, 0.07223129272460938, 0.07601737976074219, 0.079803466796875, 0.08358955383300781, 0.08737564086914062, 0.09116172790527344, 0.09494781494140625, 0.09873390197753906, 0.10251998901367188, 0.10630607604980469, 0.1100921630859375, 0.11387825012207031, 0.11766433715820312, 0.12145042419433594, 0.12523651123046875, 0.12902259826660156, 0.13280868530273438, 0.1365947723388672, 0.140380859375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 14.0, 24.0, 38.0, 71.0, 307.0, 352.0, 93.0, 44.0, 25.0, 9.0, 8.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.391907691955566, -4.250250339508057, -4.108593463897705, -3.9669361114501953, -3.8252789974212646, -3.683621883392334, -3.5419647693634033, -3.4003076553344727, -3.258650302886963, -3.1169931888580322, -2.9753360748291016, -2.833678722381592, -2.692021608352661, -2.5503644943237305, -2.4087073802948, -2.267050266265869, -2.1253931522369385, -1.9837360382080078, -1.8420788049697876, -1.700421690940857, -1.5587644577026367, -1.417107343673706, -1.2754502296447754, -1.1337931156158447, -0.9921358823776245, -0.8504787087440491, -0.7088215351104736, -0.567164421081543, -0.42550724744796753, -0.2838500738143921, -0.14219295978546143, -0.0005357861518859863, 0.14112138748168945, 0.2827785611152649, 0.42443570494651794, 0.566092848777771, 0.7077500224113464, 0.8494071960449219, 0.9910643100738525, 1.1327214241027832, 1.2743786573410034, 1.416035771369934, 1.5576930046081543, 1.699350118637085, 1.8410072326660156, 1.9826644659042358, 2.124321460723877, 2.2659788131713867, 2.4076359272003174, 2.549293041229248, 2.6909501552581787, 2.8326072692871094, 2.974264621734619, 3.11592173576355, 3.2575788497924805, 3.399235963821411, 3.540893077850342, 3.6825501918792725, 3.824207305908203, 3.965864658355713, 4.1075215339660645, 4.249178886413574, 4.390835762023926, 4.5324931144714355, 4.674150466918945]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 2.0, 4.0, 0.0, 8.0, 10.0, 10.0, 13.0, 7.0, 14.0, 13.0, 15.0, 18.0, 25.0, 17.0, 17.0, 25.0, 46.0, 272.0, 198.0, 39.0, 23.0, 15.0, 20.0, 21.0, 27.0, 25.0, 8.0, 21.0, 18.0, 10.0, 5.0, 8.0, 6.0, 4.0, 2.0, 6.0, 4.0, 2.0, 2.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.2743568420410156, -2.2071855068206787, -2.1400139331817627, -2.072842597961426, -2.0056710243225098, -1.9384996891021729, -1.8713282346725464, -1.80415678024292, -1.7369853258132935, -1.669813871383667, -1.6026424169540405, -1.535470962524414, -1.4682996273040771, -1.4011280536651611, -1.3339567184448242, -1.2667852640151978, -1.1996138095855713, -1.1324423551559448, -1.0652709007263184, -0.9980995059013367, -0.9309280514717102, -0.8637565970420837, -0.796585202217102, -0.7294137477874756, -0.6622422933578491, -0.5950708389282227, -0.5278993844985962, -0.4607279896736145, -0.39355653524398804, -0.3263850808143616, -0.2592136561870575, -0.19204223155975342, -0.12487101554870605, -0.057699576020240784, 0.009471863508224487, 0.07664330303668976, 0.14381474256515503, 0.2109861969947815, 0.27815762162208557, 0.34532904624938965, 0.4125005006790161, 0.4796719551086426, 0.546843409538269, 0.6140148043632507, 0.6811862587928772, 0.7483577132225037, 0.8155291080474854, 0.8827005624771118, 0.9498720169067383, 1.0170434713363647, 1.0842149257659912, 1.1513863801956177, 1.2185578346252441, 1.285729169845581, 1.3529006242752075, 1.420072078704834, 1.4872435331344604, 1.554414987564087, 1.6215864419937134, 1.6887578964233398, 1.7559292316436768, 1.8231008052825928, 1.8902721405029297, 1.9574435949325562, 2.0246150493621826]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 7.0, 5.0, 3.0, 8.0, 18.0, 13.0, 12.0, 18.0, 15.0, 23.0, 18.0, 43.0, 52.0, 67.0, 244.0, 151.0, 45.0, 46.0, 42.0, 32.0, 23.0, 30.0, 24.0, 15.0, 10.0, 10.0, 6.0, 6.0, 4.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.231201171875, -0.2241363525390625, -0.217071533203125, -0.2100067138671875, -0.20294189453125, -0.1958770751953125, -0.188812255859375, -0.1817474365234375, -0.1746826171875, -0.1676177978515625, -0.160552978515625, -0.1534881591796875, -0.14642333984375, -0.1393585205078125, -0.132293701171875, -0.1252288818359375, -0.1181640625, -0.1110992431640625, -0.104034423828125, -0.0969696044921875, -0.08990478515625, -0.0828399658203125, -0.075775146484375, -0.0687103271484375, -0.0616455078125, -0.0545806884765625, -0.047515869140625, -0.0404510498046875, -0.03338623046875, -0.0263214111328125, -0.019256591796875, -0.0121917724609375, -0.005126953125, 0.0019378662109375, 0.009002685546875, 0.0160675048828125, 0.02313232421875, 0.0301971435546875, 0.037261962890625, 0.0443267822265625, 0.0513916015625, 0.0584564208984375, 0.065521240234375, 0.0725860595703125, 0.07965087890625, 0.0867156982421875, 0.093780517578125, 0.1008453369140625, 0.10791015625, 0.1149749755859375, 0.122039794921875, 0.1291046142578125, 0.13616943359375, 0.1432342529296875, 0.150299072265625, 0.1573638916015625, 0.1644287109375, 0.1714935302734375, 0.178558349609375, 0.1856231689453125, 0.19268798828125, 0.1997528076171875, 0.206817626953125, 0.2138824462890625, 0.220947265625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 3.0, 8.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 3.0, 13.0, 16.0, 24.0, 22.0, 45.0, 76.0, 108.0, 236.0, 680.0, 2962.0, 29733.0, 8344713.0, 7915.0, 1299.0, 389.0, 139.0, 65.0, 34.0, 22.0, 25.0, 10.0, 3.0, 11.0, 7.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 0.0, 0.0, 0.0, 6.0], "bins": [-2.6175713539123535, -2.5364673137664795, -2.4553635120391846, -2.3742594718933105, -2.2931556701660156, -2.2120516300201416, -2.1309478282928467, -2.0498437881469727, -1.9687398672103882, -1.8876359462738037, -1.8065320253372192, -1.7254281044006348, -1.6443240642547607, -1.5632202625274658, -1.4821162223815918, -1.4010123014450073, -1.3199083805084229, -1.2388044595718384, -1.157700538635254, -1.0765966176986694, -0.9954926371574402, -0.9143887162208557, -0.8332847356796265, -0.752180814743042, -0.6710768938064575, -0.589972972869873, -0.5088690519332886, -0.4277650713920593, -0.34666115045547485, -0.2655572295188904, -0.18445327877998352, -0.10334932804107666, -0.02224564552307129, 0.05885829031467438, 0.13996222615242004, 0.2210661619901657, 0.3021700978279114, 0.38327401876449585, 0.4643779695034027, 0.5454819202423096, 0.626585841178894, 0.7076897621154785, 0.788793683052063, 0.8698976635932922, 0.9510015845298767, 1.0321054458618164, 1.1132094860076904, 1.194313406944275, 1.2754173278808594, 1.3565212488174438, 1.4376251697540283, 1.5187290906906128, 1.5998330116271973, 1.6809370517730713, 1.7620409727096558, 1.8431448936462402, 1.9242488145828247, 2.005352735519409, 2.086456775665283, 2.167560577392578, 2.248664617538452, 2.329768419265747, 2.410872459411621, 2.491976261138916, 2.57308030128479]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 7.0, 4.0, 1.0, 3.0, 9.0, 5.0, 2.0, 6.0, 2.0, 9.0, 3.0, 2.0, 4.0, 5.0, 8.0, 2.0, 3.0, 3.0, 6.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.8287630081176758, -1.7596369981765747, -1.6905111074447632, -1.621385097503662, -1.5522592067718506, -1.4831331968307495, -1.4140071868896484, -1.344881296157837, -1.2757552862167358, -1.2066292762756348, -1.1375033855438232, -1.0683773756027222, -0.9992514252662659, -0.9301254749298096, -0.8609994649887085, -0.7918735146522522, -0.7227475643157959, -0.6536216139793396, -0.5844956636428833, -0.5153696537017822, -0.4462437033653259, -0.37711775302886963, -0.30799177289009094, -0.23886579275131226, -0.16973984241485596, -0.10061387717723846, -0.03148791193962097, 0.03763805329799652, 0.10676401853561401, 0.1758899688720703, 0.245015949010849, 0.3141419291496277, 0.3832676410675049, 0.4523935914039612, 0.5215195417404175, 0.5906455516815186, 0.6597715020179749, 0.7288974523544312, 0.7980234622955322, 0.8671494126319885, 0.9362753629684448, 1.005401372909546, 1.0745272636413574, 1.1436532735824585, 1.2127792835235596, 1.281905174255371, 1.3510311841964722, 1.4201571941375732, 1.4892830848693848, 1.5584090948104858, 1.6275349855422974, 1.6966609954833984, 1.76578688621521, 1.834912896156311, 1.904038906097412, 1.9731647968292236, 2.042290687561035, 2.1114165782928467, 2.1805427074432373, 2.249668598175049, 2.3187944889068604, 2.387920379638672, 2.4570465087890625, 2.526172399520874, 2.5952985286712646]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 9.0, 16.0, 13.0, 17.0, 26.0, 29.0, 45.0, 94.0, 160.0, 370.0, 885.0, 2699.0, 10178.0, 55171.0, 291858.0, 134716.0, 20769.0, 4775.0, 1434.0, 510.0, 221.0, 99.0, 61.0, 36.0, 26.0, 15.0, 16.0, 5.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.701171875, -2.61328125, -2.525390625, -2.4375, -2.349609375, -2.26171875, -2.173828125, -2.0859375, -1.998046875, -1.91015625, -1.822265625, -1.734375, -1.646484375, -1.55859375, -1.470703125, -1.3828125, -1.294921875, -1.20703125, -1.119140625, -1.03125, -0.943359375, -0.85546875, -0.767578125, -0.6796875, -0.591796875, -0.50390625, -0.416015625, -0.328125, -0.240234375, -0.15234375, -0.064453125, 0.0234375, 0.111328125, 0.19921875, 0.287109375, 0.375, 0.462890625, 0.55078125, 0.638671875, 0.7265625, 0.814453125, 0.90234375, 0.990234375, 1.078125, 1.166015625, 1.25390625, 1.341796875, 1.4296875, 1.517578125, 1.60546875, 1.693359375, 1.78125, 1.869140625, 1.95703125, 2.044921875, 2.1328125, 2.220703125, 2.30859375, 2.396484375, 2.484375, 2.572265625, 2.66015625, 2.748046875, 2.8359375, 2.923828125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 2.0, 1.0, 2.0, 9.0, 15.0, 17.0, 22.0, 25.0, 38.0, 38.0, 47.0, 54.0, 72.0, 93.0, 89.0, 88.0, 81.0, 74.0, 60.0, 44.0, 37.0, 30.0, 17.0, 18.0, 12.0, 9.0, 5.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 2.0], "bins": [-0.3427734375, -0.3348102569580078, -0.3268470764160156, -0.31888389587402344, -0.31092071533203125, -0.30295753479003906, -0.2949943542480469, -0.2870311737060547, -0.2790679931640625, -0.2711048126220703, -0.2631416320800781, -0.25517845153808594, -0.24721527099609375, -0.23925209045410156, -0.23128890991210938, -0.2233257293701172, -0.215362548828125, -0.2073993682861328, -0.19943618774414062, -0.19147300720214844, -0.18350982666015625, -0.17554664611816406, -0.16758346557617188, -0.1596202850341797, -0.1516571044921875, -0.1436939239501953, -0.13573074340820312, -0.12776756286621094, -0.11980438232421875, -0.11184120178222656, -0.10387802124023438, -0.09591484069824219, -0.08795166015625, -0.07998847961425781, -0.07202529907226562, -0.06406211853027344, -0.05609893798828125, -0.04813575744628906, -0.040172576904296875, -0.03220939636230469, -0.0242462158203125, -0.016283035278320312, -0.008319854736328125, -0.0003566741943359375, 0.00760650634765625, 0.015569686889648438, 0.023532867431640625, 0.03149604797363281, 0.039459228515625, 0.04742240905761719, 0.055385589599609375, 0.06334877014160156, 0.07131195068359375, 0.07927513122558594, 0.08723831176757812, 0.09520149230957031, 0.1031646728515625, 0.11112785339355469, 0.11909103393554688, 0.12705421447753906, 0.13501739501953125, 0.14298057556152344, 0.15094375610351562, 0.1589069366455078, 0.1668701171875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 6.0, 11.0, 12.0, 14.0, 19.0, 45.0, 75.0, 82.0, 80.0, 56.0, 29.0, 14.0, 8.0, 6.0, 4.0, 7.0, 3.0, 1.0, 3.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5827906131744385, -1.5232466459274292, -1.46370267868042, -1.4041587114334106, -1.3446147441864014, -1.285070776939392, -1.2255268096923828, -1.1659828424453735, -1.1064388751983643, -1.046894907951355, -0.9873509407043457, -0.9278069734573364, -0.8682630062103271, -0.8087190389633179, -0.7491750717163086, -0.6896311044692993, -0.6300871968269348, -0.5705432295799255, -0.5109992623329163, -0.451455295085907, -0.3919113278388977, -0.3323673903942108, -0.27282342314720154, -0.21327945590019226, -0.15373548865318298, -0.0941915214061737, -0.034647561609745026, 0.024896398186683655, 0.08444036543369293, 0.14398431777954102, 0.2035282850265503, 0.26307225227355957, 0.32261621952056885, 0.3821601867675781, 0.4417041540145874, 0.5012481212615967, 0.560792088508606, 0.6203360557556152, 0.6798800230026245, 0.7394239902496338, 0.7989679574966431, 0.8585119247436523, 0.9180558919906616, 0.9775998592376709, 1.0371438264846802, 1.0966877937316895, 1.1562317609786987, 1.215775728225708, 1.2753195762634277, 1.334863543510437, 1.3944075107574463, 1.4539514780044556, 1.5134954452514648, 1.5730394124984741, 1.6325833797454834, 1.6921273469924927, 1.751671314239502, 1.8112152814865112, 1.8707592487335205, 1.9303032159805298, 1.989847183227539, 2.049391031265259, 2.1089351177215576, 2.1684789657592773, 2.228023052215576]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 3.0, 5.0, 4.0, 4.0, 6.0, 8.0, 8.0, 17.0, 26.0, 82.0, 118.0, 93.0, 46.0, 22.0, 4.0, 4.0, 10.0, 7.0, 5.0, 6.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3065214157104492, -1.265740156173706, -1.2249587774276733, -1.1841775178909302, -1.143396258354187, -1.1026148796081543, -1.0618336200714111, -1.021052360534668, -0.9802709817886353, -0.9394896626472473, -0.8987084031105042, -0.8579270839691162, -0.8171457648277283, -0.7763644456863403, -0.7355831861495972, -0.6948018670082092, -0.6540206074714661, -0.6132392883300781, -0.572458028793335, -0.531676709651947, -0.4908953905105591, -0.45011410117149353, -0.409332811832428, -0.36855149269104004, -0.3277702033519745, -0.28698891401290894, -0.246207594871521, -0.20542630553245544, -0.1646450012922287, -0.12386369705200195, -0.0830824077129364, -0.04230108857154846, -0.0015197992324829102, 0.03926150128245354, 0.08004280179738998, 0.12082409858703613, 0.16160540282726288, 0.20238670706748962, 0.24316799640655518, 0.2839493155479431, 0.32473060488700867, 0.3655118942260742, 0.40629321336746216, 0.4470745027065277, 0.48785579204559326, 0.5286371111869812, 0.5694184303283691, 0.6101996898651123, 0.6509810090065002, 0.6917623281478882, 0.7325435876846313, 0.7733249068260193, 0.8141062259674072, 0.8548874855041504, 0.8956688046455383, 0.9364501237869263, 0.9772313833236694, 1.0180126428604126, 1.0587940216064453, 1.0995752811431885, 1.1403565406799316, 1.1811379194259644, 1.2219191789627075, 1.2627005577087402, 1.3034818172454834]}, "eval/loss": 4.200125694274902, "eval/wer": 1.9598968663228877, "eval/runtime": 786.8447, "eval/samples_per_second": 3.358, "eval/steps_per_second": 0.281} \ No newline at end of file +{"train/loss": 4.4907, "train/learning_rate": 3.1914893617021275e-07, "train/epoch": 1.0, "train/global_step": 594, "_runtime": 5718, "_timestamp": 1646079957, "_step": 595, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 10.0, 548.0, 448.0, 11.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.368497848510742, -13.00784683227539, -8.647195816040039, -4.2865447998046875, 0.07410621643066406, 4.434757232666016, 8.795408248901367, 13.156059265136719, 17.51671028137207, 21.877361297607422, 26.238012313842773, 30.598663330078125, 34.959312438964844, 39.31996536254883, 43.68061828613281, 48.04126739501953, 52.40191650390625, 56.76256561279297, 61.12321853637695, 65.48387145996094, 69.84452056884766, 74.20516967773438, 78.56582641601562, 82.92647552490234, 87.28712463378906, 91.64777374267578, 96.0084228515625, 100.36907958984375, 104.72972869873047, 109.09037780761719, 113.45103454589844, 117.81168365478516, 122.17233276367188, 126.5329818725586, 130.8936309814453, 135.25428771972656, 139.61492919921875, 143.9755859375, 148.33624267578125, 152.69688415527344, 157.0575408935547, 161.41819763183594, 165.77883911132812, 170.13949584960938, 174.50015258789062, 178.8607940673828, 183.22145080566406, 187.58209228515625, 191.9427490234375, 196.30340576171875, 200.66404724121094, 205.0247039794922, 209.38534545898438, 213.74600219726562, 218.10665893554688, 222.46730041503906, 226.8279571533203, 231.18861389160156, 235.54925537109375, 239.909912109375, 244.27056884765625, 248.63121032714844, 252.9918670654297, 257.3525085449219, 261.7131652832031]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 6.0, 1.0, 2.0, 11.0, 7.0, 6.0, 16.0, 13.0, 18.0, 20.0, 23.0, 27.0, 29.0, 25.0, 36.0, 44.0, 38.0, 33.0, 30.0, 39.0, 56.0, 53.0, 59.0, 39.0, 36.0, 41.0, 37.0, 33.0, 35.0, 27.0, 23.0, 28.0, 28.0, 21.0, 13.0, 16.0, 5.0, 5.0, 10.0, 4.0, 2.0, 3.0, 5.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.572723388671875, -20.85820770263672, -20.143692016601562, -19.429176330566406, -18.71466064453125, -18.00014305114746, -17.285627365112305, -16.57111167907715, -15.856595993041992, -15.142080307006836, -14.42756462097168, -13.713047981262207, -12.99853229522705, -12.284016609191895, -11.569499969482422, -10.854984283447266, -10.14046859741211, -9.425952911376953, -8.711437225341797, -7.996920585632324, -7.282404899597168, -6.567889213562012, -5.853373050689697, -5.138856887817383, -4.424341201782227, -3.709825277328491, -2.995309352874756, -2.2807934284210205, -1.5662775039672852, -0.8517615795135498, -0.13724565505981445, 0.5772705078125, 1.2917861938476562, 2.0063021183013916, 2.720818042755127, 3.4353339672088623, 4.149849891662598, 4.864365577697754, 5.578881740570068, 6.293397903442383, 7.007913589477539, 7.722429275512695, 8.436944961547852, 9.151461601257324, 9.86597728729248, 10.580492973327637, 11.29500961303711, 12.009525299072266, 12.724040985107422, 13.438556671142578, 14.153072357177734, 14.867588996887207, 15.582104682922363, 16.296621322631836, 17.011137008666992, 17.72565269470215, 18.440168380737305, 19.15468406677246, 19.869199752807617, 20.583715438842773, 21.298233032226562, 22.01274871826172, 22.727264404296875, 23.44178009033203, 24.156295776367188]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 6.0, 8.0, 3.0, 8.0, 11.0, 10.0, 16.0, 22.0, 17.0, 19.0, 23.0, 36.0, 22.0, 35.0, 33.0, 30.0, 43.0, 39.0, 48.0, 41.0, 45.0, 49.0, 46.0, 42.0, 34.0, 30.0, 45.0, 35.0, 27.0, 33.0, 26.0, 30.0, 17.0, 16.0, 13.0, 6.0, 9.0, 5.0, 9.0, 10.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1904296875, -1.1525115966796875, -1.114593505859375, -1.0766754150390625, -1.03875732421875, -1.0008392333984375, -0.962921142578125, -0.9250030517578125, -0.8870849609375, -0.8491668701171875, -0.811248779296875, -0.7733306884765625, -0.73541259765625, -0.6974945068359375, -0.659576416015625, -0.6216583251953125, -0.583740234375, -0.5458221435546875, -0.507904052734375, -0.4699859619140625, -0.43206787109375, -0.3941497802734375, -0.356231689453125, -0.3183135986328125, -0.2803955078125, -0.2424774169921875, -0.204559326171875, -0.1666412353515625, -0.12872314453125, -0.0908050537109375, -0.052886962890625, -0.0149688720703125, 0.02294921875, 0.0608673095703125, 0.098785400390625, 0.1367034912109375, 0.17462158203125, 0.2125396728515625, 0.250457763671875, 0.2883758544921875, 0.3262939453125, 0.3642120361328125, 0.402130126953125, 0.4400482177734375, 0.47796630859375, 0.5158843994140625, 0.553802490234375, 0.5917205810546875, 0.629638671875, 0.6675567626953125, 0.705474853515625, 0.7433929443359375, 0.78131103515625, 0.8192291259765625, 0.857147216796875, 0.8950653076171875, 0.9329833984375, 0.9709014892578125, 1.008819580078125, 1.0467376708984375, 1.08465576171875, 1.1225738525390625, 1.160491943359375, 1.1984100341796875, 1.236328125]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 8.0, 8.0, 9.0, 9.0, 24.0, 24.0, 33.0, 36.0, 57.0, 95.0, 129.0, 192.0, 308.0, 504.0, 775.0, 1315.0, 2239.0, 4421.0, 11468.0, 39459.0, 231150.0, 2016112.0, 1650216.0, 182969.0, 33397.0, 10070.0, 4090.0, 2023.0, 1151.0, 684.0, 434.0, 304.0, 161.0, 139.0, 71.0, 53.0, 40.0, 27.0, 16.0, 17.0, 9.0, 9.0, 5.0, 7.0, 5.0, 5.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-3.978515625, -3.861297607421875, -3.74407958984375, -3.626861572265625, -3.5096435546875, -3.392425537109375, -3.27520751953125, -3.157989501953125, -3.040771484375, -2.923553466796875, -2.80633544921875, -2.689117431640625, -2.5718994140625, -2.454681396484375, -2.33746337890625, -2.220245361328125, -2.10302734375, -1.985809326171875, -1.86859130859375, -1.751373291015625, -1.6341552734375, -1.516937255859375, -1.39971923828125, -1.282501220703125, -1.165283203125, -1.048065185546875, -0.93084716796875, -0.813629150390625, -0.6964111328125, -0.579193115234375, -0.46197509765625, -0.344757080078125, -0.2275390625, -0.110321044921875, 0.00689697265625, 0.124114990234375, 0.2413330078125, 0.358551025390625, 0.47576904296875, 0.592987060546875, 0.710205078125, 0.827423095703125, 0.94464111328125, 1.061859130859375, 1.1790771484375, 1.296295166015625, 1.41351318359375, 1.530731201171875, 1.64794921875, 1.765167236328125, 1.88238525390625, 1.999603271484375, 2.1168212890625, 2.234039306640625, 2.35125732421875, 2.468475341796875, 2.585693359375, 2.702911376953125, 2.82012939453125, 2.937347412109375, 3.0545654296875, 3.171783447265625, 3.28900146484375, 3.406219482421875, 3.5234375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 9.0, 20.0, 42.0, 64.0, 79.0, 143.0, 234.0, 413.0, 711.0, 810.0, 625.0, 349.0, 214.0, 124.0, 92.0, 54.0, 22.0, 21.0, 17.0, 11.0, 4.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.83984375, -7.62384033203125, -7.4078369140625, -7.19183349609375, -6.975830078125, -6.75982666015625, -6.5438232421875, -6.32781982421875, -6.11181640625, -5.89581298828125, -5.6798095703125, -5.46380615234375, -5.247802734375, -5.03179931640625, -4.8157958984375, -4.59979248046875, -4.3837890625, -4.16778564453125, -3.9517822265625, -3.73577880859375, -3.519775390625, -3.30377197265625, -3.0877685546875, -2.87176513671875, -2.65576171875, -2.43975830078125, -2.2237548828125, -2.00775146484375, -1.791748046875, -1.57574462890625, -1.3597412109375, -1.14373779296875, -0.927734375, -0.71173095703125, -0.4957275390625, -0.27972412109375, -0.063720703125, 0.15228271484375, 0.3682861328125, 0.58428955078125, 0.80029296875, 1.01629638671875, 1.2322998046875, 1.44830322265625, 1.664306640625, 1.88031005859375, 2.0963134765625, 2.31231689453125, 2.5283203125, 2.74432373046875, 2.9603271484375, 3.17633056640625, 3.392333984375, 3.60833740234375, 3.8243408203125, 4.04034423828125, 4.25634765625, 4.47235107421875, 4.6883544921875, 4.90435791015625, 5.120361328125, 5.33636474609375, 5.5523681640625, 5.76837158203125, 5.984375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 5.0, 6.0, 18.0, 21.0, 35.0, 81.0, 168.0, 287.0, 534.0, 1220.0, 3921.0, 70392.0, 4064315.0, 47327.0, 3595.0, 1183.0, 491.0, 299.0, 137.0, 85.0, 63.0, 28.0, 18.0, 7.0, 8.0, 8.0, 7.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-23.046875, -22.358154296875, -21.66943359375, -20.980712890625, -20.2919921875, -19.603271484375, -18.91455078125, -18.225830078125, -17.537109375, -16.848388671875, -16.15966796875, -15.470947265625, -14.7822265625, -14.093505859375, -13.40478515625, -12.716064453125, -12.02734375, -11.338623046875, -10.64990234375, -9.961181640625, -9.2724609375, -8.583740234375, -7.89501953125, -7.206298828125, -6.517578125, -5.828857421875, -5.14013671875, -4.451416015625, -3.7626953125, -3.073974609375, -2.38525390625, -1.696533203125, -1.0078125, -0.319091796875, 0.36962890625, 1.058349609375, 1.7470703125, 2.435791015625, 3.12451171875, 3.813232421875, 4.501953125, 5.190673828125, 5.87939453125, 6.568115234375, 7.2568359375, 7.945556640625, 8.63427734375, 9.322998046875, 10.01171875, 10.700439453125, 11.38916015625, 12.077880859375, 12.7666015625, 13.455322265625, 14.14404296875, 14.832763671875, 15.521484375, 16.210205078125, 16.89892578125, 17.587646484375, 18.2763671875, 18.965087890625, 19.65380859375, 20.342529296875, 21.03125]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 294.0, 709.0, 10.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-229.29066467285156, -224.8906707763672, -220.4906768798828, -216.09068298339844, -211.69068908691406, -207.2906951904297, -202.8907012939453, -198.49069213867188, -194.0906982421875, -189.69070434570312, -185.29071044921875, -180.89071655273438, -176.49072265625, -172.09072875976562, -167.69073486328125, -163.29074096679688, -158.8907470703125, -154.49075317382812, -150.09075927734375, -145.69076538085938, -141.290771484375, -136.89077758789062, -132.49078369140625, -128.09078979492188, -123.69078826904297, -119.2907943725586, -114.89080047607422, -110.49080657958984, -106.09080505371094, -101.69081115722656, -97.29081726074219, -92.89082336425781, -88.49083709716797, -84.0908432006836, -79.69084930419922, -75.29085540771484, -70.89085388183594, -66.49085998535156, -62.09086608886719, -57.69087219238281, -53.29087829589844, -48.89088439941406, -44.49089050292969, -40.09089279174805, -35.69089889526367, -31.290904998779297, -26.89090919494629, -22.49091339111328, -18.090919494628906, -13.690924644470215, -9.290929794311523, -4.890934944152832, -0.4909400939941406, 3.9090538024902344, 8.309049606323242, 12.70904541015625, 17.109039306640625, 21.509033203125, 25.909029006958008, 30.309024810791016, 34.70901870727539, 39.109012603759766, 43.509010314941406, 47.90900421142578, 52.308998107910156]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 6.0, 6.0, 10.0, 6.0, 6.0, 14.0, 15.0, 15.0, 26.0, 29.0, 35.0, 34.0, 42.0, 38.0, 39.0, 54.0, 38.0, 63.0, 40.0, 40.0, 52.0, 53.0, 38.0, 40.0, 48.0, 33.0, 21.0, 27.0, 22.0, 18.0, 18.0, 21.0, 11.0, 9.0, 6.0, 9.0, 5.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.034442901611328, -19.45001220703125, -18.865581512451172, -18.281150817871094, -17.696720123291016, -17.11229133605957, -16.527860641479492, -15.943429946899414, -15.358999252319336, -14.774568557739258, -14.19013786315918, -13.605708122253418, -13.02127742767334, -12.436846733093262, -11.8524169921875, -11.267986297607422, -10.683555603027344, -10.099124908447266, -9.514694213867188, -8.930264472961426, -8.345833778381348, -7.7614030838012695, -7.17697286605835, -6.59254264831543, -6.008111953735352, -5.423681259155273, -4.8392510414123535, -4.254820823669434, -3.6703901290893555, -3.0859596729278564, -2.5015292167663574, -1.9170989990234375, -1.3326702117919922, -0.7482397556304932, -0.16380929946899414, 0.4206211566925049, 1.005051612854004, 1.589482069015503, 2.173912525177002, 2.758342742919922, 3.3427734375, 3.927203893661499, 4.511634349822998, 5.096064567565918, 5.680495262145996, 6.264925956726074, 6.849356174468994, 7.433786392211914, 8.018217086791992, 8.60264778137207, 9.187078475952148, 9.77150821685791, 10.355938911437988, 10.940369606018066, 11.524799346923828, 12.109230041503906, 12.693660736083984, 13.278091430664062, 13.86252212524414, 14.446951866149902, 15.03138256072998, 15.615813255310059, 16.20024299621582, 16.7846736907959, 17.369104385375977]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 5.0, 3.0, 11.0, 5.0, 7.0, 10.0, 11.0, 6.0, 12.0, 18.0, 21.0, 13.0, 23.0, 20.0, 24.0, 29.0, 31.0, 27.0, 27.0, 33.0, 26.0, 34.0, 34.0, 44.0, 45.0, 47.0, 45.0, 32.0, 33.0, 23.0, 33.0, 25.0, 33.0, 25.0, 27.0, 22.0, 18.0, 24.0, 20.0, 11.0, 14.0, 10.0, 10.0, 12.0, 7.0, 3.0, 6.0, 4.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.06640625, -1.032379150390625, -0.99835205078125, -0.964324951171875, -0.9302978515625, -0.896270751953125, -0.86224365234375, -0.828216552734375, -0.794189453125, -0.760162353515625, -0.72613525390625, -0.692108154296875, -0.6580810546875, -0.624053955078125, -0.59002685546875, -0.555999755859375, -0.52197265625, -0.487945556640625, -0.45391845703125, -0.419891357421875, -0.3858642578125, -0.351837158203125, -0.31781005859375, -0.283782958984375, -0.249755859375, -0.215728759765625, -0.18170166015625, -0.147674560546875, -0.1136474609375, -0.079620361328125, -0.04559326171875, -0.011566162109375, 0.0224609375, 0.056488037109375, 0.09051513671875, 0.124542236328125, 0.1585693359375, 0.192596435546875, 0.22662353515625, 0.260650634765625, 0.294677734375, 0.328704833984375, 0.36273193359375, 0.396759033203125, 0.4307861328125, 0.464813232421875, 0.49884033203125, 0.532867431640625, 0.56689453125, 0.600921630859375, 0.63494873046875, 0.668975830078125, 0.7030029296875, 0.737030029296875, 0.77105712890625, 0.805084228515625, 0.839111328125, 0.873138427734375, 0.90716552734375, 0.941192626953125, 0.9752197265625, 1.009246826171875, 1.04327392578125, 1.077301025390625, 1.111328125]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 8.0, 11.0, 24.0, 24.0, 25.0, 50.0, 86.0, 137.0, 213.0, 302.0, 403.0, 732.0, 1084.0, 1653.0, 2619.0, 4081.0, 6619.0, 10496.0, 17099.0, 27926.0, 45922.0, 78847.0, 149047.0, 323990.0, 165198.0, 84497.0, 49332.0, 29557.0, 18126.0, 11362.0, 6977.0, 4440.0, 2777.0, 1726.0, 1103.0, 729.0, 455.0, 319.0, 174.0, 112.0, 90.0, 57.0, 44.0, 21.0, 19.0, 17.0, 8.0, 8.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.2437744140625, -0.23628807067871094, -0.22880172729492188, -0.2213153839111328, -0.21382904052734375, -0.2063426971435547, -0.19885635375976562, -0.19137001037597656, -0.1838836669921875, -0.17639732360839844, -0.16891098022460938, -0.1614246368408203, -0.15393829345703125, -0.1464519500732422, -0.13896560668945312, -0.13147926330566406, -0.123992919921875, -0.11650657653808594, -0.10902023315429688, -0.10153388977050781, -0.09404754638671875, -0.08656120300292969, -0.07907485961914062, -0.07158851623535156, -0.0641021728515625, -0.05661582946777344, -0.049129486083984375, -0.04164314270019531, -0.03415679931640625, -0.026670455932617188, -0.019184112548828125, -0.011697769165039062, -0.00421142578125, 0.0032749176025390625, 0.010761260986328125, 0.018247604370117188, 0.02573394775390625, 0.03322029113769531, 0.040706634521484375, 0.04819297790527344, 0.0556793212890625, 0.06316566467285156, 0.07065200805664062, 0.07813835144042969, 0.08562469482421875, 0.09311103820800781, 0.10059738159179688, 0.10808372497558594, 0.115570068359375, 0.12305641174316406, 0.13054275512695312, 0.1380290985107422, 0.14551544189453125, 0.1530017852783203, 0.16048812866210938, 0.16797447204589844, 0.1754608154296875, 0.18294715881347656, 0.19043350219726562, 0.1979198455810547, 0.20540618896484375, 0.2128925323486328, 0.22037887573242188, 0.22786521911621094, 0.2353515625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 8.0, 3.0, 6.0, 6.0, 5.0, 7.0, 8.0, 11.0, 12.0, 16.0, 14.0, 23.0, 32.0, 29.0, 29.0, 26.0, 21.0, 38.0, 31.0, 35.0, 40.0, 44.0, 41.0, 1065.0, 35.0, 35.0, 43.0, 31.0, 38.0, 30.0, 34.0, 22.0, 22.0, 18.0, 29.0, 28.0, 14.0, 13.0, 18.0, 15.0, 10.0, 11.0, 12.0, 8.0, 5.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.72607421875, -0.703216552734375, -0.68035888671875, -0.657501220703125, -0.6346435546875, -0.611785888671875, -0.58892822265625, -0.566070556640625, -0.543212890625, -0.520355224609375, -0.49749755859375, -0.474639892578125, -0.4517822265625, -0.428924560546875, -0.40606689453125, -0.383209228515625, -0.3603515625, -0.337493896484375, -0.31463623046875, -0.291778564453125, -0.2689208984375, -0.246063232421875, -0.22320556640625, -0.200347900390625, -0.177490234375, -0.154632568359375, -0.13177490234375, -0.108917236328125, -0.0860595703125, -0.063201904296875, -0.04034423828125, -0.017486572265625, 0.00537109375, 0.028228759765625, 0.05108642578125, 0.073944091796875, 0.0968017578125, 0.119659423828125, 0.14251708984375, 0.165374755859375, 0.188232421875, 0.211090087890625, 0.23394775390625, 0.256805419921875, 0.2796630859375, 0.302520751953125, 0.32537841796875, 0.348236083984375, 0.37109375, 0.393951416015625, 0.41680908203125, 0.439666748046875, 0.4625244140625, 0.485382080078125, 0.50823974609375, 0.531097412109375, 0.553955078125, 0.576812744140625, 0.59967041015625, 0.622528076171875, 0.6453857421875, 0.668243408203125, 0.69110107421875, 0.713958740234375, 0.73681640625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 4.0, 6.0, 6.0, 12.0, 19.0, 34.0, 51.0, 71.0, 83.0, 133.0, 169.0, 292.0, 432.0, 528.0, 813.0, 1101.0, 1715.0, 2372.0, 3365.0, 5158.0, 7405.0, 10987.0, 16247.0, 24782.0, 39352.0, 63459.0, 112377.0, 1253693.0, 263974.0, 111353.0, 63116.0, 38834.0, 24805.0, 16195.0, 10821.0, 7183.0, 4971.0, 3420.0, 2335.0, 1677.0, 1175.0, 764.0, 542.0, 415.0, 300.0, 191.0, 108.0, 92.0, 73.0, 40.0, 38.0, 20.0, 6.0, 13.0, 6.0, 6.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.194580078125, -0.18849754333496094, -0.18241500854492188, -0.1763324737548828, -0.17024993896484375, -0.1641674041748047, -0.15808486938476562, -0.15200233459472656, -0.1459197998046875, -0.13983726501464844, -0.13375473022460938, -0.1276721954345703, -0.12158966064453125, -0.11550712585449219, -0.10942459106445312, -0.10334205627441406, -0.097259521484375, -0.09117698669433594, -0.08509445190429688, -0.07901191711425781, -0.07292938232421875, -0.06684684753417969, -0.060764312744140625, -0.05468177795410156, -0.0485992431640625, -0.04251670837402344, -0.036434173583984375, -0.030351638793945312, -0.02426910400390625, -0.018186569213867188, -0.012104034423828125, -0.0060214996337890625, 6.103515625e-05, 0.0061435699462890625, 0.012226104736328125, 0.018308639526367188, 0.02439117431640625, 0.030473709106445312, 0.036556243896484375, 0.04263877868652344, 0.0487213134765625, 0.05480384826660156, 0.060886383056640625, 0.06696891784667969, 0.07305145263671875, 0.07913398742675781, 0.08521652221679688, 0.09129905700683594, 0.097381591796875, 0.10346412658691406, 0.10954666137695312, 0.11562919616699219, 0.12171173095703125, 0.1277942657470703, 0.13387680053710938, 0.13995933532714844, 0.1460418701171875, 0.15212440490722656, 0.15820693969726562, 0.1642894744873047, 0.17037200927734375, 0.1764545440673828, 0.18253707885742188, 0.18861961364746094, 0.1947021484375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 3.0, 4.0, 7.0, 12.0, 21.0, 28.0, 35.0, 57.0, 67.0, 86.0, 110.0, 125.0, 110.0, 99.0, 74.0, 56.0, 39.0, 30.0, 12.0, 10.0, 7.0, 7.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002193450927734375, -0.00021141767501831055, -0.0002034902572631836, -0.00019556283950805664, -0.0001876354217529297, -0.00017970800399780273, -0.00017178058624267578, -0.00016385316848754883, -0.00015592575073242188, -0.00014799833297729492, -0.00014007091522216797, -0.00013214349746704102, -0.00012421607971191406, -0.00011628866195678711, -0.00010836124420166016, -0.0001004338264465332, -9.250640869140625e-05, -8.45789909362793e-05, -7.665157318115234e-05, -6.872415542602539e-05, -6.079673767089844e-05, -5.2869319915771484e-05, -4.494190216064453e-05, -3.701448440551758e-05, -2.9087066650390625e-05, -2.1159648895263672e-05, -1.3232231140136719e-05, -5.304813385009766e-06, 2.6226043701171875e-06, 1.055002212524414e-05, 1.8477439880371094e-05, 2.6404857635498047e-05, 3.4332275390625e-05, 4.225969314575195e-05, 5.0187110900878906e-05, 5.811452865600586e-05, 6.604194641113281e-05, 7.396936416625977e-05, 8.189678192138672e-05, 8.982419967651367e-05, 9.775161743164062e-05, 0.00010567903518676758, 0.00011360645294189453, 0.00012153387069702148, 0.00012946128845214844, 0.0001373887062072754, 0.00014531612396240234, 0.0001532435417175293, 0.00016117095947265625, 0.0001690983772277832, 0.00017702579498291016, 0.0001849532127380371, 0.00019288063049316406, 0.00020080804824829102, 0.00020873546600341797, 0.00021666288375854492, 0.00022459030151367188, 0.00023251771926879883, 0.00024044513702392578, 0.00024837255477905273, 0.0002562999725341797, 0.00026422739028930664, 0.0002721548080444336, 0.00028008222579956055, 0.0002880096435546875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 8.0, 9.0, 11.0, 16.0, 31.0, 39.0, 73.0, 113.0, 195.0, 287.0, 619.0, 2068.0, 1042181.0, 1615.0, 552.0, 292.0, 177.0, 100.0, 71.0, 37.0, 16.0, 21.0, 13.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.004764556884765625, -0.0046176910400390625, -0.0044708251953125, -0.0043239593505859375, -0.004177093505859375, -0.0040302276611328125, -0.00388336181640625, -0.0037364959716796875, -0.003589630126953125, -0.0034427642822265625, -0.0032958984375, -0.0031490325927734375, -0.003002166748046875, -0.0028553009033203125, -0.00270843505859375, -0.0025615692138671875, -0.002414703369140625, -0.0022678375244140625, -0.0021209716796875, -0.0019741058349609375, -0.001827239990234375, -0.0016803741455078125, -0.00153350830078125, -0.0013866424560546875, -0.001239776611328125, -0.0010929107666015625, -0.000946044921875, -0.0007991790771484375, -0.000652313232421875, -0.0005054473876953125, -0.00035858154296875, -0.0002117156982421875, -6.4849853515625e-05, 8.20159912109375e-05, 0.0002288818359375, 0.0003757476806640625, 0.000522613525390625, 0.0006694793701171875, 0.00081634521484375, 0.0009632110595703125, 0.001110076904296875, 0.0012569427490234375, 0.00140380859375, 0.0015506744384765625, 0.001697540283203125, 0.0018444061279296875, 0.00199127197265625, 0.0021381378173828125, 0.002285003662109375, 0.0024318695068359375, 0.0025787353515625, 0.0027256011962890625, 0.002872467041015625, 0.0030193328857421875, 0.00316619873046875, 0.0033130645751953125, 0.003459930419921875, 0.0036067962646484375, 0.003753662109375, 0.0039005279541015625, 0.004047393798828125, 0.0041942596435546875, 0.00434112548828125, 0.0044879913330078125, 0.004634857177734375]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 16.0, 303.0, 585.0, 105.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00050628453027457, -0.0004960133810527623, -0.000485742260934785, -0.0004754711117129773, -0.00046519996249116957, -0.0004549288423731923, -0.0004446576931513846, -0.0004343865439295769, -0.00042411539470776916, -0.00041384424548596144, -0.0004035731253679842, -0.00039330197614617646, -0.00038303082692436874, -0.0003727597068063915, -0.00036248855758458376, -0.00035221740836277604, -0.0003419462882447988, -0.00033167513902299106, -0.0003214040189050138, -0.0003111328696832061, -0.00030086172046139836, -0.00029059057123959064, -0.0002803194511216134, -0.00027004830189980567, -0.0002597771817818284, -0.0002495060325600207, -0.0002392348978901282, -0.0002289637632202357, -0.000218692613998428, -0.0002084214793285355, -0.000198150344658643, -0.0001878791954368353, -0.00017760807531885803, -0.00016733694064896554, -0.00015706579142715782, -0.00014679465675726533, -0.0001365235075354576, -0.00012625237286556512, -0.00011598123819567263, -0.00010571009624982253, -9.543895430397242e-05, -8.516781235812232e-05, -7.489667041227221e-05, -6.462553574237972e-05, -5.435439379652962e-05, -4.408325185067952e-05, -3.381211718078703e-05, -2.3540975234936923e-05, -1.3269833289086819e-05, -2.998693162226118e-06, 7.272446964634582e-06, 1.754358527250588e-05, 2.7814727218355983e-05, 3.808586916420609e-05, 4.835700383409858e-05, 5.862814577994868e-05, 6.889928772579879e-05, 7.917042967164889e-05, 8.9441571617499e-05, 9.971270628739148e-05, 0.00010998384823324159, 0.00012025499017909169, 0.00013052612484898418, 0.00014079725951887667, 0.0001510684087406844]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 7.0, 3.0, 9.0, 8.0, 13.0, 19.0, 21.0, 16.0, 18.0, 19.0, 29.0, 37.0, 24.0, 35.0, 30.0, 53.0, 46.0, 35.0, 43.0, 42.0, 33.0, 40.0, 47.0, 52.0, 35.0, 40.0, 26.0, 26.0, 35.0, 30.0, 25.0, 21.0, 18.0, 12.0, 12.0, 7.0, 6.0, 11.0, 4.0, 8.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.325410842895508e-05, -7.086247205734253e-05, -6.847083568572998e-05, -6.607919931411743e-05, -6.368756294250488e-05, -6.129592657089233e-05, -5.8904290199279785e-05, -5.6512653827667236e-05, -5.412101745605469e-05, -5.172938108444214e-05, -4.933774471282959e-05, -4.694610834121704e-05, -4.455447196960449e-05, -4.216283559799194e-05, -3.9771199226379395e-05, -3.7379562854766846e-05, -3.49879264831543e-05, -3.259629011154175e-05, -3.02046537399292e-05, -2.781301736831665e-05, -2.54213809967041e-05, -2.3029744625091553e-05, -2.0638108253479004e-05, -1.8246471881866455e-05, -1.5854835510253906e-05, -1.3463199138641357e-05, -1.1071562767028809e-05, -8.67992639541626e-06, -6.288290023803711e-06, -3.896653652191162e-06, -1.5050172805786133e-06, 8.866190910339355e-07, 3.2782554626464844e-06, 5.669891834259033e-06, 8.061528205871582e-06, 1.0453164577484131e-05, 1.284480094909668e-05, 1.5236437320709229e-05, 1.7628073692321777e-05, 2.0019710063934326e-05, 2.2411346435546875e-05, 2.4802982807159424e-05, 2.7194619178771973e-05, 2.958625555038452e-05, 3.197789192199707e-05, 3.436952829360962e-05, 3.676116466522217e-05, 3.915280103683472e-05, 4.1544437408447266e-05, 4.3936073780059814e-05, 4.632771015167236e-05, 4.871934652328491e-05, 5.111098289489746e-05, 5.350261926651001e-05, 5.589425563812256e-05, 5.828589200973511e-05, 6.0677528381347656e-05, 6.30691647529602e-05, 6.546080112457275e-05, 6.78524374961853e-05, 7.024407386779785e-05, 7.26357102394104e-05, 7.502734661102295e-05, 7.74189829826355e-05, 7.981061935424805e-05]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 5.0, 3.0, 11.0, 5.0, 7.0, 10.0, 11.0, 6.0, 12.0, 18.0, 21.0, 13.0, 23.0, 20.0, 24.0, 29.0, 31.0, 27.0, 27.0, 33.0, 26.0, 34.0, 34.0, 44.0, 45.0, 47.0, 45.0, 32.0, 33.0, 23.0, 33.0, 25.0, 33.0, 25.0, 27.0, 22.0, 18.0, 24.0, 20.0, 11.0, 14.0, 10.0, 10.0, 12.0, 7.0, 3.0, 6.0, 4.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.06640625, -1.032379150390625, -0.99835205078125, -0.964324951171875, -0.9302978515625, -0.896270751953125, -0.86224365234375, -0.828216552734375, -0.794189453125, -0.760162353515625, -0.72613525390625, -0.692108154296875, -0.6580810546875, -0.624053955078125, -0.59002685546875, -0.555999755859375, -0.52197265625, -0.487945556640625, -0.45391845703125, -0.419891357421875, -0.3858642578125, -0.351837158203125, -0.31781005859375, -0.283782958984375, -0.249755859375, -0.215728759765625, -0.18170166015625, -0.147674560546875, -0.1136474609375, -0.079620361328125, -0.04559326171875, -0.011566162109375, 0.0224609375, 0.056488037109375, 0.09051513671875, 0.124542236328125, 0.1585693359375, 0.192596435546875, 0.22662353515625, 0.260650634765625, 0.294677734375, 0.328704833984375, 0.36273193359375, 0.396759033203125, 0.4307861328125, 0.464813232421875, 0.49884033203125, 0.532867431640625, 0.56689453125, 0.600921630859375, 0.63494873046875, 0.668975830078125, 0.7030029296875, 0.737030029296875, 0.77105712890625, 0.805084228515625, 0.839111328125, 0.873138427734375, 0.90716552734375, 0.941192626953125, 0.9752197265625, 1.009246826171875, 1.04327392578125, 1.077301025390625, 1.111328125]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 3.0, 5.0, 4.0, 9.0, 11.0, 21.0, 27.0, 37.0, 45.0, 73.0, 88.0, 110.0, 171.0, 270.0, 334.0, 519.0, 719.0, 1083.0, 1663.0, 2503.0, 4059.0, 7399.0, 17489.0, 70645.0, 506436.0, 354813.0, 48849.0, 14066.0, 6385.0, 3654.0, 2283.0, 1491.0, 957.0, 718.0, 507.0, 319.0, 196.0, 162.0, 125.0, 80.0, 74.0, 47.0, 29.0, 20.0, 13.0, 11.0, 10.0, 10.0, 6.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.953125, -4.79278564453125, -4.6324462890625, -4.47210693359375, -4.311767578125, -4.15142822265625, -3.9910888671875, -3.83074951171875, -3.67041015625, -3.51007080078125, -3.3497314453125, -3.18939208984375, -3.029052734375, -2.86871337890625, -2.7083740234375, -2.54803466796875, -2.3876953125, -2.22735595703125, -2.0670166015625, -1.90667724609375, -1.746337890625, -1.58599853515625, -1.4256591796875, -1.26531982421875, -1.10498046875, -0.94464111328125, -0.7843017578125, -0.62396240234375, -0.463623046875, -0.30328369140625, -0.1429443359375, 0.01739501953125, 0.177734375, 0.33807373046875, 0.4984130859375, 0.65875244140625, 0.819091796875, 0.97943115234375, 1.1397705078125, 1.30010986328125, 1.46044921875, 1.62078857421875, 1.7811279296875, 1.94146728515625, 2.101806640625, 2.26214599609375, 2.4224853515625, 2.58282470703125, 2.7431640625, 2.90350341796875, 3.0638427734375, 3.22418212890625, 3.384521484375, 3.54486083984375, 3.7052001953125, 3.86553955078125, 4.02587890625, 4.18621826171875, 4.3465576171875, 4.50689697265625, 4.667236328125, 4.82757568359375, 4.9879150390625, 5.14825439453125, 5.30859375]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 3.0, 0.0, 1.0, 5.0, 3.0, 6.0, 2.0, 3.0, 4.0, 11.0, 7.0, 8.0, 15.0, 13.0, 16.0, 18.0, 19.0, 20.0, 26.0, 18.0, 28.0, 24.0, 47.0, 38.0, 41.0, 68.0, 104.0, 239.0, 1374.0, 266.0, 128.0, 80.0, 39.0, 46.0, 37.0, 51.0, 27.0, 24.0, 31.0, 30.0, 29.0, 19.0, 13.0, 18.0, 15.0, 13.0, 9.0, 8.0, 3.0, 0.0, 6.0, 4.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0], "bins": [-3.6875, -3.580596923828125, -3.47369384765625, -3.366790771484375, -3.2598876953125, -3.152984619140625, -3.04608154296875, -2.939178466796875, -2.832275390625, -2.725372314453125, -2.61846923828125, -2.511566162109375, -2.4046630859375, -2.297760009765625, -2.19085693359375, -2.083953857421875, -1.97705078125, -1.870147705078125, -1.76324462890625, -1.656341552734375, -1.5494384765625, -1.442535400390625, -1.33563232421875, -1.228729248046875, -1.121826171875, -1.014923095703125, -0.90802001953125, -0.801116943359375, -0.6942138671875, -0.587310791015625, -0.48040771484375, -0.373504638671875, -0.2666015625, -0.159698486328125, -0.05279541015625, 0.054107666015625, 0.1610107421875, 0.267913818359375, 0.37481689453125, 0.481719970703125, 0.588623046875, 0.695526123046875, 0.80242919921875, 0.909332275390625, 1.0162353515625, 1.123138427734375, 1.23004150390625, 1.336944580078125, 1.44384765625, 1.550750732421875, 1.65765380859375, 1.764556884765625, 1.8714599609375, 1.978363037109375, 2.08526611328125, 2.192169189453125, 2.299072265625, 2.405975341796875, 2.51287841796875, 2.619781494140625, 2.7266845703125, 2.833587646484375, 2.94049072265625, 3.047393798828125, 3.154296875]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 5.0, 4.0, 6.0, 8.0, 8.0, 12.0, 11.0, 13.0, 18.0, 26.0, 18.0, 34.0, 35.0, 39.0, 59.0, 87.0, 118.0, 233.0, 451.0, 1447.0, 31931.0, 3073544.0, 35047.0, 1408.0, 469.0, 224.0, 127.0, 66.0, 54.0, 28.0, 27.0, 27.0, 20.0, 26.0, 14.0, 10.0, 8.0, 9.0, 8.0, 7.0, 4.0, 2.0, 4.0, 8.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.515625, -12.07666015625, -11.6376953125, -11.19873046875, -10.759765625, -10.32080078125, -9.8818359375, -9.44287109375, -9.00390625, -8.56494140625, -8.1259765625, -7.68701171875, -7.248046875, -6.80908203125, -6.3701171875, -5.93115234375, -5.4921875, -5.05322265625, -4.6142578125, -4.17529296875, -3.736328125, -3.29736328125, -2.8583984375, -2.41943359375, -1.98046875, -1.54150390625, -1.1025390625, -0.66357421875, -0.224609375, 0.21435546875, 0.6533203125, 1.09228515625, 1.53125, 1.97021484375, 2.4091796875, 2.84814453125, 3.287109375, 3.72607421875, 4.1650390625, 4.60400390625, 5.04296875, 5.48193359375, 5.9208984375, 6.35986328125, 6.798828125, 7.23779296875, 7.6767578125, 8.11572265625, 8.5546875, 8.99365234375, 9.4326171875, 9.87158203125, 10.310546875, 10.74951171875, 11.1884765625, 11.62744140625, 12.06640625, 12.50537109375, 12.9443359375, 13.38330078125, 13.822265625, 14.26123046875, 14.7001953125, 15.13916015625, 15.578125]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 960.0, 56.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.90650177001953, -50.222145080566406, -44.53778839111328, -38.853431701660156, -33.16907501220703, -27.48472023010254, -21.800365447998047, -16.116008758544922, -10.431652069091797, -4.74729585647583, 0.9370603561401367, 6.621416091918945, 12.30577278137207, 17.990129470825195, 23.674484252929688, 29.358840942382812, 35.04319763183594, 40.72755432128906, 46.41191101074219, 52.09626770019531, 57.78062438964844, 63.46498107910156, 69.14933776855469, 74.83369445800781, 80.51805114746094, 86.20240783691406, 91.88676452636719, 97.57112121582031, 103.25547790527344, 108.93983459472656, 114.62419128417969, 120.30854797363281, 125.99290466308594, 131.67726135253906, 137.3616180419922, 143.0459747314453, 148.73033142089844, 154.41468811035156, 160.0990447998047, 165.7834014892578, 171.46775817871094, 177.15211486816406, 182.8364715576172, 188.5208282470703, 194.20518493652344, 199.88954162597656, 205.5738983154297, 211.2582550048828, 216.94259643554688, 222.626953125, 228.31130981445312, 233.99566650390625, 239.68002319335938, 245.3643798828125, 251.04873657226562, 256.73309326171875, 262.4174499511719, 268.101806640625, 273.7861633300781, 279.47052001953125, 285.1548767089844, 290.8392333984375, 296.5235900878906, 302.20794677734375, 307.8923034667969]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 0.0, 3.0, 5.0, 6.0, 8.0, 9.0, 3.0, 4.0, 16.0, 16.0, 9.0, 23.0, 25.0, 15.0, 32.0, 31.0, 39.0, 36.0, 38.0, 23.0, 49.0, 56.0, 42.0, 45.0, 47.0, 28.0, 32.0, 42.0, 41.0, 33.0, 35.0, 29.0, 22.0, 25.0, 11.0, 23.0, 18.0, 8.0, 24.0, 13.0, 8.0, 13.0, 2.0, 5.0, 8.0, 5.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.243245124816895, -10.839468955993652, -10.43569278717041, -10.031916618347168, -9.628141403198242, -9.224365234375, -8.820589065551758, -8.416812896728516, -8.013036727905273, -7.609260559082031, -7.205484390258789, -6.801708698272705, -6.397932529449463, -5.994156360626221, -5.590380668640137, -5.1866044998168945, -4.782828330993652, -4.37905216217041, -3.975276231765747, -3.571500301361084, -3.167724132537842, -2.7639479637145996, -2.3601720333099365, -1.9563961029052734, -1.5526199340820312, -1.1488438844680786, -0.745067834854126, -0.34129178524017334, 0.0624842643737793, 0.4662604331970215, 0.8700363636016846, 1.2738122940063477, 1.6775875091552734, 2.0813636779785156, 2.4851396083831787, 2.888915538787842, 3.292691707611084, 3.696467876434326, 4.10024356842041, 4.504019737243652, 4.9077959060668945, 5.311572074890137, 5.715348243713379, 6.119123935699463, 6.522900104522705, 6.926676273345947, 7.330451965332031, 7.734228134155273, 8.138004302978516, 8.541780471801758, 8.945556640625, 9.349332809448242, 9.753108978271484, 10.156885147094727, 10.560660362243652, 10.964436531066895, 11.368212699890137, 11.771988868713379, 12.175765037536621, 12.579541206359863, 12.983316421508789, 13.387092590332031, 13.790868759155273, 14.194644927978516, 14.598421096801758]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 6.0, 4.0, 15.0, 6.0, 12.0, 14.0, 8.0, 18.0, 16.0, 19.0, 20.0, 26.0, 32.0, 22.0, 24.0, 29.0, 27.0, 25.0, 24.0, 41.0, 44.0, 48.0, 39.0, 45.0, 34.0, 43.0, 26.0, 28.0, 34.0, 26.0, 29.0, 22.0, 30.0, 30.0, 21.0, 18.0, 9.0, 14.0, 15.0, 20.0, 10.0, 7.0, 6.0, 6.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-1.2529296875, -1.21636962890625, -1.1798095703125, -1.14324951171875, -1.106689453125, -1.07012939453125, -1.0335693359375, -0.99700927734375, -0.96044921875, -0.92388916015625, -0.8873291015625, -0.85076904296875, -0.814208984375, -0.77764892578125, -0.7410888671875, -0.70452880859375, -0.66796875, -0.63140869140625, -0.5948486328125, -0.55828857421875, -0.521728515625, -0.48516845703125, -0.4486083984375, -0.41204833984375, -0.37548828125, -0.33892822265625, -0.3023681640625, -0.26580810546875, -0.229248046875, -0.19268798828125, -0.1561279296875, -0.11956787109375, -0.0830078125, -0.04644775390625, -0.0098876953125, 0.02667236328125, 0.063232421875, 0.09979248046875, 0.1363525390625, 0.17291259765625, 0.20947265625, 0.24603271484375, 0.2825927734375, 0.31915283203125, 0.355712890625, 0.39227294921875, 0.4288330078125, 0.46539306640625, 0.501953125, 0.53851318359375, 0.5750732421875, 0.61163330078125, 0.648193359375, 0.68475341796875, 0.7213134765625, 0.75787353515625, 0.79443359375, 0.83099365234375, 0.8675537109375, 0.90411376953125, 0.940673828125, 0.97723388671875, 1.0137939453125, 1.05035400390625, 1.0869140625]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 8.0, 6.0, 15.0, 9.0, 24.0, 30.0, 36.0, 52.0, 57.0, 83.0, 103.0, 152.0, 242.0, 359.0, 511.0, 827.0, 1439.0, 2827.0, 6366.0, 17360.0, 66136.0, 514416.0, 2859697.0, 617148.0, 73559.0, 18923.0, 6806.0, 3008.0, 1502.0, 908.0, 507.0, 353.0, 229.0, 174.0, 109.0, 74.0, 63.0, 42.0, 35.0, 24.0, 12.0, 17.0, 11.0, 10.0, 5.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-5.0390625, -4.8887939453125, -4.738525390625, -4.5882568359375, -4.43798828125, -4.2877197265625, -4.137451171875, -3.9871826171875, -3.8369140625, -3.6866455078125, -3.536376953125, -3.3861083984375, -3.23583984375, -3.0855712890625, -2.935302734375, -2.7850341796875, -2.634765625, -2.4844970703125, -2.334228515625, -2.1839599609375, -2.03369140625, -1.8834228515625, -1.733154296875, -1.5828857421875, -1.4326171875, -1.2823486328125, -1.132080078125, -0.9818115234375, -0.83154296875, -0.6812744140625, -0.531005859375, -0.3807373046875, -0.23046875, -0.0802001953125, 0.070068359375, 0.2203369140625, 0.37060546875, 0.5208740234375, 0.671142578125, 0.8214111328125, 0.9716796875, 1.1219482421875, 1.272216796875, 1.4224853515625, 1.57275390625, 1.7230224609375, 1.873291015625, 2.0235595703125, 2.173828125, 2.3240966796875, 2.474365234375, 2.6246337890625, 2.77490234375, 2.9251708984375, 3.075439453125, 3.2257080078125, 3.3759765625, 3.5262451171875, 3.676513671875, 3.8267822265625, 3.97705078125, 4.1273193359375, 4.277587890625, 4.4278564453125, 4.578125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 10.0, 3.0, 18.0, 17.0, 46.0, 78.0, 125.0, 169.0, 311.0, 493.0, 590.0, 711.0, 511.0, 339.0, 231.0, 157.0, 112.0, 64.0, 33.0, 21.0, 22.0, 6.0, 4.0, 3.0, 7.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.078125, -8.86236572265625, -8.6466064453125, -8.43084716796875, -8.215087890625, -7.99932861328125, -7.7835693359375, -7.56781005859375, -7.35205078125, -7.13629150390625, -6.9205322265625, -6.70477294921875, -6.489013671875, -6.27325439453125, -6.0574951171875, -5.84173583984375, -5.6259765625, -5.41021728515625, -5.1944580078125, -4.97869873046875, -4.762939453125, -4.54718017578125, -4.3314208984375, -4.11566162109375, -3.89990234375, -3.68414306640625, -3.4683837890625, -3.25262451171875, -3.036865234375, -2.82110595703125, -2.6053466796875, -2.38958740234375, -2.173828125, -1.95806884765625, -1.7423095703125, -1.52655029296875, -1.310791015625, -1.09503173828125, -0.8792724609375, -0.66351318359375, -0.44775390625, -0.23199462890625, -0.0162353515625, 0.19952392578125, 0.415283203125, 0.63104248046875, 0.8468017578125, 1.06256103515625, 1.2783203125, 1.49407958984375, 1.7098388671875, 1.92559814453125, 2.141357421875, 2.35711669921875, 2.5728759765625, 2.78863525390625, 3.00439453125, 3.22015380859375, 3.4359130859375, 3.65167236328125, 3.867431640625, 4.08319091796875, 4.2989501953125, 4.51470947265625, 4.73046875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [5.0, 4.0, 12.0, 13.0, 10.0, 25.0, 56.0, 73.0, 113.0, 192.0, 535.0, 2456.0, 449861.0, 3734267.0, 5573.0, 676.0, 218.0, 99.0, 53.0, 19.0, 20.0, 8.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.5625, -10.68359375, -9.8046875, -8.92578125, -8.046875, -7.16796875, -6.2890625, -5.41015625, -4.53125, -3.65234375, -2.7734375, -1.89453125, -1.015625, -0.13671875, 0.7421875, 1.62109375, 2.5, 3.37890625, 4.2578125, 5.13671875, 6.015625, 6.89453125, 7.7734375, 8.65234375, 9.53125, 10.41015625, 11.2890625, 12.16796875, 13.046875, 13.92578125, 14.8046875, 15.68359375, 16.5625, 17.44140625, 18.3203125, 19.19921875, 20.078125, 20.95703125, 21.8359375, 22.71484375, 23.59375, 24.47265625, 25.3515625, 26.23046875, 27.109375, 27.98828125, 28.8671875, 29.74609375, 30.625, 31.50390625, 32.3828125, 33.26171875, 34.140625, 35.01953125, 35.8984375, 36.77734375, 37.65625, 38.53515625, 39.4140625, 40.29296875, 41.171875, 42.05078125, 42.9296875, 43.80859375, 44.6875]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 770.0, 245.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.78044128417969, -51.89575958251953, -46.01108169555664, -40.12640380859375, -34.241722106933594, -28.35704231262207, -22.472362518310547, -16.587684631347656, -10.7030029296875, -4.818323135375977, 1.0663566589355469, 6.95103645324707, 12.835716247558594, 18.720396041870117, 24.60507583618164, 30.48975372314453, 36.37443542480469, 42.259117126464844, 48.143795013427734, 54.028472900390625, 59.91315460205078, 65.79783630371094, 71.68251037597656, 77.56719207763672, 83.45187377929688, 89.33655548095703, 95.22123718261719, 101.10591125488281, 106.99059295654297, 112.87527465820312, 118.75994873046875, 124.6446304321289, 130.529296875, 136.41397094726562, 142.2986602783203, 148.18333435058594, 154.06802368164062, 159.95269775390625, 165.83737182617188, 171.7220458984375, 177.6067352294922, 183.4914093017578, 189.3760986328125, 195.26077270507812, 201.14544677734375, 207.03013610839844, 212.91481018066406, 218.79949951171875, 224.68417358398438, 230.56884765625, 236.4535369873047, 242.3382110595703, 248.222900390625, 254.10757446289062, 259.99224853515625, 265.8769226074219, 271.7615966796875, 277.6462707519531, 283.53094482421875, 289.4156494140625, 295.3003234863281, 301.18499755859375, 307.0696716308594, 312.954345703125, 318.83905029296875]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 7.0, 7.0, 7.0, 16.0, 8.0, 15.0, 19.0, 24.0, 19.0, 23.0, 30.0, 34.0, 32.0, 36.0, 44.0, 37.0, 35.0, 48.0, 48.0, 43.0, 51.0, 43.0, 48.0, 50.0, 34.0, 39.0, 32.0, 29.0, 35.0, 20.0, 10.0, 19.0, 13.0, 9.0, 9.0, 8.0, 8.0, 7.0, 6.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-23.02631378173828, -22.363508224487305, -21.700700759887695, -21.03789520263672, -20.37508773803711, -19.712282180786133, -19.049474716186523, -18.386669158935547, -17.723861694335938, -17.06105613708496, -16.39824867248535, -15.735442161560059, -15.072635650634766, -14.409830093383789, -13.747023582458496, -13.084217071533203, -12.421411514282227, -11.758605003356934, -11.09579849243164, -10.432991981506348, -9.770185470581055, -9.107379913330078, -8.444573402404785, -7.781766891479492, -7.118960380554199, -6.456153869628906, -5.793347358703613, -5.1305413246154785, -4.4677348136901855, -3.8049283027648926, -3.1421220302581787, -2.479315757751465, -1.8165092468261719, -1.1537028551101685, -0.49089646339416504, 0.17190992832183838, 0.8347163200378418, 1.4975228309631348, 2.1603291034698486, 2.8231353759765625, 3.4859418869018555, 4.148748397827148, 4.811554908752441, 5.474360942840576, 6.137167453765869, 6.799973964691162, 7.462779998779297, 8.12558650970459, 8.788393020629883, 9.451199531555176, 10.114006042480469, 10.776812553405762, 11.439619064331055, 12.102424621582031, 12.765231132507324, 13.428037643432617, 14.09084415435791, 14.753650665283203, 15.416457176208496, 16.07926368713379, 16.742069244384766, 17.404876708984375, 18.06768226623535, 18.730487823486328, 19.393295288085938]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 5.0, 6.0, 5.0, 9.0, 10.0, 9.0, 8.0, 15.0, 19.0, 15.0, 26.0, 24.0, 29.0, 25.0, 26.0, 24.0, 31.0, 39.0, 38.0, 33.0, 36.0, 37.0, 43.0, 47.0, 37.0, 36.0, 32.0, 37.0, 38.0, 29.0, 24.0, 29.0, 26.0, 19.0, 25.0, 24.0, 26.0, 10.0, 11.0, 7.0, 11.0, 9.0, 4.0, 7.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0], "bins": [-1.3779296875, -1.339202880859375, -1.30047607421875, -1.261749267578125, -1.2230224609375, -1.184295654296875, -1.14556884765625, -1.106842041015625, -1.068115234375, -1.029388427734375, -0.99066162109375, -0.951934814453125, -0.9132080078125, -0.874481201171875, -0.83575439453125, -0.797027587890625, -0.75830078125, -0.719573974609375, -0.68084716796875, -0.642120361328125, -0.6033935546875, -0.564666748046875, -0.52593994140625, -0.487213134765625, -0.448486328125, -0.409759521484375, -0.37103271484375, -0.332305908203125, -0.2935791015625, -0.254852294921875, -0.21612548828125, -0.177398681640625, -0.138671875, -0.099945068359375, -0.06121826171875, -0.022491455078125, 0.0162353515625, 0.054962158203125, 0.09368896484375, 0.132415771484375, 0.171142578125, 0.209869384765625, 0.24859619140625, 0.287322998046875, 0.3260498046875, 0.364776611328125, 0.40350341796875, 0.442230224609375, 0.48095703125, 0.519683837890625, 0.55841064453125, 0.597137451171875, 0.6358642578125, 0.674591064453125, 0.71331787109375, 0.752044677734375, 0.790771484375, 0.829498291015625, 0.86822509765625, 0.906951904296875, 0.9456787109375, 0.984405517578125, 1.02313232421875, 1.061859130859375, 1.1005859375]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 12.0, 17.0, 24.0, 24.0, 39.0, 52.0, 80.0, 112.0, 193.0, 282.0, 465.0, 691.0, 1142.0, 1924.0, 3093.0, 5257.0, 8927.0, 15091.0, 25303.0, 42881.0, 74932.0, 145783.0, 314831.0, 189454.0, 91957.0, 51160.0, 30220.0, 18036.0, 10646.0, 6194.0, 3791.0, 2289.0, 1371.0, 814.0, 464.0, 333.0, 219.0, 155.0, 98.0, 73.0, 44.0, 28.0, 20.0, 10.0, 9.0, 5.0, 4.0, 1.0, 4.0, 5.0, 3.0, 1.0], "bins": [-0.28564453125, -0.27740478515625, -0.2691650390625, -0.26092529296875, -0.252685546875, -0.24444580078125, -0.2362060546875, -0.22796630859375, -0.2197265625, -0.21148681640625, -0.2032470703125, -0.19500732421875, -0.186767578125, -0.17852783203125, -0.1702880859375, -0.16204833984375, -0.15380859375, -0.14556884765625, -0.1373291015625, -0.12908935546875, -0.120849609375, -0.11260986328125, -0.1043701171875, -0.09613037109375, -0.087890625, -0.07965087890625, -0.0714111328125, -0.06317138671875, -0.054931640625, -0.04669189453125, -0.0384521484375, -0.03021240234375, -0.02197265625, -0.01373291015625, -0.0054931640625, 0.00274658203125, 0.010986328125, 0.01922607421875, 0.0274658203125, 0.03570556640625, 0.0439453125, 0.05218505859375, 0.0604248046875, 0.06866455078125, 0.076904296875, 0.08514404296875, 0.0933837890625, 0.10162353515625, 0.10986328125, 0.11810302734375, 0.1263427734375, 0.13458251953125, 0.142822265625, 0.15106201171875, 0.1593017578125, 0.16754150390625, 0.17578125, 0.18402099609375, 0.1922607421875, 0.20050048828125, 0.208740234375, 0.21697998046875, 0.2252197265625, 0.23345947265625, 0.24169921875]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 7.0, 3.0, 6.0, 12.0, 12.0, 14.0, 22.0, 12.0, 22.0, 22.0, 33.0, 31.0, 35.0, 44.0, 35.0, 43.0, 38.0, 46.0, 46.0, 1063.0, 47.0, 40.0, 48.0, 38.0, 36.0, 38.0, 24.0, 21.0, 31.0, 33.0, 24.0, 23.0, 13.0, 18.0, 7.0, 8.0, 7.0, 6.0, 4.0, 6.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.830078125, -0.8025436401367188, -0.7750091552734375, -0.7474746704101562, -0.719940185546875, -0.6924057006835938, -0.6648712158203125, -0.6373367309570312, -0.60980224609375, -0.5822677612304688, -0.5547332763671875, -0.5271987915039062, -0.499664306640625, -0.47212982177734375, -0.4445953369140625, -0.41706085205078125, -0.3895263671875, -0.36199188232421875, -0.3344573974609375, -0.30692291259765625, -0.279388427734375, -0.25185394287109375, -0.2243194580078125, -0.19678497314453125, -0.16925048828125, -0.14171600341796875, -0.1141815185546875, -0.08664703369140625, -0.059112548828125, -0.03157806396484375, -0.0040435791015625, 0.02349090576171875, 0.051025390625, 0.07855987548828125, 0.1060943603515625, 0.13362884521484375, 0.161163330078125, 0.18869781494140625, 0.2162322998046875, 0.24376678466796875, 0.27130126953125, 0.29883575439453125, 0.3263702392578125, 0.35390472412109375, 0.381439208984375, 0.40897369384765625, 0.4365081787109375, 0.46404266357421875, 0.4915771484375, 0.5191116333007812, 0.5466461181640625, 0.5741806030273438, 0.601715087890625, 0.6292495727539062, 0.6567840576171875, 0.6843185424804688, 0.71185302734375, 0.7393875122070312, 0.7669219970703125, 0.7944564819335938, 0.821990966796875, 0.8495254516601562, 0.8770599365234375, 0.9045944213867188, 0.93212890625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 3.0, 5.0, 10.0, 12.0, 14.0, 27.0, 36.0, 58.0, 71.0, 109.0, 165.0, 246.0, 347.0, 516.0, 717.0, 1119.0, 1657.0, 2609.0, 3925.0, 6104.0, 9618.0, 15148.0, 24681.0, 41662.0, 73662.0, 147079.0, 1361971.0, 189366.0, 89605.0, 49602.0, 28669.0, 17219.0, 10838.0, 7004.0, 4461.0, 2947.0, 1915.0, 1246.0, 875.0, 585.0, 381.0, 270.0, 187.0, 135.0, 91.0, 48.0, 44.0, 27.0, 26.0, 12.0, 5.0, 5.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.23046875, -0.22294998168945312, -0.21543121337890625, -0.20791244506835938, -0.2003936767578125, -0.19287490844726562, -0.18535614013671875, -0.17783737182617188, -0.170318603515625, -0.16279983520507812, -0.15528106689453125, -0.14776229858398438, -0.1402435302734375, -0.13272476196289062, -0.12520599365234375, -0.11768722534179688, -0.11016845703125, -0.10264968872070312, -0.09513092041015625, -0.08761215209960938, -0.0800933837890625, -0.07257461547851562, -0.06505584716796875, -0.057537078857421875, -0.050018310546875, -0.042499542236328125, -0.03498077392578125, -0.027462005615234375, -0.0199432373046875, -0.012424468994140625, -0.00490570068359375, 0.002613067626953125, 0.0101318359375, 0.017650604248046875, 0.02516937255859375, 0.032688140869140625, 0.0402069091796875, 0.047725677490234375, 0.05524444580078125, 0.06276321411132812, 0.070281982421875, 0.07780075073242188, 0.08531951904296875, 0.09283828735351562, 0.1003570556640625, 0.10787582397460938, 0.11539459228515625, 0.12291336059570312, 0.13043212890625, 0.13795089721679688, 0.14546966552734375, 0.15298843383789062, 0.1605072021484375, 0.16802597045898438, 0.17554473876953125, 0.18306350708007812, 0.190582275390625, 0.19810104370117188, 0.20561981201171875, 0.21313858032226562, 0.2206573486328125, 0.22817611694335938, 0.23569488525390625, 0.24321365356445312, 0.250732421875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 6.0, 2.0, 3.0, 4.0, 2.0, 8.0, 11.0, 17.0, 10.0, 13.0, 19.0, 21.0, 27.0, 24.0, 40.0, 35.0, 39.0, 32.0, 34.0, 42.0, 50.0, 43.0, 40.0, 50.0, 46.0, 50.0, 42.0, 42.0, 37.0, 26.0, 23.0, 29.0, 24.0, 18.0, 13.0, 13.0, 15.0, 13.0, 11.0, 7.0, 5.0, 1.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-9.79304313659668e-05, -9.470432996749878e-05, -9.147822856903076e-05, -8.825212717056274e-05, -8.502602577209473e-05, -8.179992437362671e-05, -7.857382297515869e-05, -7.534772157669067e-05, -7.212162017822266e-05, -6.889551877975464e-05, -6.566941738128662e-05, -6.24433159828186e-05, -5.9217214584350586e-05, -5.599111318588257e-05, -5.276501178741455e-05, -4.953891038894653e-05, -4.6312808990478516e-05, -4.30867075920105e-05, -3.986060619354248e-05, -3.663450479507446e-05, -3.3408403396606445e-05, -3.0182301998138428e-05, -2.695620059967041e-05, -2.3730099201202393e-05, -2.0503997802734375e-05, -1.7277896404266357e-05, -1.405179500579834e-05, -1.0825693607330322e-05, -7.599592208862305e-06, -4.373490810394287e-06, -1.1473894119262695e-06, 2.078711986541748e-06, 5.304813385009766e-06, 8.530914783477783e-06, 1.17570161819458e-05, 1.4983117580413818e-05, 1.8209218978881836e-05, 2.1435320377349854e-05, 2.466142177581787e-05, 2.788752317428589e-05, 3.1113624572753906e-05, 3.4339725971221924e-05, 3.756582736968994e-05, 4.079192876815796e-05, 4.4018030166625977e-05, 4.7244131565093994e-05, 5.047023296356201e-05, 5.369633436203003e-05, 5.692243576049805e-05, 6.0148537158966064e-05, 6.337463855743408e-05, 6.66007399559021e-05, 6.982684135437012e-05, 7.305294275283813e-05, 7.627904415130615e-05, 7.950514554977417e-05, 8.273124694824219e-05, 8.59573483467102e-05, 8.918344974517822e-05, 9.240955114364624e-05, 9.563565254211426e-05, 9.886175394058228e-05, 0.00010208785533905029, 0.00010531395673751831, 0.00010854005813598633]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 8.0, 5.0, 10.0, 10.0, 14.0, 12.0, 20.0, 25.0, 26.0, 44.0, 58.0, 63.0, 74.0, 83.0, 118.0, 126.0, 157.0, 226.0, 332.0, 527.0, 1289.0, 217665.0, 823049.0, 2369.0, 642.0, 440.0, 254.0, 193.0, 135.0, 109.0, 89.0, 80.0, 63.0, 45.0, 38.0, 22.0, 27.0, 17.0, 22.0, 17.0, 12.0, 10.0, 14.0, 4.0, 8.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0], "bins": [-0.0021381378173828125, -0.002075508236885071, -0.002012878656387329, -0.0019502490758895874, -0.0018876194953918457, -0.001824989914894104, -0.0017623603343963623, -0.0016997307538986206, -0.001637101173400879, -0.0015744715929031372, -0.0015118420124053955, -0.0014492124319076538, -0.0013865828514099121, -0.0013239532709121704, -0.0012613236904144287, -0.001198694109916687, -0.0011360645294189453, -0.0010734349489212036, -0.001010805368423462, -0.0009481757879257202, -0.0008855462074279785, -0.0008229166269302368, -0.0007602870464324951, -0.0006976574659347534, -0.0006350278854370117, -0.00057239830493927, -0.0005097687244415283, -0.0004471391439437866, -0.0003845095634460449, -0.0003218799829483032, -0.0002592504024505615, -0.00019662082195281982, -0.00013399124145507812, -7.136166095733643e-05, -8.732080459594727e-06, 5.389750003814697e-05, 0.00011652708053588867, 0.00017915666103363037, 0.00024178624153137207, 0.00030441582202911377, 0.00036704540252685547, 0.00042967498302459717, 0.0004923045635223389, 0.0005549341440200806, 0.0006175637245178223, 0.000680193305015564, 0.0007428228855133057, 0.0008054524660110474, 0.0008680820465087891, 0.0009307116270065308, 0.0009933412075042725, 0.0010559707880020142, 0.0011186003684997559, 0.0011812299489974976, 0.0012438595294952393, 0.001306489109992981, 0.0013691186904907227, 0.0014317482709884644, 0.001494377851486206, 0.0015570074319839478, 0.0016196370124816895, 0.0016822665929794312, 0.0017448961734771729, 0.0018075257539749146, 0.0018701553344726562]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 24.0, 106.0, 240.0, 321.0, 211.0, 81.0, 25.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000263611989794299, -0.0002574029203969985, -0.0002511938218958676, -0.0002449847524985671, -0.0002387756685493514, -0.00023256658460013568, -0.00022635750065091997, -0.00022014841670170426, -0.00021393934730440378, -0.00020773026335518807, -0.00020152117940597236, -0.00019531211000867188, -0.00018910302605945617, -0.00018289394211024046, -0.00017668485816102475, -0.00017047577421180904, -0.00016426670481450856, -0.00015805762086529285, -0.00015184853691607714, -0.00014563946751877666, -0.00013943038356956095, -0.00013322129962034523, -0.00012701221567112952, -0.00012080313899787143, -0.0001145940477726981, -0.0001083849638234824, -0.0001021758871502243, -9.596680320100859e-05, -8.975772652775049e-05, -8.354864257853478e-05, -7.733955862931907e-05, -7.113048195606098e-05, -6.492140528280288e-05, -5.871232497156598e-05, -5.2503244660329074e-05, -4.6294160711113364e-05, -4.008508403785527e-05, -3.387600008863956e-05, -2.7666919777402654e-05, -2.145783946616575e-05, -1.5248759154928848e-05, -9.039678843691945e-06, -2.8305976229603402e-06, 3.3784835977712646e-06, 9.587563909008168e-06, 1.5796646039234474e-05, 2.2005726350471377e-05, 2.821480666170828e-05, 3.4423886972945184e-05, 4.0632967284182087e-05, 4.684204759541899e-05, 5.30511315446347e-05, 5.9260208217892796e-05, 6.54692921671085e-05, 7.16783688403666e-05, 7.788745278958231e-05, 8.409653673879802e-05, 9.030562068801373e-05, 9.651469736127183e-05, 0.00010272378131048754, 0.00010893285798374563, 0.00011514194193296134, 0.00012135102588217705, 0.00012756010983139277, 0.00013376917922869325]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 6.0, 7.0, 5.0, 7.0, 11.0, 16.0, 10.0, 15.0, 15.0, 18.0, 29.0, 30.0, 29.0, 26.0, 29.0, 36.0, 22.0, 56.0, 41.0, 40.0, 39.0, 47.0, 40.0, 49.0, 31.0, 29.0, 37.0, 29.0, 33.0, 35.0, 32.0, 24.0, 22.0, 18.0, 14.0, 21.0, 12.0, 9.0, 12.0, 7.0, 4.0, 3.0, 3.0, 1.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.598234176635742e-05, -6.400793790817261e-05, -6.203353404998779e-05, -6.005913019180298e-05, -5.8084726333618164e-05, -5.611032247543335e-05, -5.4135918617248535e-05, -5.216151475906372e-05, -5.0187110900878906e-05, -4.821270704269409e-05, -4.623830318450928e-05, -4.426389932632446e-05, -4.228949546813965e-05, -4.0315091609954834e-05, -3.834068775177002e-05, -3.6366283893585205e-05, -3.439188003540039e-05, -3.2417476177215576e-05, -3.0443072319030762e-05, -2.8468668460845947e-05, -2.6494264602661133e-05, -2.451986074447632e-05, -2.2545456886291504e-05, -2.057105302810669e-05, -1.8596649169921875e-05, -1.662224531173706e-05, -1.4647841453552246e-05, -1.2673437595367432e-05, -1.0699033737182617e-05, -8.724629878997803e-06, -6.750226020812988e-06, -4.775822162628174e-06, -2.8014183044433594e-06, -8.270144462585449e-07, 1.1473894119262695e-06, 3.121793270111084e-06, 5.0961971282958984e-06, 7.070600986480713e-06, 9.045004844665527e-06, 1.1019408702850342e-05, 1.2993812561035156e-05, 1.496821641921997e-05, 1.6942620277404785e-05, 1.89170241355896e-05, 2.0891427993774414e-05, 2.286583185195923e-05, 2.4840235710144043e-05, 2.6814639568328857e-05, 2.8789043426513672e-05, 3.0763447284698486e-05, 3.27378511428833e-05, 3.4712255001068115e-05, 3.668665885925293e-05, 3.8661062717437744e-05, 4.063546657562256e-05, 4.260987043380737e-05, 4.458427429199219e-05, 4.6558678150177e-05, 4.8533082008361816e-05, 5.050748586654663e-05, 5.2481889724731445e-05, 5.445629358291626e-05, 5.6430697441101074e-05, 5.840510129928589e-05, 6.03795051574707e-05]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 5.0, 6.0, 5.0, 9.0, 10.0, 9.0, 8.0, 15.0, 19.0, 15.0, 26.0, 24.0, 29.0, 25.0, 26.0, 24.0, 31.0, 39.0, 38.0, 33.0, 36.0, 37.0, 43.0, 47.0, 37.0, 36.0, 32.0, 37.0, 38.0, 29.0, 24.0, 29.0, 26.0, 19.0, 25.0, 24.0, 26.0, 10.0, 11.0, 7.0, 11.0, 9.0, 4.0, 7.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0], "bins": [-1.3779296875, -1.339202880859375, -1.30047607421875, -1.261749267578125, -1.2230224609375, -1.184295654296875, -1.14556884765625, -1.106842041015625, -1.068115234375, -1.029388427734375, -0.99066162109375, -0.951934814453125, -0.9132080078125, -0.874481201171875, -0.83575439453125, -0.797027587890625, -0.75830078125, -0.719573974609375, -0.68084716796875, -0.642120361328125, -0.6033935546875, -0.564666748046875, -0.52593994140625, -0.487213134765625, -0.448486328125, -0.409759521484375, -0.37103271484375, -0.332305908203125, -0.2935791015625, -0.254852294921875, -0.21612548828125, -0.177398681640625, -0.138671875, -0.099945068359375, -0.06121826171875, -0.022491455078125, 0.0162353515625, 0.054962158203125, 0.09368896484375, 0.132415771484375, 0.171142578125, 0.209869384765625, 0.24859619140625, 0.287322998046875, 0.3260498046875, 0.364776611328125, 0.40350341796875, 0.442230224609375, 0.48095703125, 0.519683837890625, 0.55841064453125, 0.597137451171875, 0.6358642578125, 0.674591064453125, 0.71331787109375, 0.752044677734375, 0.790771484375, 0.829498291015625, 0.86822509765625, 0.906951904296875, 0.9456787109375, 0.984405517578125, 1.02313232421875, 1.061859130859375, 1.1005859375]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 8.0, 11.0, 9.0, 17.0, 16.0, 23.0, 40.0, 61.0, 67.0, 112.0, 136.0, 203.0, 297.0, 405.0, 708.0, 1196.0, 2100.0, 4135.0, 8320.0, 18818.0, 45157.0, 109850.0, 233362.0, 300918.0, 182887.0, 79674.0, 32335.0, 13680.0, 6383.0, 3213.0, 1673.0, 961.0, 559.0, 374.0, 227.0, 198.0, 107.0, 88.0, 65.0, 41.0, 49.0, 24.0, 16.0, 15.0, 10.0, 6.0, 2.0, 4.0, 2.0, 2.0, 0.0, 3.0], "bins": [-1.763671875, -1.7137298583984375, -1.663787841796875, -1.6138458251953125, -1.56390380859375, -1.5139617919921875, -1.464019775390625, -1.4140777587890625, -1.3641357421875, -1.3141937255859375, -1.264251708984375, -1.2143096923828125, -1.16436767578125, -1.1144256591796875, -1.064483642578125, -1.0145416259765625, -0.964599609375, -0.9146575927734375, -0.864715576171875, -0.8147735595703125, -0.76483154296875, -0.7148895263671875, -0.664947509765625, -0.6150054931640625, -0.5650634765625, -0.5151214599609375, -0.465179443359375, -0.4152374267578125, -0.36529541015625, -0.3153533935546875, -0.265411376953125, -0.2154693603515625, -0.16552734375, -0.1155853271484375, -0.065643310546875, -0.0157012939453125, 0.03424072265625, 0.0841827392578125, 0.134124755859375, 0.1840667724609375, 0.2340087890625, 0.2839508056640625, 0.333892822265625, 0.3838348388671875, 0.43377685546875, 0.4837188720703125, 0.533660888671875, 0.5836029052734375, 0.633544921875, 0.6834869384765625, 0.733428955078125, 0.7833709716796875, 0.83331298828125, 0.8832550048828125, 0.933197021484375, 0.9831390380859375, 1.0330810546875, 1.0830230712890625, 1.132965087890625, 1.1829071044921875, 1.23284912109375, 1.2827911376953125, 1.332733154296875, 1.3826751708984375, 1.4326171875]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 3.0, 3.0, 5.0, 12.0, 15.0, 11.0, 13.0, 20.0, 25.0, 23.0, 35.0, 30.0, 38.0, 46.0, 46.0, 59.0, 86.0, 154.0, 315.0, 1390.0, 197.0, 99.0, 67.0, 51.0, 40.0, 38.0, 37.0, 24.0, 23.0, 18.0, 26.0, 18.0, 10.0, 16.0, 8.0, 7.0, 10.0, 11.0, 7.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.82421875, -4.67431640625, -4.5244140625, -4.37451171875, -4.224609375, -4.07470703125, -3.9248046875, -3.77490234375, -3.625, -3.47509765625, -3.3251953125, -3.17529296875, -3.025390625, -2.87548828125, -2.7255859375, -2.57568359375, -2.42578125, -2.27587890625, -2.1259765625, -1.97607421875, -1.826171875, -1.67626953125, -1.5263671875, -1.37646484375, -1.2265625, -1.07666015625, -0.9267578125, -0.77685546875, -0.626953125, -0.47705078125, -0.3271484375, -0.17724609375, -0.02734375, 0.12255859375, 0.2724609375, 0.42236328125, 0.572265625, 0.72216796875, 0.8720703125, 1.02197265625, 1.171875, 1.32177734375, 1.4716796875, 1.62158203125, 1.771484375, 1.92138671875, 2.0712890625, 2.22119140625, 2.37109375, 2.52099609375, 2.6708984375, 2.82080078125, 2.970703125, 3.12060546875, 3.2705078125, 3.42041015625, 3.5703125, 3.72021484375, 3.8701171875, 4.02001953125, 4.169921875, 4.31982421875, 4.4697265625, 4.61962890625, 4.76953125]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 6.0, 11.0, 7.0, 15.0, 12.0, 10.0, 16.0, 18.0, 23.0, 25.0, 37.0, 51.0, 73.0, 103.0, 155.0, 290.0, 572.0, 1856.0, 24930.0, 2746057.0, 363908.0, 5446.0, 961.0, 404.0, 228.0, 131.0, 90.0, 62.0, 45.0, 23.0, 29.0, 22.0, 17.0, 18.0, 12.0, 15.0, 6.0, 5.0, 5.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.65625, -9.352294921875, -9.04833984375, -8.744384765625, -8.4404296875, -8.136474609375, -7.83251953125, -7.528564453125, -7.224609375, -6.920654296875, -6.61669921875, -6.312744140625, -6.0087890625, -5.704833984375, -5.40087890625, -5.096923828125, -4.79296875, -4.489013671875, -4.18505859375, -3.881103515625, -3.5771484375, -3.273193359375, -2.96923828125, -2.665283203125, -2.361328125, -2.057373046875, -1.75341796875, -1.449462890625, -1.1455078125, -0.841552734375, -0.53759765625, -0.233642578125, 0.0703125, 0.374267578125, 0.67822265625, 0.982177734375, 1.2861328125, 1.590087890625, 1.89404296875, 2.197998046875, 2.501953125, 2.805908203125, 3.10986328125, 3.413818359375, 3.7177734375, 4.021728515625, 4.32568359375, 4.629638671875, 4.93359375, 5.237548828125, 5.54150390625, 5.845458984375, 6.1494140625, 6.453369140625, 6.75732421875, 7.061279296875, 7.365234375, 7.669189453125, 7.97314453125, 8.277099609375, 8.5810546875, 8.885009765625, 9.18896484375, 9.492919921875, 9.796875]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 30.0, 100.0, 245.0, 326.0, 214.0, 72.0, 15.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.365718841552734, -26.832176208496094, -26.298633575439453, -25.765090942382812, -25.231548309326172, -24.698007583618164, -24.164464950561523, -23.630922317504883, -23.097379684448242, -22.5638370513916, -22.03029441833496, -21.49675178527832, -20.963211059570312, -20.429668426513672, -19.89612579345703, -19.36258316040039, -18.82904052734375, -18.29549789428711, -17.76195526123047, -17.228412628173828, -16.694869995117188, -16.16132926940918, -15.627786636352539, -15.094244003295898, -14.560701370239258, -14.027158737182617, -13.493616104125977, -12.960074424743652, -12.426531791687012, -11.892989158630371, -11.359447479248047, -10.825904846191406, -10.292362213134766, -9.758819580078125, -9.225276947021484, -8.69173526763916, -8.15819263458252, -7.624650001525879, -7.0911078453063965, -6.557565689086914, -6.024022579193115, -5.490480422973633, -4.956937789916992, -4.423395156860352, -3.889853000640869, -3.3563106060028076, -2.822768211364746, -2.2892258167266846, -1.755683422088623, -1.2221410274505615, -0.6885986328125, -0.15505623817443848, 0.37848615646362305, 0.9120285511016846, 1.445570945739746, 1.9791133403778076, 2.512655735015869, 3.0461981296539307, 3.579740524291992, 4.113283157348633, 4.646825313568115, 5.180367469787598, 5.713910102844238, 6.247452735900879, 6.780994892120361]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 3.0, 7.0, 5.0, 7.0, 8.0, 7.0, 15.0, 12.0, 12.0, 10.0, 21.0, 19.0, 18.0, 27.0, 31.0, 35.0, 40.0, 25.0, 37.0, 46.0, 39.0, 28.0, 42.0, 32.0, 32.0, 31.0, 31.0, 37.0, 36.0, 29.0, 34.0, 33.0, 32.0, 29.0, 13.0, 29.0, 19.0, 9.0, 11.0, 14.0, 9.0, 12.0, 8.0, 10.0, 9.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-13.07627010345459, -12.650373458862305, -12.224477767944336, -11.79858112335205, -11.372684478759766, -10.946788787841797, -10.520892143249512, -10.094995498657227, -9.669099807739258, -9.243203163146973, -8.817307472229004, -8.391410827636719, -7.965514659881592, -7.539618492126465, -7.11372184753418, -6.687825679779053, -6.261929035186768, -5.836032867431641, -5.4101362228393555, -4.9842400550842285, -4.558343887329102, -4.132447242736816, -3.7065510749816895, -3.2806549072265625, -2.8547585010528564, -2.4288620948791504, -2.0029659271240234, -1.5770695209503174, -1.1511732339859009, -0.7252769470214844, -0.2993805408477783, 0.12651562690734863, 0.5524120330810547, 0.9783083200454712, 1.4042046070098877, 1.8301010131835938, 2.2559971809387207, 2.6818935871124268, 3.107789993286133, 3.5336861610412598, 3.959582567214966, 4.385478973388672, 4.811375141143799, 5.237271308898926, 5.663167953491211, 6.089064121246338, 6.514960289001465, 6.94085693359375, 7.366753101348877, 7.792649269104004, 8.218545913696289, 8.644441604614258, 9.070338249206543, 9.496234893798828, 9.922130584716797, 10.348027229309082, 10.773923873901367, 11.199820518493652, 11.625716209411621, 12.051612854003906, 12.477509498596191, 12.90340518951416, 13.329301834106445, 13.755197525024414, 14.1810941696167]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 9.0, 4.0, 5.0, 10.0, 3.0, 12.0, 15.0, 15.0, 20.0, 26.0, 22.0, 23.0, 28.0, 25.0, 36.0, 27.0, 37.0, 36.0, 47.0, 35.0, 47.0, 42.0, 47.0, 37.0, 33.0, 30.0, 36.0, 33.0, 37.0, 29.0, 28.0, 28.0, 21.0, 14.0, 18.0, 19.0, 15.0, 12.0, 11.0, 9.0, 8.0, 7.0, 1.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.5, -1.4578704833984375, -1.415740966796875, -1.3736114501953125, -1.33148193359375, -1.2893524169921875, -1.247222900390625, -1.2050933837890625, -1.1629638671875, -1.1208343505859375, -1.078704833984375, -1.0365753173828125, -0.99444580078125, -0.9523162841796875, -0.910186767578125, -0.8680572509765625, -0.825927734375, -0.7837982177734375, -0.741668701171875, -0.6995391845703125, -0.65740966796875, -0.6152801513671875, -0.573150634765625, -0.5310211181640625, -0.4888916015625, -0.4467620849609375, -0.404632568359375, -0.3625030517578125, -0.32037353515625, -0.2782440185546875, -0.236114501953125, -0.1939849853515625, -0.15185546875, -0.1097259521484375, -0.067596435546875, -0.0254669189453125, 0.01666259765625, 0.0587921142578125, 0.100921630859375, 0.1430511474609375, 0.1851806640625, 0.2273101806640625, 0.269439697265625, 0.3115692138671875, 0.35369873046875, 0.3958282470703125, 0.437957763671875, 0.4800872802734375, 0.522216796875, 0.5643463134765625, 0.606475830078125, 0.6486053466796875, 0.69073486328125, 0.7328643798828125, 0.774993896484375, 0.8171234130859375, 0.8592529296875, 0.9013824462890625, 0.943511962890625, 0.9856414794921875, 1.02777099609375, 1.0699005126953125, 1.112030029296875, 1.1541595458984375, 1.1962890625]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 8.0, 7.0, 6.0, 13.0, 14.0, 14.0, 20.0, 19.0, 38.0, 52.0, 56.0, 78.0, 106.0, 180.0, 341.0, 752.0, 2231.0, 9942.0, 75733.0, 1169697.0, 2659620.0, 245612.0, 23152.0, 4187.0, 1185.0, 468.0, 200.0, 161.0, 100.0, 55.0, 57.0, 50.0, 23.0, 16.0, 17.0, 14.0, 11.0, 21.0, 8.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.65234375, -4.50335693359375, -4.3543701171875, -4.20538330078125, -4.056396484375, -3.90740966796875, -3.7584228515625, -3.60943603515625, -3.46044921875, -3.31146240234375, -3.1624755859375, -3.01348876953125, -2.864501953125, -2.71551513671875, -2.5665283203125, -2.41754150390625, -2.2685546875, -2.11956787109375, -1.9705810546875, -1.82159423828125, -1.672607421875, -1.52362060546875, -1.3746337890625, -1.22564697265625, -1.07666015625, -0.92767333984375, -0.7786865234375, -0.62969970703125, -0.480712890625, -0.33172607421875, -0.1827392578125, -0.03375244140625, 0.115234375, 0.26422119140625, 0.4132080078125, 0.56219482421875, 0.711181640625, 0.86016845703125, 1.0091552734375, 1.15814208984375, 1.30712890625, 1.45611572265625, 1.6051025390625, 1.75408935546875, 1.903076171875, 2.05206298828125, 2.2010498046875, 2.35003662109375, 2.4990234375, 2.64801025390625, 2.7969970703125, 2.94598388671875, 3.094970703125, 3.24395751953125, 3.3929443359375, 3.54193115234375, 3.69091796875, 3.83990478515625, 3.9888916015625, 4.13787841796875, 4.286865234375, 4.43585205078125, 4.5848388671875, 4.73382568359375, 4.8828125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 7.0, 14.0, 19.0, 25.0, 43.0, 65.0, 111.0, 189.0, 287.0, 429.0, 561.0, 639.0, 530.0, 420.0, 256.0, 172.0, 113.0, 75.0, 62.0, 22.0, 10.0, 8.0, 10.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.8671875, -8.667510986328125, -8.46783447265625, -8.268157958984375, -8.0684814453125, -7.868804931640625, -7.66912841796875, -7.469451904296875, -7.269775390625, -7.070098876953125, -6.87042236328125, -6.670745849609375, -6.4710693359375, -6.271392822265625, -6.07171630859375, -5.872039794921875, -5.67236328125, -5.472686767578125, -5.27301025390625, -5.073333740234375, -4.8736572265625, -4.673980712890625, -4.47430419921875, -4.274627685546875, -4.074951171875, -3.875274658203125, -3.67559814453125, -3.475921630859375, -3.2762451171875, -3.076568603515625, -2.87689208984375, -2.677215576171875, -2.4775390625, -2.277862548828125, -2.07818603515625, -1.878509521484375, -1.6788330078125, -1.479156494140625, -1.27947998046875, -1.079803466796875, -0.880126953125, -0.680450439453125, -0.48077392578125, -0.281097412109375, -0.0814208984375, 0.118255615234375, 0.31793212890625, 0.517608642578125, 0.71728515625, 0.916961669921875, 1.11663818359375, 1.316314697265625, 1.5159912109375, 1.715667724609375, 1.91534423828125, 2.115020751953125, 2.314697265625, 2.514373779296875, 2.71405029296875, 2.913726806640625, 3.1134033203125, 3.313079833984375, 3.51275634765625, 3.712432861328125, 3.912109375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 3.0, 9.0, 16.0, 17.0, 51.0, 77.0, 138.0, 201.0, 445.0, 969.0, 5580.0, 250136.0, 3817389.0, 113831.0, 3874.0, 828.0, 314.0, 150.0, 106.0, 49.0, 30.0, 17.0, 21.0, 7.0, 7.0, 4.0, 8.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.703125, -11.24267578125, -10.7822265625, -10.32177734375, -9.861328125, -9.40087890625, -8.9404296875, -8.47998046875, -8.01953125, -7.55908203125, -7.0986328125, -6.63818359375, -6.177734375, -5.71728515625, -5.2568359375, -4.79638671875, -4.3359375, -3.87548828125, -3.4150390625, -2.95458984375, -2.494140625, -2.03369140625, -1.5732421875, -1.11279296875, -0.65234375, -0.19189453125, 0.2685546875, 0.72900390625, 1.189453125, 1.64990234375, 2.1103515625, 2.57080078125, 3.03125, 3.49169921875, 3.9521484375, 4.41259765625, 4.873046875, 5.33349609375, 5.7939453125, 6.25439453125, 6.71484375, 7.17529296875, 7.6357421875, 8.09619140625, 8.556640625, 9.01708984375, 9.4775390625, 9.93798828125, 10.3984375, 10.85888671875, 11.3193359375, 11.77978515625, 12.240234375, 12.70068359375, 13.1611328125, 13.62158203125, 14.08203125, 14.54248046875, 15.0029296875, 15.46337890625, 15.923828125, 16.38427734375, 16.8447265625, 17.30517578125, 17.765625]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 26.0, 42.0, 95.0, 138.0, 178.0, 174.0, 158.0, 92.0, 61.0, 29.0, 7.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.693729400634766, -36.87528610229492, -36.05684280395508, -35.238399505615234, -34.41995620727539, -33.60151290893555, -32.7830696105957, -31.964624404907227, -31.146181106567383, -30.32773780822754, -29.509294509887695, -28.69085121154785, -27.872407913208008, -27.05396270751953, -26.235519409179688, -25.417076110839844, -24.5986328125, -23.780189514160156, -22.961746215820312, -22.14330291748047, -21.324859619140625, -20.50641632080078, -19.687973022460938, -18.86952781677246, -18.05108642578125, -17.232643127441406, -16.414199829101562, -15.595756530761719, -14.777312278747559, -13.958868980407715, -13.140425682067871, -12.321981430053711, -11.50353717803955, -10.685093879699707, -9.866650581359863, -9.048206329345703, -8.22976303100586, -7.411319732666016, -6.592876434326172, -5.77443265914917, -4.955989360809326, -4.137546062469482, -3.3191022872924805, -2.5006589889526367, -1.6822154521942139, -0.863771915435791, -0.045328617095947266, 0.7731151580810547, 1.5915584564208984, 2.4100019931793213, 3.228445529937744, 4.046888828277588, 4.86533260345459, 5.683775901794434, 6.502219200134277, 7.320662975311279, 8.139106750488281, 8.957550048828125, 9.775993347167969, 10.594436645507812, 11.412880897521973, 12.231324195861816, 13.04976749420166, 13.86821174621582, 14.686654090881348]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 5.0, 0.0, 1.0, 2.0, 6.0, 8.0, 8.0, 9.0, 6.0, 11.0, 16.0, 20.0, 20.0, 13.0, 22.0, 22.0, 34.0, 40.0, 39.0, 29.0, 48.0, 29.0, 40.0, 41.0, 42.0, 52.0, 45.0, 50.0, 37.0, 38.0, 34.0, 35.0, 39.0, 22.0, 24.0, 21.0, 18.0, 14.0, 13.0, 8.0, 15.0, 11.0, 7.0, 9.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.780960083007812, -12.321908950805664, -11.8628568649292, -11.40380573272705, -10.944753646850586, -10.485702514648438, -10.026651382446289, -9.567599296569824, -9.10854721069336, -8.649496078491211, -8.190443992614746, -7.731392860412598, -7.272340774536133, -6.813289642333984, -6.354238033294678, -5.895186424255371, -5.436135292053223, -4.977083683013916, -4.518032073974609, -4.058980941772461, -3.599929094314575, -3.1408774852752686, -2.681826114654541, -2.2227745056152344, -1.7637228965759277, -1.304671287536621, -0.845619797706604, -0.3865683078765869, 0.07248330116271973, 0.5315349102020264, 0.9905862808227539, 1.4496378898620605, 1.9086894989013672, 2.367741107940674, 2.8267927169799805, 3.285844087600708, 3.7448956966400146, 4.203947067260742, 4.662998676300049, 5.1220502853393555, 5.581101894378662, 6.040153503417969, 6.499205112457275, 6.958256721496582, 7.4173078536987305, 7.876359939575195, 8.335411071777344, 8.794462203979492, 9.253514289855957, 9.712565422058105, 10.17161750793457, 10.630668640136719, 11.089720726013184, 11.548771858215332, 12.007823944091797, 12.466875076293945, 12.925926208496094, 13.384977340698242, 13.844029426574707, 14.303080558776855, 14.76213264465332, 15.221183776855469, 15.680234909057617, 16.139286041259766, 16.598339080810547]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 7.0, 5.0, 1.0, 10.0, 6.0, 13.0, 9.0, 16.0, 12.0, 13.0, 15.0, 31.0, 25.0, 21.0, 26.0, 37.0, 35.0, 37.0, 43.0, 46.0, 28.0, 52.0, 45.0, 41.0, 48.0, 39.0, 37.0, 44.0, 33.0, 30.0, 35.0, 27.0, 20.0, 22.0, 19.0, 16.0, 14.0, 8.0, 7.0, 10.0, 8.0, 10.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5712890625, -1.5255889892578125, -1.479888916015625, -1.4341888427734375, -1.38848876953125, -1.3427886962890625, -1.297088623046875, -1.2513885498046875, -1.2056884765625, -1.1599884033203125, -1.114288330078125, -1.0685882568359375, -1.02288818359375, -0.9771881103515625, -0.931488037109375, -0.8857879638671875, -0.840087890625, -0.7943878173828125, -0.748687744140625, -0.7029876708984375, -0.65728759765625, -0.6115875244140625, -0.565887451171875, -0.5201873779296875, -0.4744873046875, -0.4287872314453125, -0.383087158203125, -0.3373870849609375, -0.29168701171875, -0.2459869384765625, -0.200286865234375, -0.1545867919921875, -0.10888671875, -0.0631866455078125, -0.017486572265625, 0.0282135009765625, 0.07391357421875, 0.1196136474609375, 0.165313720703125, 0.2110137939453125, 0.2567138671875, 0.3024139404296875, 0.348114013671875, 0.3938140869140625, 0.43951416015625, 0.4852142333984375, 0.530914306640625, 0.5766143798828125, 0.622314453125, 0.6680145263671875, 0.713714599609375, 0.7594146728515625, 0.80511474609375, 0.8508148193359375, 0.896514892578125, 0.9422149658203125, 0.9879150390625, 1.0336151123046875, 1.079315185546875, 1.1250152587890625, 1.17071533203125, 1.2164154052734375, 1.262115478515625, 1.3078155517578125, 1.353515625]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 5.0, 7.0, 19.0, 17.0, 28.0, 43.0, 69.0, 92.0, 163.0, 239.0, 372.0, 528.0, 827.0, 1158.0, 1796.0, 2686.0, 4127.0, 6341.0, 9832.0, 15289.0, 24334.0, 39818.0, 68350.0, 134376.0, 311537.0, 200655.0, 91117.0, 50681.0, 30392.0, 18971.0, 12096.0, 7802.0, 4993.0, 3337.0, 2127.0, 1415.0, 980.0, 673.0, 461.0, 263.0, 184.0, 137.0, 78.0, 54.0, 36.0, 20.0, 15.0, 5.0, 8.0, 3.0, 2.0, 6.0, 1.0, 2.0], "bins": [-0.301025390625, -0.2923583984375, -0.28369140625, -0.2750244140625, -0.266357421875, -0.2576904296875, -0.2490234375, -0.2403564453125, -0.231689453125, -0.2230224609375, -0.21435546875, -0.2056884765625, -0.197021484375, -0.1883544921875, -0.1796875, -0.1710205078125, -0.162353515625, -0.1536865234375, -0.14501953125, -0.1363525390625, -0.127685546875, -0.1190185546875, -0.1103515625, -0.1016845703125, -0.093017578125, -0.0843505859375, -0.07568359375, -0.0670166015625, -0.058349609375, -0.0496826171875, -0.041015625, -0.0323486328125, -0.023681640625, -0.0150146484375, -0.00634765625, 0.0023193359375, 0.010986328125, 0.0196533203125, 0.0283203125, 0.0369873046875, 0.045654296875, 0.0543212890625, 0.06298828125, 0.0716552734375, 0.080322265625, 0.0889892578125, 0.09765625, 0.1063232421875, 0.114990234375, 0.1236572265625, 0.13232421875, 0.1409912109375, 0.149658203125, 0.1583251953125, 0.1669921875, 0.1756591796875, 0.184326171875, 0.1929931640625, 0.20166015625, 0.2103271484375, 0.218994140625, 0.2276611328125, 0.236328125, 0.2449951171875, 0.253662109375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 13.0, 7.0, 9.0, 12.0, 14.0, 17.0, 14.0, 27.0, 27.0, 18.0, 29.0, 31.0, 33.0, 42.0, 29.0, 45.0, 35.0, 47.0, 1056.0, 47.0, 43.0, 45.0, 29.0, 43.0, 31.0, 47.0, 23.0, 30.0, 35.0, 24.0, 33.0, 17.0, 8.0, 16.0, 15.0, 3.0, 14.0, 6.0, 4.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.88671875, -0.8589859008789062, -0.8312530517578125, -0.8035202026367188, -0.775787353515625, -0.7480545043945312, -0.7203216552734375, -0.6925888061523438, -0.66485595703125, -0.6371231079101562, -0.6093902587890625, -0.5816574096679688, -0.553924560546875, -0.5261917114257812, -0.4984588623046875, -0.47072601318359375, -0.4429931640625, -0.41526031494140625, -0.3875274658203125, -0.35979461669921875, -0.332061767578125, -0.30432891845703125, -0.2765960693359375, -0.24886322021484375, -0.22113037109375, -0.19339752197265625, -0.1656646728515625, -0.13793182373046875, -0.110198974609375, -0.08246612548828125, -0.0547332763671875, -0.02700042724609375, 0.000732421875, 0.02846527099609375, 0.0561981201171875, 0.08393096923828125, 0.111663818359375, 0.13939666748046875, 0.1671295166015625, 0.19486236572265625, 0.22259521484375, 0.25032806396484375, 0.2780609130859375, 0.30579376220703125, 0.333526611328125, 0.36125946044921875, 0.3889923095703125, 0.41672515869140625, 0.4444580078125, 0.47219085693359375, 0.4999237060546875, 0.5276565551757812, 0.555389404296875, 0.5831222534179688, 0.6108551025390625, 0.6385879516601562, 0.66632080078125, 0.6940536499023438, 0.7217864990234375, 0.7495193481445312, 0.777252197265625, 0.8049850463867188, 0.8327178955078125, 0.8604507446289062, 0.88818359375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 3.0, 9.0, 14.0, 21.0, 25.0, 38.0, 62.0, 78.0, 121.0, 186.0, 257.0, 402.0, 610.0, 901.0, 1438.0, 2098.0, 3247.0, 5145.0, 7987.0, 12615.0, 19977.0, 33368.0, 55336.0, 99462.0, 209679.0, 1333621.0, 132897.0, 69595.0, 40969.0, 24646.0, 15078.0, 9653.0, 6208.0, 3974.0, 2524.0, 1687.0, 1079.0, 693.0, 445.0, 313.0, 206.0, 144.0, 100.0, 65.0, 48.0, 40.0, 29.0, 18.0, 9.0, 7.0, 3.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.2445068359375, -0.23691558837890625, -0.2293243408203125, -0.22173309326171875, -0.214141845703125, -0.20655059814453125, -0.1989593505859375, -0.19136810302734375, -0.18377685546875, -0.17618560791015625, -0.1685943603515625, -0.16100311279296875, -0.153411865234375, -0.14582061767578125, -0.1382293701171875, -0.13063812255859375, -0.123046875, -0.11545562744140625, -0.1078643798828125, -0.10027313232421875, -0.092681884765625, -0.08509063720703125, -0.0774993896484375, -0.06990814208984375, -0.06231689453125, -0.05472564697265625, -0.0471343994140625, -0.03954315185546875, -0.031951904296875, -0.02436065673828125, -0.0167694091796875, -0.00917816162109375, -0.0015869140625, 0.00600433349609375, 0.0135955810546875, 0.02118682861328125, 0.028778076171875, 0.03636932373046875, 0.0439605712890625, 0.05155181884765625, 0.05914306640625, 0.06673431396484375, 0.0743255615234375, 0.08191680908203125, 0.089508056640625, 0.09709930419921875, 0.1046905517578125, 0.11228179931640625, 0.119873046875, 0.12746429443359375, 0.1350555419921875, 0.14264678955078125, 0.150238037109375, 0.15782928466796875, 0.1654205322265625, 0.17301177978515625, 0.18060302734375, 0.18819427490234375, 0.1957855224609375, 0.20337677001953125, 0.210968017578125, 0.21855926513671875, 0.2261505126953125, 0.23374176025390625, 0.2413330078125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 1.0, 1.0, 5.0, 6.0, 6.0, 4.0, 5.0, 8.0, 12.0, 11.0, 8.0, 21.0, 25.0, 19.0, 30.0, 26.0, 40.0, 43.0, 47.0, 46.0, 44.0, 46.0, 55.0, 55.0, 51.0, 55.0, 40.0, 43.0, 38.0, 40.0, 31.0, 22.0, 18.0, 20.0, 15.0, 19.0, 12.0, 7.0, 7.0, 7.0, 3.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0001678466796875, -0.00016313977539539337, -0.00015843287110328674, -0.00015372596681118011, -0.00014901906251907349, -0.00014431215822696686, -0.00013960525393486023, -0.0001348983496427536, -0.00013019144535064697, -0.00012548454105854034, -0.00012077763676643372, -0.00011607073247432709, -0.00011136382818222046, -0.00010665692389011383, -0.0001019500195980072, -9.724311530590057e-05, -9.253621101379395e-05, -8.782930672168732e-05, -8.312240242958069e-05, -7.841549813747406e-05, -7.370859384536743e-05, -6.90016895532608e-05, -6.429478526115417e-05, -5.9587880969047546e-05, -5.488097667694092e-05, -5.017407238483429e-05, -4.546716809272766e-05, -4.076026380062103e-05, -3.6053359508514404e-05, -3.1346455216407776e-05, -2.6639550924301147e-05, -2.193264663219452e-05, -1.722574234008789e-05, -1.2518838047981262e-05, -7.811933755874634e-06, -3.1050294637680054e-06, 1.601874828338623e-06, 6.3087791204452515e-06, 1.101568341255188e-05, 1.5722587704658508e-05, 2.0429491996765137e-05, 2.5136396288871765e-05, 2.9843300580978394e-05, 3.455020487308502e-05, 3.925710916519165e-05, 4.396401345729828e-05, 4.867091774940491e-05, 5.3377822041511536e-05, 5.8084726333618164e-05, 6.279163062572479e-05, 6.749853491783142e-05, 7.220543920993805e-05, 7.691234350204468e-05, 8.16192477941513e-05, 8.632615208625793e-05, 9.103305637836456e-05, 9.573996067047119e-05, 0.00010044686496257782, 0.00010515376925468445, 0.00010986067354679108, 0.0001145675778388977, 0.00011927448213100433, 0.00012398138642311096, 0.0001286882907152176, 0.00013339519500732422]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 6.0, 7.0, 12.0, 10.0, 17.0, 12.0, 20.0, 35.0, 27.0, 54.0, 64.0, 79.0, 101.0, 124.0, 161.0, 206.0, 323.0, 548.0, 2892.0, 980844.0, 60567.0, 947.0, 408.0, 295.0, 195.0, 153.0, 93.0, 95.0, 54.0, 53.0, 34.0, 25.0, 40.0, 13.0, 18.0, 6.0, 5.0, 4.0, 2.0, 0.0, 5.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0025768280029296875, -0.0024839043617248535, -0.0023909807205200195, -0.0022980570793151855, -0.0022051334381103516, -0.0021122097969055176, -0.0020192861557006836, -0.0019263625144958496, -0.0018334388732910156, -0.0017405152320861816, -0.0016475915908813477, -0.0015546679496765137, -0.0014617443084716797, -0.0013688206672668457, -0.0012758970260620117, -0.0011829733848571777, -0.0010900497436523438, -0.0009971261024475098, -0.0009042024612426758, -0.0008112788200378418, -0.0007183551788330078, -0.0006254315376281738, -0.0005325078964233398, -0.00043958425521850586, -0.0003466606140136719, -0.0002537369728088379, -0.0001608133316040039, -6.788969039916992e-05, 2.5033950805664062e-05, 0.00011795759201049805, 0.00021088123321533203, 0.000303804874420166, 0.000396728515625, 0.000489652156829834, 0.000582575798034668, 0.000675499439239502, 0.0007684230804443359, 0.0008613467216491699, 0.0009542703628540039, 0.0010471940040588379, 0.0011401176452636719, 0.0012330412864685059, 0.0013259649276733398, 0.0014188885688781738, 0.0015118122100830078, 0.0016047358512878418, 0.0016976594924926758, 0.0017905831336975098, 0.0018835067749023438, 0.0019764304161071777, 0.0020693540573120117, 0.0021622776985168457, 0.0022552013397216797, 0.0023481249809265137, 0.0024410486221313477, 0.0025339722633361816, 0.0026268959045410156, 0.0027198195457458496, 0.0028127431869506836, 0.0029056668281555176, 0.0029985904693603516, 0.0030915141105651855, 0.0031844377517700195, 0.0032773613929748535, 0.0033702850341796875]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 45.0, 175.0, 337.0, 286.0, 121.0, 39.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00024024049344006926, -0.00023130580666474998, -0.00022237110533751547, -0.0002134364185621962, -0.00020450173178687692, -0.0001955670304596424, -0.00018663234368432313, -0.00017769765690900385, -0.00016876295558176935, -0.00015982826880645007, -0.00015089356747921556, -0.00014195888070389628, -0.000133024193928577, -0.00012408950715325773, -0.00011515480582602322, -0.00010622011905070394, -9.728543227538466e-05, -8.835073822410777e-05, -7.94160514487885e-05, -7.04813573975116e-05, -6.154667062219232e-05, -5.261197657091543e-05, -4.367728251963854e-05, -3.474259574431926e-05, -2.5807901693042368e-05, -1.6873211279744282e-05, -7.938519047456793e-06, 9.961731848306954e-07, 9.93086359812878e-06, 1.8865554011426866e-05, 2.780024806270376e-05, 3.673493483802304e-05, 4.566964344121516e-05, 5.460433385451324e-05, 6.353902426781133e-05, 7.247371831908822e-05, 8.14084050944075e-05, 9.034309914568439e-05, 9.927779319696128e-05, 0.00010821247997228056, 0.00011714717402355745, 0.00012608186807483435, 0.00013501655485015363, 0.0001439512416254729, 0.0001528859429527074, 0.0001618206297280267, 0.00017075531650334597, 0.00017969001783058047, 0.00018862470460589975, 0.00019755939138121903, 0.00020649409270845354, 0.00021542877948377281, 0.0002243634662590921, 0.0002332981675863266, 0.00024223285436164588, 0.00025116754113696516, 0.00026010224246419966, 0.00026903694379143417, 0.0002779716160148382, 0.0002869063173420727, 0.00029584101866930723, 0.0003047756908927113, 0.0003137103922199458, 0.00032264506444334984, 0.00033157976577058434]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 2.0, 4.0, 0.0, 7.0, 8.0, 11.0, 13.0, 26.0, 17.0, 25.0, 26.0, 22.0, 25.0, 28.0, 35.0, 35.0, 33.0, 24.0, 48.0, 43.0, 42.0, 41.0, 54.0, 30.0, 45.0, 41.0, 28.0, 30.0, 32.0, 16.0, 39.0, 21.0, 29.0, 21.0, 18.0, 16.0, 15.0, 10.0, 13.0, 5.0, 4.0, 9.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-9.417533874511719e-05, -9.147822856903076e-05, -8.878111839294434e-05, -8.608400821685791e-05, -8.338689804077148e-05, -8.068978786468506e-05, -7.799267768859863e-05, -7.529556751251221e-05, -7.259845733642578e-05, -6.990134716033936e-05, -6.720423698425293e-05, -6.45071268081665e-05, -6.181001663208008e-05, -5.911290645599365e-05, -5.6415796279907227e-05, -5.37186861038208e-05, -5.1021575927734375e-05, -4.832446575164795e-05, -4.5627355575561523e-05, -4.29302453994751e-05, -4.023313522338867e-05, -3.7536025047302246e-05, -3.483891487121582e-05, -3.2141804695129395e-05, -2.944469451904297e-05, -2.6747584342956543e-05, -2.4050474166870117e-05, -2.135336399078369e-05, -1.8656253814697266e-05, -1.595914363861084e-05, -1.3262033462524414e-05, -1.0564923286437988e-05, -7.867813110351562e-06, -5.170702934265137e-06, -2.473592758178711e-06, 2.2351741790771484e-07, 2.9206275939941406e-06, 5.617737770080566e-06, 8.314847946166992e-06, 1.1011958122253418e-05, 1.3709068298339844e-05, 1.640617847442627e-05, 1.9103288650512695e-05, 2.180039882659912e-05, 2.4497509002685547e-05, 2.7194619178771973e-05, 2.98917293548584e-05, 3.2588839530944824e-05, 3.528594970703125e-05, 3.7983059883117676e-05, 4.06801700592041e-05, 4.337728023529053e-05, 4.607439041137695e-05, 4.877150058746338e-05, 5.1468610763549805e-05, 5.416572093963623e-05, 5.6862831115722656e-05, 5.955994129180908e-05, 6.225705146789551e-05, 6.495416164398193e-05, 6.765127182006836e-05, 7.034838199615479e-05, 7.304549217224121e-05, 7.574260234832764e-05, 7.843971252441406e-05]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 7.0, 5.0, 1.0, 10.0, 6.0, 13.0, 9.0, 16.0, 12.0, 13.0, 15.0, 31.0, 25.0, 21.0, 26.0, 37.0, 35.0, 37.0, 43.0, 46.0, 28.0, 52.0, 45.0, 41.0, 48.0, 39.0, 37.0, 44.0, 33.0, 30.0, 35.0, 27.0, 20.0, 22.0, 19.0, 16.0, 14.0, 8.0, 7.0, 10.0, 8.0, 10.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5712890625, -1.5255889892578125, -1.479888916015625, -1.4341888427734375, -1.38848876953125, -1.3427886962890625, -1.297088623046875, -1.2513885498046875, -1.2056884765625, -1.1599884033203125, -1.114288330078125, -1.0685882568359375, -1.02288818359375, -0.9771881103515625, -0.931488037109375, -0.8857879638671875, -0.840087890625, -0.7943878173828125, -0.748687744140625, -0.7029876708984375, -0.65728759765625, -0.6115875244140625, -0.565887451171875, -0.5201873779296875, -0.4744873046875, -0.4287872314453125, -0.383087158203125, -0.3373870849609375, -0.29168701171875, -0.2459869384765625, -0.200286865234375, -0.1545867919921875, -0.10888671875, -0.0631866455078125, -0.017486572265625, 0.0282135009765625, 0.07391357421875, 0.1196136474609375, 0.165313720703125, 0.2110137939453125, 0.2567138671875, 0.3024139404296875, 0.348114013671875, 0.3938140869140625, 0.43951416015625, 0.4852142333984375, 0.530914306640625, 0.5766143798828125, 0.622314453125, 0.6680145263671875, 0.713714599609375, 0.7594146728515625, 0.80511474609375, 0.8508148193359375, 0.896514892578125, 0.9422149658203125, 0.9879150390625, 1.0336151123046875, 1.079315185546875, 1.1250152587890625, 1.17071533203125, 1.2164154052734375, 1.262115478515625, 1.3078155517578125, 1.353515625]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 7.0, 4.0, 5.0, 7.0, 8.0, 15.0, 15.0, 15.0, 36.0, 41.0, 56.0, 84.0, 93.0, 117.0, 144.0, 237.0, 312.0, 386.0, 677.0, 1065.0, 1561.0, 2738.0, 4788.0, 8808.0, 17480.0, 36762.0, 86699.0, 216883.0, 357714.0, 176669.0, 70469.0, 30908.0, 15003.0, 7761.0, 4166.0, 2349.0, 1490.0, 926.0, 592.0, 405.0, 283.0, 205.0, 151.0, 107.0, 86.0, 67.0, 45.0, 39.0, 26.0, 18.0, 16.0, 11.0, 8.0, 8.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.4716796875, -1.426239013671875, -1.38079833984375, -1.335357666015625, -1.2899169921875, -1.244476318359375, -1.19903564453125, -1.153594970703125, -1.108154296875, -1.062713623046875, -1.01727294921875, -0.971832275390625, -0.9263916015625, -0.880950927734375, -0.83551025390625, -0.790069580078125, -0.74462890625, -0.699188232421875, -0.65374755859375, -0.608306884765625, -0.5628662109375, -0.517425537109375, -0.47198486328125, -0.426544189453125, -0.381103515625, -0.335662841796875, -0.29022216796875, -0.244781494140625, -0.1993408203125, -0.153900146484375, -0.10845947265625, -0.063018798828125, -0.017578125, 0.027862548828125, 0.07330322265625, 0.118743896484375, 0.1641845703125, 0.209625244140625, 0.25506591796875, 0.300506591796875, 0.345947265625, 0.391387939453125, 0.43682861328125, 0.482269287109375, 0.5277099609375, 0.573150634765625, 0.61859130859375, 0.664031982421875, 0.70947265625, 0.754913330078125, 0.80035400390625, 0.845794677734375, 0.8912353515625, 0.936676025390625, 0.98211669921875, 1.027557373046875, 1.072998046875, 1.118438720703125, 1.16387939453125, 1.209320068359375, 1.2547607421875, 1.300201416015625, 1.34564208984375, 1.391082763671875, 1.4365234375]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 2.0, 2.0, 5.0, 7.0, 2.0, 12.0, 9.0, 12.0, 17.0, 13.0, 26.0, 19.0, 20.0, 35.0, 30.0, 32.0, 40.0, 40.0, 42.0, 60.0, 77.0, 220.0, 1505.0, 288.0, 102.0, 59.0, 59.0, 30.0, 28.0, 40.0, 29.0, 30.0, 25.0, 25.0, 19.0, 21.0, 12.0, 13.0, 7.0, 5.0, 8.0, 6.0, 1.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.91796875, -4.76275634765625, -4.6075439453125, -4.45233154296875, -4.297119140625, -4.14190673828125, -3.9866943359375, -3.83148193359375, -3.67626953125, -3.52105712890625, -3.3658447265625, -3.21063232421875, -3.055419921875, -2.90020751953125, -2.7449951171875, -2.58978271484375, -2.4345703125, -2.27935791015625, -2.1241455078125, -1.96893310546875, -1.813720703125, -1.65850830078125, -1.5032958984375, -1.34808349609375, -1.19287109375, -1.03765869140625, -0.8824462890625, -0.72723388671875, -0.572021484375, -0.41680908203125, -0.2615966796875, -0.10638427734375, 0.048828125, 0.20404052734375, 0.3592529296875, 0.51446533203125, 0.669677734375, 0.82489013671875, 0.9801025390625, 1.13531494140625, 1.29052734375, 1.44573974609375, 1.6009521484375, 1.75616455078125, 1.911376953125, 2.06658935546875, 2.2218017578125, 2.37701416015625, 2.5322265625, 2.68743896484375, 2.8426513671875, 2.99786376953125, 3.153076171875, 3.30828857421875, 3.4635009765625, 3.61871337890625, 3.77392578125, 3.92913818359375, 4.0843505859375, 4.23956298828125, 4.394775390625, 4.54998779296875, 4.7052001953125, 4.86041259765625, 5.015625]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 5.0, 6.0, 8.0, 9.0, 11.0, 9.0, 16.0, 23.0, 29.0, 30.0, 36.0, 51.0, 83.0, 98.0, 156.0, 293.0, 687.0, 2709.0, 42081.0, 2906076.0, 185113.0, 6097.0, 1011.0, 330.0, 198.0, 147.0, 97.0, 67.0, 47.0, 27.0, 37.0, 25.0, 23.0, 20.0, 8.0, 8.0, 5.0, 9.0, 5.0, 7.0, 5.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-10.1640625, -9.879150390625, -9.59423828125, -9.309326171875, -9.0244140625, -8.739501953125, -8.45458984375, -8.169677734375, -7.884765625, -7.599853515625, -7.31494140625, -7.030029296875, -6.7451171875, -6.460205078125, -6.17529296875, -5.890380859375, -5.60546875, -5.320556640625, -5.03564453125, -4.750732421875, -4.4658203125, -4.180908203125, -3.89599609375, -3.611083984375, -3.326171875, -3.041259765625, -2.75634765625, -2.471435546875, -2.1865234375, -1.901611328125, -1.61669921875, -1.331787109375, -1.046875, -0.761962890625, -0.47705078125, -0.192138671875, 0.0927734375, 0.377685546875, 0.66259765625, 0.947509765625, 1.232421875, 1.517333984375, 1.80224609375, 2.087158203125, 2.3720703125, 2.656982421875, 2.94189453125, 3.226806640625, 3.51171875, 3.796630859375, 4.08154296875, 4.366455078125, 4.6513671875, 4.936279296875, 5.22119140625, 5.506103515625, 5.791015625, 6.075927734375, 6.36083984375, 6.645751953125, 6.9306640625, 7.215576171875, 7.50048828125, 7.785400390625, 8.0703125]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 6.0, 20.0, 135.0, 366.0, 348.0, 122.0, 16.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.35190200805664, -14.58341121673584, -13.814920425415039, -13.046428680419922, -12.277938842773438, -11.50944709777832, -10.74095630645752, -9.972465515136719, -9.203974723815918, -8.435483932495117, -7.666993141174316, -6.898501873016357, -6.130011081695557, -5.361520290374756, -4.593029022216797, -3.824538230895996, -3.0560474395751953, -2.2875566482543945, -1.5190656185150146, -0.7505745887756348, 0.017916202545166016, 0.7864069938659668, 1.5548982620239258, 2.3233890533447266, 3.0918798446655273, 3.860370635986328, 4.628861427307129, 5.397352695465088, 6.165843486785889, 6.9343342781066895, 7.702825546264648, 8.47131633758545, 9.23980712890625, 10.00829792022705, 10.776788711547852, 11.545280456542969, 12.313770294189453, 13.08226203918457, 13.850752830505371, 14.619243621826172, 15.387734413146973, 16.156225204467773, 16.92471694946289, 17.693206787109375, 18.461698532104492, 19.230188369750977, 19.998680114746094, 20.767169952392578, 21.535661697387695, 22.304153442382812, 23.072643280029297, 23.841135025024414, 24.6096248626709, 25.378116607666016, 26.1466064453125, 26.915098190307617, 27.683589935302734, 28.45208168029785, 29.220571517944336, 29.989063262939453, 30.757553100585938, 31.526044845581055, 32.29453659057617, 33.063026428222656, 33.83151626586914]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 4.0, 6.0, 5.0, 10.0, 7.0, 18.0, 20.0, 15.0, 21.0, 23.0, 32.0, 18.0, 33.0, 38.0, 26.0, 46.0, 41.0, 35.0, 44.0, 34.0, 49.0, 57.0, 42.0, 30.0, 29.0, 33.0, 29.0, 37.0, 37.0, 31.0, 20.0, 19.0, 22.0, 14.0, 11.0, 9.0, 12.0, 11.0, 6.0, 7.0, 11.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-17.569936752319336, -17.070125579833984, -16.5703125, -16.07050132751465, -15.57068920135498, -15.070877075195312, -14.571064949035645, -14.071252822875977, -13.571441650390625, -13.071629524230957, -12.571817398071289, -12.072006225585938, -11.57219409942627, -11.072381973266602, -10.572569847106934, -10.072757720947266, -9.572946548461914, -9.073134422302246, -8.573322296142578, -8.073511123657227, -7.573698997497559, -7.073886871337891, -6.574074745178223, -6.074263095855713, -5.574450492858887, -5.074638366699219, -4.574826717376709, -4.075014591217041, -3.5752029418945312, -3.0753908157348633, -2.5755789279937744, -2.0757670402526855, -1.5759553909301758, -1.076143503189087, -0.5763315558433533, -0.07651960849761963, 0.42329227924346924, 0.9231042861938477, 1.4229161739349365, 1.9227280616760254, 2.4225399494171143, 2.922351837158203, 3.422163724899292, 3.921975612640381, 4.421787738800049, 4.921599388122559, 5.421411514282227, 5.9212236404418945, 6.421035289764404, 6.920847415924072, 7.420659065246582, 7.92047119140625, 8.420283317565918, 8.920095443725586, 9.419906616210938, 9.919718742370605, 10.419530868530273, 10.919342994689941, 11.41915512084961, 11.918966293334961, 12.418778419494629, 12.918590545654297, 13.418402671813965, 13.918214797973633, 14.418025970458984]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 6.0, 4.0, 11.0, 12.0, 15.0, 8.0, 15.0, 17.0, 16.0, 19.0, 20.0, 19.0, 27.0, 29.0, 39.0, 35.0, 35.0, 39.0, 34.0, 41.0, 48.0, 51.0, 35.0, 41.0, 35.0, 44.0, 36.0, 32.0, 36.0, 31.0, 20.0, 29.0, 24.0, 11.0, 19.0, 19.0, 5.0, 8.0, 9.0, 7.0, 5.0, 8.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.6611328125, -1.6137237548828125, -1.566314697265625, -1.5189056396484375, -1.47149658203125, -1.4240875244140625, -1.376678466796875, -1.3292694091796875, -1.2818603515625, -1.2344512939453125, -1.187042236328125, -1.1396331787109375, -1.09222412109375, -1.0448150634765625, -0.997406005859375, -0.9499969482421875, -0.902587890625, -0.8551788330078125, -0.807769775390625, -0.7603607177734375, -0.71295166015625, -0.6655426025390625, -0.618133544921875, -0.5707244873046875, -0.5233154296875, -0.4759063720703125, -0.428497314453125, -0.3810882568359375, -0.33367919921875, -0.2862701416015625, -0.238861083984375, -0.1914520263671875, -0.14404296875, -0.0966339111328125, -0.049224853515625, -0.0018157958984375, 0.04559326171875, 0.0930023193359375, 0.140411376953125, 0.1878204345703125, 0.2352294921875, 0.2826385498046875, 0.330047607421875, 0.3774566650390625, 0.42486572265625, 0.4722747802734375, 0.519683837890625, 0.5670928955078125, 0.614501953125, 0.6619110107421875, 0.709320068359375, 0.7567291259765625, 0.80413818359375, 0.8515472412109375, 0.898956298828125, 0.9463653564453125, 0.9937744140625, 1.0411834716796875, 1.088592529296875, 1.1360015869140625, 1.18341064453125, 1.2308197021484375, 1.278228759765625, 1.3256378173828125, 1.373046875]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 7.0, 7.0, 11.0, 8.0, 12.0, 19.0, 13.0, 14.0, 16.0, 11.0, 13.0, 27.0, 20.0, 35.0, 49.0, 69.0, 136.0, 369.0, 1585.0, 11554.0, 330566.0, 3574222.0, 262910.0, 10400.0, 1398.0, 357.0, 125.0, 50.0, 32.0, 37.0, 37.0, 28.0, 18.0, 27.0, 15.0, 15.0, 14.0, 14.0, 10.0, 5.0, 7.0, 5.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-7.87109375, -7.64276123046875, -7.4144287109375, -7.18609619140625, -6.957763671875, -6.72943115234375, -6.5010986328125, -6.27276611328125, -6.04443359375, -5.81610107421875, -5.5877685546875, -5.35943603515625, -5.131103515625, -4.90277099609375, -4.6744384765625, -4.44610595703125, -4.2177734375, -3.98944091796875, -3.7611083984375, -3.53277587890625, -3.304443359375, -3.07611083984375, -2.8477783203125, -2.61944580078125, -2.39111328125, -2.16278076171875, -1.9344482421875, -1.70611572265625, -1.477783203125, -1.24945068359375, -1.0211181640625, -0.79278564453125, -0.564453125, -0.33612060546875, -0.1077880859375, 0.12054443359375, 0.348876953125, 0.57720947265625, 0.8055419921875, 1.03387451171875, 1.26220703125, 1.49053955078125, 1.7188720703125, 1.94720458984375, 2.175537109375, 2.40386962890625, 2.6322021484375, 2.86053466796875, 3.0888671875, 3.31719970703125, 3.5455322265625, 3.77386474609375, 4.002197265625, 4.23052978515625, 4.4588623046875, 4.68719482421875, 4.91552734375, 5.14385986328125, 5.3721923828125, 5.60052490234375, 5.828857421875, 6.05718994140625, 6.2855224609375, 6.51385498046875, 6.7421875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 7.0, 7.0, 6.0, 15.0, 16.0, 30.0, 28.0, 45.0, 57.0, 82.0, 123.0, 174.0, 239.0, 286.0, 395.0, 487.0, 452.0, 392.0, 329.0, 262.0, 168.0, 132.0, 89.0, 63.0, 45.0, 36.0, 19.0, 27.0, 25.0, 10.0, 7.0, 6.0, 6.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.27734375, -5.138763427734375, -5.00018310546875, -4.861602783203125, -4.7230224609375, -4.584442138671875, -4.44586181640625, -4.307281494140625, -4.168701171875, -4.030120849609375, -3.89154052734375, -3.752960205078125, -3.6143798828125, -3.475799560546875, -3.33721923828125, -3.198638916015625, -3.06005859375, -2.921478271484375, -2.78289794921875, -2.644317626953125, -2.5057373046875, -2.367156982421875, -2.22857666015625, -2.089996337890625, -1.951416015625, -1.812835693359375, -1.67425537109375, -1.535675048828125, -1.3970947265625, -1.258514404296875, -1.11993408203125, -0.981353759765625, -0.8427734375, -0.704193115234375, -0.56561279296875, -0.427032470703125, -0.2884521484375, -0.149871826171875, -0.01129150390625, 0.127288818359375, 0.265869140625, 0.404449462890625, 0.54302978515625, 0.681610107421875, 0.8201904296875, 0.958770751953125, 1.09735107421875, 1.235931396484375, 1.37451171875, 1.513092041015625, 1.65167236328125, 1.790252685546875, 1.9288330078125, 2.067413330078125, 2.20599365234375, 2.344573974609375, 2.483154296875, 2.621734619140625, 2.76031494140625, 2.898895263671875, 3.0374755859375, 3.176055908203125, 3.31463623046875, 3.453216552734375, 3.591796875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 12.0, 13.0, 18.0, 30.0, 30.0, 49.0, 42.0, 87.0, 125.0, 175.0, 289.0, 689.0, 2296.0, 16871.0, 521574.0, 3496196.0, 145684.0, 7594.0, 1375.0, 439.0, 243.0, 136.0, 91.0, 59.0, 43.0, 32.0, 26.0, 13.0, 12.0, 5.0, 10.0, 7.0, 4.0, 6.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.546875, -11.166259765625, -10.78564453125, -10.405029296875, -10.0244140625, -9.643798828125, -9.26318359375, -8.882568359375, -8.501953125, -8.121337890625, -7.74072265625, -7.360107421875, -6.9794921875, -6.598876953125, -6.21826171875, -5.837646484375, -5.45703125, -5.076416015625, -4.69580078125, -4.315185546875, -3.9345703125, -3.553955078125, -3.17333984375, -2.792724609375, -2.412109375, -2.031494140625, -1.65087890625, -1.270263671875, -0.8896484375, -0.509033203125, -0.12841796875, 0.252197265625, 0.6328125, 1.013427734375, 1.39404296875, 1.774658203125, 2.1552734375, 2.535888671875, 2.91650390625, 3.297119140625, 3.677734375, 4.058349609375, 4.43896484375, 4.819580078125, 5.2001953125, 5.580810546875, 5.96142578125, 6.342041015625, 6.72265625, 7.103271484375, 7.48388671875, 7.864501953125, 8.2451171875, 8.625732421875, 9.00634765625, 9.386962890625, 9.767578125, 10.148193359375, 10.52880859375, 10.909423828125, 11.2900390625, 11.670654296875, 12.05126953125, 12.431884765625, 12.8125]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 14.0, 35.0, 38.0, 64.0, 90.0, 103.0, 111.0, 114.0, 101.0, 113.0, 81.0, 56.0, 31.0, 15.0, 18.0, 9.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.88625717163086, -26.293231964111328, -25.700204849243164, -25.107179641723633, -24.51415252685547, -23.921127319335938, -23.328102111816406, -22.735076904296875, -22.14204978942871, -21.54902458190918, -20.955997467041016, -20.362972259521484, -19.769947052001953, -19.17691993713379, -18.583894729614258, -17.990867614746094, -17.397842407226562, -16.80481719970703, -16.211790084838867, -15.618764877319336, -15.025738716125488, -14.43271255493164, -13.83968734741211, -13.246661186218262, -12.653635025024414, -12.060608863830566, -11.467582702636719, -10.874557495117188, -10.28153133392334, -9.688505172729492, -9.095479965209961, -8.502453804016113, -7.909427642822266, -7.316401481628418, -6.7233757972717285, -6.130350112915039, -5.537323951721191, -4.944297790527344, -4.351272106170654, -3.758246421813965, -3.165220260620117, -2.5721943378448486, -1.97916841506958, -1.3861424922943115, -0.793116569519043, -0.20009064674377441, 0.39293527603149414, 0.9859609603881836, 1.5789871215820312, 2.1720130443573, 2.7650389671325684, 3.358064889907837, 3.9510908126831055, 4.544116973876953, 5.137142658233643, 5.730168342590332, 6.32319450378418, 6.916220664978027, 7.509246349334717, 8.102272033691406, 8.695298194885254, 9.288324356079102, 9.881349563598633, 10.47437572479248, 11.067401885986328]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 8.0, 7.0, 9.0, 15.0, 16.0, 15.0, 17.0, 13.0, 23.0, 29.0, 24.0, 13.0, 34.0, 33.0, 36.0, 34.0, 40.0, 38.0, 43.0, 40.0, 44.0, 40.0, 39.0, 38.0, 36.0, 36.0, 33.0, 34.0, 23.0, 24.0, 23.0, 25.0, 13.0, 12.0, 20.0, 10.0, 8.0, 14.0, 9.0, 10.0, 7.0, 3.0, 7.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.997387886047363, -13.576021194458008, -13.154654502868652, -12.733287811279297, -12.311921119689941, -11.890554428100586, -11.46918773651123, -11.047821044921875, -10.62645435333252, -10.205087661743164, -9.783720970153809, -9.362354278564453, -8.940987586975098, -8.519620895385742, -8.098254203796387, -7.676887512207031, -7.255520820617676, -6.83415412902832, -6.412787437438965, -5.991420745849609, -5.570054054260254, -5.148687362670898, -4.727320671081543, -4.3059539794921875, -3.884587287902832, -3.4632205963134766, -3.041853904724121, -2.6204872131347656, -2.19912052154541, -1.7777538299560547, -1.3563871383666992, -0.9350204467773438, -0.5136528015136719, -0.0922861099243164, 0.32908058166503906, 0.7504472732543945, 1.17181396484375, 1.5931806564331055, 2.014547348022461, 2.4359140396118164, 2.857280731201172, 3.2786474227905273, 3.700014114379883, 4.121380805969238, 4.542747497558594, 4.964114189147949, 5.385480880737305, 5.80684757232666, 6.228214263916016, 6.649580955505371, 7.070947647094727, 7.492314338684082, 7.9136810302734375, 8.335047721862793, 8.756414413452148, 9.177781105041504, 9.59914779663086, 10.020514488220215, 10.44188117980957, 10.863247871398926, 11.284614562988281, 11.705981254577637, 12.127347946166992, 12.548714637756348, 12.970081329345703]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 7.0, 5.0, 7.0, 10.0, 12.0, 10.0, 12.0, 11.0, 12.0, 14.0, 21.0, 19.0, 22.0, 23.0, 24.0, 29.0, 37.0, 44.0, 42.0, 41.0, 56.0, 50.0, 41.0, 36.0, 36.0, 37.0, 36.0, 32.0, 30.0, 31.0, 36.0, 26.0, 19.0, 24.0, 16.0, 22.0, 19.0, 9.0, 12.0, 8.0, 5.0, 5.0, 5.0, 3.0, 4.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.48046875, -1.432861328125, -1.38525390625, -1.337646484375, -1.2900390625, -1.242431640625, -1.19482421875, -1.147216796875, -1.099609375, -1.052001953125, -1.00439453125, -0.956787109375, -0.9091796875, -0.861572265625, -0.81396484375, -0.766357421875, -0.71875, -0.671142578125, -0.62353515625, -0.575927734375, -0.5283203125, -0.480712890625, -0.43310546875, -0.385498046875, -0.337890625, -0.290283203125, -0.24267578125, -0.195068359375, -0.1474609375, -0.099853515625, -0.05224609375, -0.004638671875, 0.04296875, 0.090576171875, 0.13818359375, 0.185791015625, 0.2333984375, 0.281005859375, 0.32861328125, 0.376220703125, 0.423828125, 0.471435546875, 0.51904296875, 0.566650390625, 0.6142578125, 0.661865234375, 0.70947265625, 0.757080078125, 0.8046875, 0.852294921875, 0.89990234375, 0.947509765625, 0.9951171875, 1.042724609375, 1.09033203125, 1.137939453125, 1.185546875, 1.233154296875, 1.28076171875, 1.328369140625, 1.3759765625, 1.423583984375, 1.47119140625, 1.518798828125, 1.56640625]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [5.0, 5.0, 4.0, 2.0, 1.0, 7.0, 12.0, 24.0, 36.0, 53.0, 53.0, 81.0, 104.0, 204.0, 262.0, 357.0, 471.0, 791.0, 1041.0, 1410.0, 2155.0, 2995.0, 4470.0, 6467.0, 9337.0, 13712.0, 19804.0, 30293.0, 47804.0, 79826.0, 151319.0, 284248.0, 160944.0, 82863.0, 49716.0, 31570.0, 21018.0, 14095.0, 9522.0, 6596.0, 4553.0, 3095.0, 2191.0, 1494.0, 1028.0, 774.0, 527.0, 354.0, 263.0, 202.0, 135.0, 86.0, 46.0, 51.0, 37.0, 24.0, 12.0, 7.0, 3.0, 7.0, 3.0, 3.0, 1.0, 3.0], "bins": [-0.251220703125, -0.243255615234375, -0.23529052734375, -0.227325439453125, -0.2193603515625, -0.211395263671875, -0.20343017578125, -0.195465087890625, -0.1875, -0.179534912109375, -0.17156982421875, -0.163604736328125, -0.1556396484375, -0.147674560546875, -0.13970947265625, -0.131744384765625, -0.123779296875, -0.115814208984375, -0.10784912109375, -0.099884033203125, -0.0919189453125, -0.083953857421875, -0.07598876953125, -0.068023681640625, -0.06005859375, -0.052093505859375, -0.04412841796875, -0.036163330078125, -0.0281982421875, -0.020233154296875, -0.01226806640625, -0.004302978515625, 0.003662109375, 0.011627197265625, 0.01959228515625, 0.027557373046875, 0.0355224609375, 0.043487548828125, 0.05145263671875, 0.059417724609375, 0.0673828125, 0.075347900390625, 0.08331298828125, 0.091278076171875, 0.0992431640625, 0.107208251953125, 0.11517333984375, 0.123138427734375, 0.131103515625, 0.139068603515625, 0.14703369140625, 0.154998779296875, 0.1629638671875, 0.170928955078125, 0.17889404296875, 0.186859130859375, 0.19482421875, 0.202789306640625, 0.21075439453125, 0.218719482421875, 0.2266845703125, 0.234649658203125, 0.24261474609375, 0.250579833984375, 0.258544921875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 8.0, 3.0, 2.0, 2.0, 4.0, 7.0, 5.0, 8.0, 11.0, 11.0, 13.0, 12.0, 10.0, 20.0, 36.0, 21.0, 28.0, 34.0, 31.0, 34.0, 41.0, 38.0, 35.0, 31.0, 40.0, 45.0, 1062.0, 30.0, 29.0, 36.0, 35.0, 26.0, 25.0, 30.0, 34.0, 27.0, 33.0, 20.0, 18.0, 16.0, 19.0, 13.0, 10.0, 5.0, 7.0, 6.0, 7.0, 7.0, 3.0, 2.0, 1.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8505859375, -0.821502685546875, -0.79241943359375, -0.763336181640625, -0.7342529296875, -0.705169677734375, -0.67608642578125, -0.647003173828125, -0.617919921875, -0.588836669921875, -0.55975341796875, -0.530670166015625, -0.5015869140625, -0.472503662109375, -0.44342041015625, -0.414337158203125, -0.38525390625, -0.356170654296875, -0.32708740234375, -0.298004150390625, -0.2689208984375, -0.239837646484375, -0.21075439453125, -0.181671142578125, -0.152587890625, -0.123504638671875, -0.09442138671875, -0.065338134765625, -0.0362548828125, -0.007171630859375, 0.02191162109375, 0.050994873046875, 0.080078125, 0.109161376953125, 0.13824462890625, 0.167327880859375, 0.1964111328125, 0.225494384765625, 0.25457763671875, 0.283660888671875, 0.312744140625, 0.341827392578125, 0.37091064453125, 0.399993896484375, 0.4290771484375, 0.458160400390625, 0.48724365234375, 0.516326904296875, 0.54541015625, 0.574493408203125, 0.60357666015625, 0.632659912109375, 0.6617431640625, 0.690826416015625, 0.71990966796875, 0.748992919921875, 0.778076171875, 0.807159423828125, 0.83624267578125, 0.865325927734375, 0.8944091796875, 0.923492431640625, 0.95257568359375, 0.981658935546875, 1.0107421875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 9.0, 9.0, 13.0, 17.0, 31.0, 51.0, 81.0, 122.0, 211.0, 275.0, 388.0, 597.0, 874.0, 1207.0, 1760.0, 2634.0, 3800.0, 5842.0, 8817.0, 13471.0, 20994.0, 32780.0, 54578.0, 94291.0, 186839.0, 1331382.0, 136924.0, 75695.0, 44536.0, 27501.0, 17494.0, 11323.0, 7310.0, 4874.0, 3359.0, 2299.0, 1469.0, 1062.0, 763.0, 459.0, 345.0, 195.0, 164.0, 105.0, 59.0, 49.0, 31.0, 17.0, 14.0, 9.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.24951171875, -0.24127578735351562, -0.23303985595703125, -0.22480392456054688, -0.2165679931640625, -0.20833206176757812, -0.20009613037109375, -0.19186019897460938, -0.183624267578125, -0.17538833618164062, -0.16715240478515625, -0.15891647338867188, -0.1506805419921875, -0.14244461059570312, -0.13420867919921875, -0.12597274780273438, -0.11773681640625, -0.10950088500976562, -0.10126495361328125, -0.09302902221679688, -0.0847930908203125, -0.07655715942382812, -0.06832122802734375, -0.060085296630859375, -0.051849365234375, -0.043613433837890625, -0.03537750244140625, -0.027141571044921875, -0.0189056396484375, -0.010669708251953125, -0.00243377685546875, 0.005802154541015625, 0.0140380859375, 0.022274017333984375, 0.03050994873046875, 0.038745880126953125, 0.0469818115234375, 0.055217742919921875, 0.06345367431640625, 0.07168960571289062, 0.079925537109375, 0.08816146850585938, 0.09639739990234375, 0.10463333129882812, 0.1128692626953125, 0.12110519409179688, 0.12934112548828125, 0.13757705688476562, 0.14581298828125, 0.15404891967773438, 0.16228485107421875, 0.17052078247070312, 0.1787567138671875, 0.18699264526367188, 0.19522857666015625, 0.20346450805664062, 0.211700439453125, 0.21993637084960938, 0.22817230224609375, 0.23640823364257812, 0.2446441650390625, 0.2528800964355469, 0.26111602783203125, 0.2693519592285156, 0.277587890625]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 8.0, 7.0, 11.0, 11.0, 11.0, 10.0, 19.0, 14.0, 30.0, 31.0, 36.0, 53.0, 42.0, 37.0, 48.0, 63.0, 49.0, 46.0, 41.0, 39.0, 46.0, 49.0, 46.0, 37.0, 36.0, 29.0, 25.0, 18.0, 17.0, 18.0, 13.0, 12.0, 8.0, 9.0, 9.0, 8.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.00016367435455322266, -0.00015834160149097443, -0.0001530088484287262, -0.00014767609536647797, -0.00014234334230422974, -0.0001370105892419815, -0.00013167783617973328, -0.00012634508311748505, -0.00012101233005523682, -0.00011567957699298859, -0.00011034682393074036, -0.00010501407086849213, -9.96813178062439e-05, -9.434856474399567e-05, -8.901581168174744e-05, -8.36830586194992e-05, -7.835030555725098e-05, -7.301755249500275e-05, -6.768479943275452e-05, -6.235204637050629e-05, -5.701929330825806e-05, -5.168654024600983e-05, -4.63537871837616e-05, -4.102103412151337e-05, -3.568828105926514e-05, -3.0355527997016907e-05, -2.5022774934768677e-05, -1.9690021872520447e-05, -1.4357268810272217e-05, -9.024515748023987e-06, -3.691762685775757e-06, 1.6409903764724731e-06, 6.973743438720703e-06, 1.2306496500968933e-05, 1.7639249563217163e-05, 2.2972002625465393e-05, 2.8304755687713623e-05, 3.363750874996185e-05, 3.897026181221008e-05, 4.430301487445831e-05, 4.963576793670654e-05, 5.496852099895477e-05, 6.0301274061203e-05, 6.563402712345123e-05, 7.096678018569946e-05, 7.629953324794769e-05, 8.163228631019592e-05, 8.696503937244415e-05, 9.229779243469238e-05, 9.763054549694061e-05, 0.00010296329855918884, 0.00010829605162143707, 0.0001136288046836853, 0.00011896155774593353, 0.00012429431080818176, 0.00012962706387043, 0.00013495981693267822, 0.00014029256999492645, 0.00014562532305717468, 0.0001509580761194229, 0.00015629082918167114, 0.00016162358224391937, 0.0001669563353061676, 0.00017228908836841583, 0.00017762184143066406]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 3.0, 4.0, 11.0, 9.0, 12.0, 23.0, 18.0, 25.0, 41.0, 45.0, 57.0, 71.0, 106.0, 109.0, 167.0, 275.0, 324.0, 613.0, 3339.0, 942681.0, 97947.0, 1150.0, 443.0, 254.0, 208.0, 116.0, 120.0, 93.0, 86.0, 54.0, 34.0, 31.0, 11.0, 13.0, 17.0, 10.0, 7.0, 7.0, 10.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0031909942626953125, -0.00308382511138916, -0.002976655960083008, -0.0028694868087768555, -0.002762317657470703, -0.0026551485061645508, -0.0025479793548583984, -0.002440810203552246, -0.0023336410522460938, -0.0022264719009399414, -0.002119302749633789, -0.0020121335983276367, -0.0019049644470214844, -0.001797795295715332, -0.0016906261444091797, -0.0015834569931030273, -0.001476287841796875, -0.0013691186904907227, -0.0012619495391845703, -0.001154780387878418, -0.0010476112365722656, -0.0009404420852661133, -0.0008332729339599609, -0.0007261037826538086, -0.0006189346313476562, -0.0005117654800415039, -0.00040459632873535156, -0.0002974271774291992, -0.00019025802612304688, -8.308887481689453e-05, 2.4080276489257812e-05, 0.00013124942779541016, 0.0002384185791015625, 0.00034558773040771484, 0.0004527568817138672, 0.0005599260330200195, 0.0006670951843261719, 0.0007742643356323242, 0.0008814334869384766, 0.000988602638244629, 0.0010957717895507812, 0.0012029409408569336, 0.001310110092163086, 0.0014172792434692383, 0.0015244483947753906, 0.001631617546081543, 0.0017387866973876953, 0.0018459558486938477, 0.001953125, 0.0020602941513061523, 0.0021674633026123047, 0.002274632453918457, 0.0023818016052246094, 0.0024889707565307617, 0.002596139907836914, 0.0027033090591430664, 0.0028104782104492188, 0.002917647361755371, 0.0030248165130615234, 0.0031319856643676758, 0.003239154815673828, 0.0033463239669799805, 0.003453493118286133, 0.003560662269592285, 0.0036678314208984375]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 8.0, 119.0, 523.0, 309.0, 49.0, 6.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0010006871307268739, -0.000982757075689733, -0.0009648269042372704, -0.0009468968492001295, -0.0009289667359553277, -0.000911036622710526, -0.0008931065676733851, -0.0008751764544285834, -0.0008572463411837816, -0.0008393162279389799, -0.0008213861146941781, -0.0008034560596570373, -0.0007855259464122355, -0.0007675958331674337, -0.0007496657781302929, -0.0007317356648854911, -0.0007138055516406894, -0.0006958754383958876, -0.0006779453251510859, -0.000660015270113945, -0.0006420851568691432, -0.0006241550436243415, -0.0006062249885872006, -0.0005882948753423989, -0.0005703647620975971, -0.0005524346488527954, -0.0005345045356079936, -0.0005165744805708528, -0.000498644367326051, -0.00048071425408124924, -0.00046278416994027793, -0.00044485408579930663, -0.00042692391434684396, -0.0004089938011020422, -0.0003910637169610709, -0.0003731336328200996, -0.00035520351957529783, -0.00033727340633049607, -0.00031934332218952477, -0.00030141323804855347, -0.0002834831248037517, -0.00026555301155894995, -0.00024762292741797864, -0.0002296928287250921, -0.00021176273003220558, -0.00019383263133931905, -0.00017590253264643252, -0.000157972433953546, -0.00014004234981257468, -0.00012211225111968815, -0.00010418215242680162, -8.625205373391509e-05, -6.832195504102856e-05, -5.039185634814203e-05, -3.2461757655255497e-05, -1.4531658962368965e-05, 3.398439730517566e-06, 2.1328538423404098e-05, 3.925863711629063e-05, 5.718873580917716e-05, 7.511883450206369e-05, 9.304893319495022e-05, 0.00011097903188783675, 0.00012890913058072329, 0.00014683922927360982]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 6.0, 12.0, 12.0, 11.0, 14.0, 19.0, 19.0, 23.0, 41.0, 20.0, 22.0, 32.0, 35.0, 29.0, 38.0, 35.0, 50.0, 45.0, 35.0, 48.0, 44.0, 42.0, 37.0, 37.0, 41.0, 33.0, 20.0, 27.0, 26.0, 24.0, 19.0, 19.0, 19.0, 10.0, 1.0, 14.0, 8.0, 2.0, 5.0, 8.0, 6.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0], "bins": [-0.00011289119720458984, -0.00010976940393447876, -0.00010664761066436768, -0.00010352581739425659, -0.00010040402412414551, -9.728223085403442e-05, -9.416043758392334e-05, -9.103864431381226e-05, -8.791685104370117e-05, -8.479505777359009e-05, -8.1673264503479e-05, -7.855147123336792e-05, -7.542967796325684e-05, -7.230788469314575e-05, -6.918609142303467e-05, -6.606429815292358e-05, -6.29425048828125e-05, -5.9820711612701416e-05, -5.669891834259033e-05, -5.357712507247925e-05, -5.0455331802368164e-05, -4.733353853225708e-05, -4.4211745262145996e-05, -4.108995199203491e-05, -3.796815872192383e-05, -3.4846365451812744e-05, -3.172457218170166e-05, -2.8602778911590576e-05, -2.5480985641479492e-05, -2.2359192371368408e-05, -1.9237399101257324e-05, -1.611560583114624e-05, -1.2993812561035156e-05, -9.872019290924072e-06, -6.750226020812988e-06, -3.6284327507019043e-06, -5.066394805908203e-07, 2.6151537895202637e-06, 5.736947059631348e-06, 8.858740329742432e-06, 1.1980533599853516e-05, 1.51023268699646e-05, 1.8224120140075684e-05, 2.1345913410186768e-05, 2.446770668029785e-05, 2.7589499950408936e-05, 3.071129322052002e-05, 3.3833086490631104e-05, 3.695487976074219e-05, 4.007667303085327e-05, 4.3198466300964355e-05, 4.632025957107544e-05, 4.9442052841186523e-05, 5.256384611129761e-05, 5.568563938140869e-05, 5.8807432651519775e-05, 6.192922592163086e-05, 6.505101919174194e-05, 6.817281246185303e-05, 7.129460573196411e-05, 7.44163990020752e-05, 7.753819227218628e-05, 8.065998554229736e-05, 8.378177881240845e-05, 8.690357208251953e-05]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 7.0, 5.0, 7.0, 10.0, 12.0, 10.0, 12.0, 11.0, 12.0, 14.0, 21.0, 19.0, 22.0, 23.0, 24.0, 29.0, 37.0, 44.0, 42.0, 41.0, 56.0, 50.0, 41.0, 36.0, 36.0, 37.0, 36.0, 32.0, 30.0, 31.0, 36.0, 26.0, 19.0, 24.0, 16.0, 22.0, 19.0, 9.0, 12.0, 8.0, 5.0, 5.0, 5.0, 3.0, 4.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.48046875, -1.432861328125, -1.38525390625, -1.337646484375, -1.2900390625, -1.242431640625, -1.19482421875, -1.147216796875, -1.099609375, -1.052001953125, -1.00439453125, -0.956787109375, -0.9091796875, -0.861572265625, -0.81396484375, -0.766357421875, -0.71875, -0.671142578125, -0.62353515625, -0.575927734375, -0.5283203125, -0.480712890625, -0.43310546875, -0.385498046875, -0.337890625, -0.290283203125, -0.24267578125, -0.195068359375, -0.1474609375, -0.099853515625, -0.05224609375, -0.004638671875, 0.04296875, 0.090576171875, 0.13818359375, 0.185791015625, 0.2333984375, 0.281005859375, 0.32861328125, 0.376220703125, 0.423828125, 0.471435546875, 0.51904296875, 0.566650390625, 0.6142578125, 0.661865234375, 0.70947265625, 0.757080078125, 0.8046875, 0.852294921875, 0.89990234375, 0.947509765625, 0.9951171875, 1.042724609375, 1.09033203125, 1.137939453125, 1.185546875, 1.233154296875, 1.28076171875, 1.328369140625, 1.3759765625, 1.423583984375, 1.47119140625, 1.518798828125, 1.56640625]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 9.0, 7.0, 5.0, 12.0, 10.0, 16.0, 30.0, 32.0, 38.0, 55.0, 95.0, 98.0, 154.0, 207.0, 337.0, 478.0, 789.0, 1611.0, 3246.0, 7989.0, 24446.0, 97705.0, 381692.0, 389632.0, 99418.0, 25117.0, 8116.0, 3231.0, 1514.0, 829.0, 556.0, 324.0, 200.0, 162.0, 111.0, 74.0, 61.0, 36.0, 35.0, 21.0, 22.0, 12.0, 8.0, 7.0, 4.0, 7.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.044921875, -1.976776123046875, -1.90863037109375, -1.840484619140625, -1.7723388671875, -1.704193115234375, -1.63604736328125, -1.567901611328125, -1.499755859375, -1.431610107421875, -1.36346435546875, -1.295318603515625, -1.2271728515625, -1.159027099609375, -1.09088134765625, -1.022735595703125, -0.95458984375, -0.886444091796875, -0.81829833984375, -0.750152587890625, -0.6820068359375, -0.613861083984375, -0.54571533203125, -0.477569580078125, -0.409423828125, -0.341278076171875, -0.27313232421875, -0.204986572265625, -0.1368408203125, -0.068695068359375, -0.00054931640625, 0.067596435546875, 0.1357421875, 0.203887939453125, 0.27203369140625, 0.340179443359375, 0.4083251953125, 0.476470947265625, 0.54461669921875, 0.612762451171875, 0.680908203125, 0.749053955078125, 0.81719970703125, 0.885345458984375, 0.9534912109375, 1.021636962890625, 1.08978271484375, 1.157928466796875, 1.22607421875, 1.294219970703125, 1.36236572265625, 1.430511474609375, 1.4986572265625, 1.566802978515625, 1.63494873046875, 1.703094482421875, 1.771240234375, 1.839385986328125, 1.90753173828125, 1.975677490234375, 2.0438232421875, 2.111968994140625, 2.18011474609375, 2.248260498046875, 2.31640625]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 7.0, 4.0, 6.0, 5.0, 11.0, 13.0, 11.0, 12.0, 12.0, 16.0, 28.0, 23.0, 24.0, 27.0, 34.0, 27.0, 40.0, 35.0, 60.0, 83.0, 112.0, 338.0, 1463.0, 152.0, 80.0, 58.0, 48.0, 52.0, 34.0, 34.0, 21.0, 18.0, 27.0, 19.0, 17.0, 18.0, 15.0, 11.0, 8.0, 10.0, 11.0, 8.0, 4.0, 5.0, 2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.16015625, -4.99981689453125, -4.8394775390625, -4.67913818359375, -4.518798828125, -4.35845947265625, -4.1981201171875, -4.03778076171875, -3.87744140625, -3.71710205078125, -3.5567626953125, -3.39642333984375, -3.236083984375, -3.07574462890625, -2.9154052734375, -2.75506591796875, -2.5947265625, -2.43438720703125, -2.2740478515625, -2.11370849609375, -1.953369140625, -1.79302978515625, -1.6326904296875, -1.47235107421875, -1.31201171875, -1.15167236328125, -0.9913330078125, -0.83099365234375, -0.670654296875, -0.51031494140625, -0.3499755859375, -0.18963623046875, -0.029296875, 0.13104248046875, 0.2913818359375, 0.45172119140625, 0.612060546875, 0.77239990234375, 0.9327392578125, 1.09307861328125, 1.25341796875, 1.41375732421875, 1.5740966796875, 1.73443603515625, 1.894775390625, 2.05511474609375, 2.2154541015625, 2.37579345703125, 2.5361328125, 2.69647216796875, 2.8568115234375, 3.01715087890625, 3.177490234375, 3.33782958984375, 3.4981689453125, 3.65850830078125, 3.81884765625, 3.97918701171875, 4.1395263671875, 4.29986572265625, 4.460205078125, 4.62054443359375, 4.7808837890625, 4.94122314453125, 5.1015625]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 3.0, 11.0, 8.0, 6.0, 17.0, 19.0, 27.0, 33.0, 41.0, 54.0, 63.0, 87.0, 154.0, 301.0, 705.0, 3112.0, 73598.0, 3022724.0, 40903.0, 2447.0, 592.0, 270.0, 168.0, 82.0, 66.0, 56.0, 34.0, 27.0, 18.0, 24.0, 20.0, 8.0, 6.0, 7.0, 12.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0703125, -10.72900390625, -10.3876953125, -10.04638671875, -9.705078125, -9.36376953125, -9.0224609375, -8.68115234375, -8.33984375, -7.99853515625, -7.6572265625, -7.31591796875, -6.974609375, -6.63330078125, -6.2919921875, -5.95068359375, -5.609375, -5.26806640625, -4.9267578125, -4.58544921875, -4.244140625, -3.90283203125, -3.5615234375, -3.22021484375, -2.87890625, -2.53759765625, -2.1962890625, -1.85498046875, -1.513671875, -1.17236328125, -0.8310546875, -0.48974609375, -0.1484375, 0.19287109375, 0.5341796875, 0.87548828125, 1.216796875, 1.55810546875, 1.8994140625, 2.24072265625, 2.58203125, 2.92333984375, 3.2646484375, 3.60595703125, 3.947265625, 4.28857421875, 4.6298828125, 4.97119140625, 5.3125, 5.65380859375, 5.9951171875, 6.33642578125, 6.677734375, 7.01904296875, 7.3603515625, 7.70166015625, 8.04296875, 8.38427734375, 8.7255859375, 9.06689453125, 9.408203125, 9.74951171875, 10.0908203125, 10.43212890625, 10.7734375]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [16.0, 441.0, 548.0, 10.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.105020523071289, -2.1163346767425537, -0.12764883041381836, 1.861037254333496, 3.8497228622436523, 5.838408470153809, 7.827095031738281, 9.815780639648438, 11.804466247558594, 13.79315185546875, 15.781837463378906, 17.770523071289062, 19.75920867919922, 21.747894287109375, 23.736581802368164, 25.72526741027832, 27.713953018188477, 29.702638626098633, 31.69132423400879, 33.68001174926758, 35.668697357177734, 37.65738296508789, 39.64606857299805, 41.6347541809082, 43.62343978881836, 45.612125396728516, 47.60081100463867, 49.58949661254883, 51.578182220458984, 53.56686782836914, 55.55555725097656, 57.54424285888672, 59.532928466796875, 61.52161407470703, 63.51029968261719, 65.49898529052734, 67.4876708984375, 69.47635650634766, 71.46504211425781, 73.45372772216797, 75.44241333007812, 77.43109893798828, 79.41978454589844, 81.4084701538086, 83.39715576171875, 85.3858413696289, 87.37452697753906, 89.36321258544922, 91.35189819335938, 93.34058380126953, 95.32926940917969, 97.31795501708984, 99.306640625, 101.29532623291016, 103.28401184082031, 105.27269744873047, 107.26139068603516, 109.25007629394531, 111.23876190185547, 113.22744750976562, 115.21613311767578, 117.20481872558594, 119.1935043334961, 121.18218994140625, 123.1708755493164]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 3.0, 6.0, 7.0, 8.0, 9.0, 8.0, 11.0, 11.0, 17.0, 20.0, 20.0, 21.0, 26.0, 26.0, 28.0, 27.0, 24.0, 21.0, 36.0, 26.0, 42.0, 37.0, 39.0, 38.0, 29.0, 41.0, 48.0, 38.0, 29.0, 35.0, 32.0, 27.0, 30.0, 31.0, 23.0, 11.0, 15.0, 19.0, 13.0, 19.0, 13.0, 13.0, 5.0, 4.0, 2.0, 5.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.06462860107422, -15.56001091003418, -15.05539321899414, -14.550775527954102, -14.046157836914062, -13.541540145874023, -13.036921501159668, -12.532303810119629, -12.02768611907959, -11.52306842803955, -11.018450736999512, -10.513833045959473, -10.009214401245117, -9.504596710205078, -8.999979019165039, -8.495361328125, -7.990743637084961, -7.486125946044922, -6.981508255004883, -6.4768900871276855, -5.9722723960876465, -5.467654705047607, -4.96303653717041, -4.458418846130371, -3.953801155090332, -3.449183464050293, -2.944565534591675, -2.4399476051330566, -1.9353299140930176, -1.4307122230529785, -0.9260942935943604, -0.4214763641357422, 0.08314132690429688, 0.5877591371536255, 1.092376947402954, 1.5969947576522827, 2.1016125679016113, 2.6062302589416504, 3.1108481884002686, 3.6154661178588867, 4.120083808898926, 4.624701499938965, 5.129319190979004, 5.633937358856201, 6.13855504989624, 6.643172740936279, 7.147790908813477, 7.652408599853516, 8.157026290893555, 8.661643981933594, 9.166261672973633, 9.670879364013672, 10.175497055053711, 10.68011474609375, 11.184733390808105, 11.689351081848145, 12.193968772888184, 12.698586463928223, 13.203204154968262, 13.7078218460083, 14.212440490722656, 14.717058181762695, 15.221675872802734, 15.726293563842773, 16.230911254882812]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 6.0, 8.0, 10.0, 10.0, 9.0, 12.0, 9.0, 14.0, 12.0, 18.0, 21.0, 18.0, 10.0, 20.0, 33.0, 21.0, 42.0, 32.0, 46.0, 41.0, 56.0, 50.0, 38.0, 44.0, 34.0, 43.0, 38.0, 29.0, 22.0, 35.0, 27.0, 31.0, 24.0, 30.0, 26.0, 14.0, 25.0, 7.0, 7.0, 9.0, 4.0, 1.0, 5.0, 8.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5673828125, -1.5173492431640625, -1.467315673828125, -1.4172821044921875, -1.36724853515625, -1.3172149658203125, -1.267181396484375, -1.2171478271484375, -1.1671142578125, -1.1170806884765625, -1.067047119140625, -1.0170135498046875, -0.96697998046875, -0.9169464111328125, -0.866912841796875, -0.8168792724609375, -0.766845703125, -0.7168121337890625, -0.666778564453125, -0.6167449951171875, -0.56671142578125, -0.5166778564453125, -0.466644287109375, -0.4166107177734375, -0.3665771484375, -0.3165435791015625, -0.266510009765625, -0.2164764404296875, -0.16644287109375, -0.1164093017578125, -0.066375732421875, -0.0163421630859375, 0.03369140625, 0.0837249755859375, 0.133758544921875, 0.1837921142578125, 0.23382568359375, 0.2838592529296875, 0.333892822265625, 0.3839263916015625, 0.4339599609375, 0.4839935302734375, 0.534027099609375, 0.5840606689453125, 0.63409423828125, 0.6841278076171875, 0.734161376953125, 0.7841949462890625, 0.834228515625, 0.8842620849609375, 0.934295654296875, 0.9843292236328125, 1.03436279296875, 1.0843963623046875, 1.134429931640625, 1.1844635009765625, 1.2344970703125, 1.2845306396484375, 1.334564208984375, 1.3845977783203125, 1.43463134765625, 1.4846649169921875, 1.534698486328125, 1.5847320556640625, 1.634765625]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 2.0, 2.0, 6.0, 6.0, 6.0, 14.0, 8.0, 8.0, 19.0, 22.0, 17.0, 22.0, 44.0, 70.0, 116.0, 179.0, 371.0, 833.0, 2289.0, 7603.0, 33281.0, 211460.0, 1460883.0, 2016106.0, 389176.0, 54733.0, 11623.0, 3252.0, 1105.0, 433.0, 203.0, 115.0, 82.0, 52.0, 41.0, 25.0, 13.0, 19.0, 12.0, 5.0, 8.0, 11.0, 4.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.376953125, -3.264923095703125, -3.15289306640625, -3.040863037109375, -2.9288330078125, -2.816802978515625, -2.70477294921875, -2.592742919921875, -2.480712890625, -2.368682861328125, -2.25665283203125, -2.144622802734375, -2.0325927734375, -1.920562744140625, -1.80853271484375, -1.696502685546875, -1.58447265625, -1.472442626953125, -1.36041259765625, -1.248382568359375, -1.1363525390625, -1.024322509765625, -0.91229248046875, -0.800262451171875, -0.688232421875, -0.576202392578125, -0.46417236328125, -0.352142333984375, -0.2401123046875, -0.128082275390625, -0.01605224609375, 0.095977783203125, 0.2080078125, 0.320037841796875, 0.43206787109375, 0.544097900390625, 0.6561279296875, 0.768157958984375, 0.88018798828125, 0.992218017578125, 1.104248046875, 1.216278076171875, 1.32830810546875, 1.440338134765625, 1.5523681640625, 1.664398193359375, 1.77642822265625, 1.888458251953125, 2.00048828125, 2.112518310546875, 2.22454833984375, 2.336578369140625, 2.4486083984375, 2.560638427734375, 2.67266845703125, 2.784698486328125, 2.896728515625, 3.008758544921875, 3.12078857421875, 3.232818603515625, 3.3448486328125, 3.456878662109375, 3.56890869140625, 3.680938720703125, 3.79296875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 5.0, 7.0, 6.0, 7.0, 17.0, 11.0, 15.0, 31.0, 39.0, 40.0, 70.0, 73.0, 119.0, 142.0, 190.0, 265.0, 301.0, 405.0, 389.0, 419.0, 306.0, 286.0, 223.0, 154.0, 135.0, 97.0, 87.0, 53.0, 55.0, 28.0, 26.0, 20.0, 10.0, 10.0, 12.0, 5.0, 3.0, 7.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.7578125, -3.63153076171875, -3.5052490234375, -3.37896728515625, -3.252685546875, -3.12640380859375, -3.0001220703125, -2.87384033203125, -2.74755859375, -2.62127685546875, -2.4949951171875, -2.36871337890625, -2.242431640625, -2.11614990234375, -1.9898681640625, -1.86358642578125, -1.7373046875, -1.61102294921875, -1.4847412109375, -1.35845947265625, -1.232177734375, -1.10589599609375, -0.9796142578125, -0.85333251953125, -0.72705078125, -0.60076904296875, -0.4744873046875, -0.34820556640625, -0.221923828125, -0.09564208984375, 0.0306396484375, 0.15692138671875, 0.283203125, 0.40948486328125, 0.5357666015625, 0.66204833984375, 0.788330078125, 0.91461181640625, 1.0408935546875, 1.16717529296875, 1.29345703125, 1.41973876953125, 1.5460205078125, 1.67230224609375, 1.798583984375, 1.92486572265625, 2.0511474609375, 2.17742919921875, 2.3037109375, 2.42999267578125, 2.5562744140625, 2.68255615234375, 2.808837890625, 2.93511962890625, 3.0614013671875, 3.18768310546875, 3.31396484375, 3.44024658203125, 3.5665283203125, 3.69281005859375, 3.819091796875, 3.94537353515625, 4.0716552734375, 4.19793701171875, 4.32421875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 10.0, 12.0, 23.0, 35.0, 55.0, 97.0, 172.0, 478.0, 2740.0, 153447.0, 3952261.0, 82074.0, 2082.0, 415.0, 165.0, 99.0, 50.0, 20.0, 22.0, 8.0, 5.0, 6.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-24.53125, -23.9532470703125, -23.375244140625, -22.7972412109375, -22.21923828125, -21.6412353515625, -21.063232421875, -20.4852294921875, -19.9072265625, -19.3292236328125, -18.751220703125, -18.1732177734375, -17.59521484375, -17.0172119140625, -16.439208984375, -15.8612060546875, -15.283203125, -14.7052001953125, -14.127197265625, -13.5491943359375, -12.97119140625, -12.3931884765625, -11.815185546875, -11.2371826171875, -10.6591796875, -10.0811767578125, -9.503173828125, -8.9251708984375, -8.34716796875, -7.7691650390625, -7.191162109375, -6.6131591796875, -6.03515625, -5.4571533203125, -4.879150390625, -4.3011474609375, -3.72314453125, -3.1451416015625, -2.567138671875, -1.9891357421875, -1.4111328125, -0.8331298828125, -0.255126953125, 0.3228759765625, 0.90087890625, 1.4788818359375, 2.056884765625, 2.6348876953125, 3.212890625, 3.7908935546875, 4.368896484375, 4.9468994140625, 5.52490234375, 6.1029052734375, 6.680908203125, 7.2589111328125, 7.8369140625, 8.4149169921875, 8.992919921875, 9.5709228515625, 10.14892578125, 10.7269287109375, 11.304931640625, 11.8829345703125, 12.4609375]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 7.0, 14.0, 42.0, 75.0, 109.0, 184.0, 195.0, 167.0, 115.0, 57.0, 30.0, 12.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.153446197509766, -42.1279411315918, -41.102439880371094, -40.076934814453125, -39.051429748535156, -38.02592468261719, -37.00041961669922, -35.974918365478516, -34.94941329956055, -33.92390823364258, -32.898406982421875, -31.872901916503906, -30.847396850585938, -29.82189178466797, -28.796388626098633, -27.770885467529297, -26.745380401611328, -25.71987533569336, -24.694372177124023, -23.668869018554688, -22.64336395263672, -21.61785888671875, -20.592355728149414, -19.566852569580078, -18.54134750366211, -17.51584243774414, -16.490339279174805, -15.464835166931152, -14.4393310546875, -13.413826942443848, -12.388322830200195, -11.362818717956543, -10.33731460571289, -9.311810493469238, -8.286306381225586, -7.260802268981934, -6.235298156738281, -5.209794044494629, -4.184289932250977, -3.158785820007324, -2.133281707763672, -1.1077775955200195, -0.08227348327636719, 0.9432306289672852, 1.9687347412109375, 2.99423885345459, 4.019742965698242, 5.0452470779418945, 6.070751190185547, 7.096255302429199, 8.121759414672852, 9.147263526916504, 10.172767639160156, 11.198271751403809, 12.223775863647461, 13.249279975891113, 14.274784088134766, 15.300288200378418, 16.32579231262207, 17.351295471191406, 18.376800537109375, 19.402305603027344, 20.42780876159668, 21.453311920166016, 22.478816986083984]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 3.0, 5.0, 8.0, 6.0, 7.0, 10.0, 9.0, 15.0, 11.0, 18.0, 25.0, 18.0, 24.0, 23.0, 36.0, 29.0, 26.0, 24.0, 31.0, 44.0, 28.0, 33.0, 30.0, 36.0, 42.0, 41.0, 39.0, 45.0, 31.0, 42.0, 33.0, 29.0, 29.0, 21.0, 28.0, 27.0, 16.0, 18.0, 18.0, 17.0, 8.0, 7.0, 8.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.86210823059082, -12.397945404052734, -11.933783531188965, -11.469621658325195, -11.00545883178711, -10.541296005249023, -10.077134132385254, -9.612972259521484, -9.148809432983398, -8.684646606445312, -8.220484733581543, -7.756322383880615, -7.2921600341796875, -6.82799768447876, -6.363835334777832, -5.899672985076904, -5.435510635375977, -4.971348285675049, -4.507185935974121, -4.043023586273193, -3.5788612365722656, -3.114698886871338, -2.65053653717041, -2.1863741874694824, -1.7222118377685547, -1.258049488067627, -0.7938871383666992, -0.3297247886657715, 0.13443756103515625, 0.598599910736084, 1.0627622604370117, 1.5269246101379395, 1.9910869598388672, 2.455249309539795, 2.9194116592407227, 3.3835740089416504, 3.847736358642578, 4.311898708343506, 4.776061058044434, 5.240223407745361, 5.704385757446289, 6.168548107147217, 6.6327104568481445, 7.096872806549072, 7.56103515625, 8.025197982788086, 8.489359855651855, 8.953521728515625, 9.417684555053711, 9.881847381591797, 10.346009254455566, 10.810171127319336, 11.274333953857422, 11.738496780395508, 12.202658653259277, 12.666820526123047, 13.130983352661133, 13.595146179199219, 14.059308052062988, 14.523469924926758, 14.987632751464844, 15.45179557800293, 15.9159574508667, 16.38011932373047, 16.844282150268555]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 5.0, 10.0, 5.0, 11.0, 7.0, 10.0, 10.0, 16.0, 12.0, 15.0, 15.0, 18.0, 11.0, 22.0, 33.0, 27.0, 34.0, 41.0, 36.0, 32.0, 40.0, 52.0, 35.0, 39.0, 30.0, 36.0, 42.0, 40.0, 40.0, 28.0, 34.0, 22.0, 23.0, 26.0, 21.0, 25.0, 19.0, 15.0, 9.0, 12.0, 8.0, 7.0, 4.0, 4.0, 8.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0], "bins": [-1.669921875, -1.621978759765625, -1.57403564453125, -1.526092529296875, -1.4781494140625, -1.430206298828125, -1.38226318359375, -1.334320068359375, -1.286376953125, -1.238433837890625, -1.19049072265625, -1.142547607421875, -1.0946044921875, -1.046661376953125, -0.99871826171875, -0.950775146484375, -0.90283203125, -0.854888916015625, -0.80694580078125, -0.759002685546875, -0.7110595703125, -0.663116455078125, -0.61517333984375, -0.567230224609375, -0.519287109375, -0.471343994140625, -0.42340087890625, -0.375457763671875, -0.3275146484375, -0.279571533203125, -0.23162841796875, -0.183685302734375, -0.1357421875, -0.087799072265625, -0.03985595703125, 0.008087158203125, 0.0560302734375, 0.103973388671875, 0.15191650390625, 0.199859619140625, 0.247802734375, 0.295745849609375, 0.34368896484375, 0.391632080078125, 0.4395751953125, 0.487518310546875, 0.53546142578125, 0.583404541015625, 0.63134765625, 0.679290771484375, 0.72723388671875, 0.775177001953125, 0.8231201171875, 0.871063232421875, 0.91900634765625, 0.966949462890625, 1.014892578125, 1.062835693359375, 1.11077880859375, 1.158721923828125, 1.2066650390625, 1.254608154296875, 1.30255126953125, 1.350494384765625, 1.3984375]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 4.0, 3.0, 15.0, 9.0, 16.0, 29.0, 46.0, 53.0, 113.0, 162.0, 219.0, 289.0, 438.0, 569.0, 797.0, 1077.0, 1569.0, 2122.0, 2902.0, 4109.0, 5914.0, 8265.0, 11448.0, 16411.0, 23927.0, 35521.0, 55488.0, 90266.0, 160143.0, 239834.0, 144633.0, 82602.0, 50952.0, 32832.0, 22306.0, 15197.0, 10939.0, 7751.0, 5525.0, 4006.0, 2856.0, 2023.0, 1432.0, 1141.0, 810.0, 513.0, 450.0, 235.0, 197.0, 146.0, 86.0, 57.0, 64.0, 26.0, 17.0, 10.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2490234375, -0.24109649658203125, -0.2331695556640625, -0.22524261474609375, -0.217315673828125, -0.20938873291015625, -0.2014617919921875, -0.19353485107421875, -0.18560791015625, -0.17768096923828125, -0.1697540283203125, -0.16182708740234375, -0.153900146484375, -0.14597320556640625, -0.1380462646484375, -0.13011932373046875, -0.1221923828125, -0.11426544189453125, -0.1063385009765625, -0.09841156005859375, -0.090484619140625, -0.08255767822265625, -0.0746307373046875, -0.06670379638671875, -0.05877685546875, -0.05084991455078125, -0.0429229736328125, -0.03499603271484375, -0.027069091796875, -0.01914215087890625, -0.0112152099609375, -0.00328826904296875, 0.004638671875, 0.01256561279296875, 0.0204925537109375, 0.02841949462890625, 0.036346435546875, 0.04427337646484375, 0.0522003173828125, 0.06012725830078125, 0.06805419921875, 0.07598114013671875, 0.0839080810546875, 0.09183502197265625, 0.099761962890625, 0.10768890380859375, 0.1156158447265625, 0.12354278564453125, 0.1314697265625, 0.13939666748046875, 0.1473236083984375, 0.15525054931640625, 0.163177490234375, 0.17110443115234375, 0.1790313720703125, 0.18695831298828125, 0.19488525390625, 0.20281219482421875, 0.2107391357421875, 0.21866607666015625, 0.226593017578125, 0.23451995849609375, 0.2424468994140625, 0.25037384033203125, 0.25830078125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 9.0, 7.0, 10.0, 7.0, 6.0, 11.0, 15.0, 19.0, 20.0, 25.0, 23.0, 33.0, 28.0, 19.0, 31.0, 40.0, 46.0, 31.0, 42.0, 49.0, 1058.0, 35.0, 44.0, 31.0, 52.0, 32.0, 32.0, 32.0, 28.0, 22.0, 21.0, 18.0, 18.0, 20.0, 24.0, 18.0, 14.0, 10.0, 8.0, 10.0, 6.0, 7.0, 1.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.025390625, -0.9940109252929688, -0.9626312255859375, -0.9312515258789062, -0.899871826171875, -0.8684921264648438, -0.8371124267578125, -0.8057327270507812, -0.77435302734375, -0.7429733276367188, -0.7115936279296875, -0.6802139282226562, -0.648834228515625, -0.6174545288085938, -0.5860748291015625, -0.5546951293945312, -0.5233154296875, -0.49193572998046875, -0.4605560302734375, -0.42917633056640625, -0.397796630859375, -0.36641693115234375, -0.3350372314453125, -0.30365753173828125, -0.27227783203125, -0.24089813232421875, -0.2095184326171875, -0.17813873291015625, -0.146759033203125, -0.11537933349609375, -0.0839996337890625, -0.05261993408203125, -0.021240234375, 0.01013946533203125, 0.0415191650390625, 0.07289886474609375, 0.104278564453125, 0.13565826416015625, 0.1670379638671875, 0.19841766357421875, 0.22979736328125, 0.26117706298828125, 0.2925567626953125, 0.32393646240234375, 0.355316162109375, 0.38669586181640625, 0.4180755615234375, 0.44945526123046875, 0.4808349609375, 0.5122146606445312, 0.5435943603515625, 0.5749740600585938, 0.606353759765625, 0.6377334594726562, 0.6691131591796875, 0.7004928588867188, 0.73187255859375, 0.7632522583007812, 0.7946319580078125, 0.8260116577148438, 0.857391357421875, 0.8887710571289062, 0.9201507568359375, 0.9515304565429688, 0.98291015625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 9.0, 8.0, 10.0, 15.0, 19.0, 47.0, 53.0, 81.0, 130.0, 216.0, 274.0, 368.0, 621.0, 902.0, 1223.0, 1823.0, 2626.0, 4053.0, 5755.0, 8518.0, 12679.0, 18980.0, 29341.0, 47612.0, 82815.0, 161117.0, 1337754.0, 162145.0, 83089.0, 47815.0, 29637.0, 18921.0, 12262.0, 8278.0, 5640.0, 3751.0, 2665.0, 1791.0, 1293.0, 845.0, 637.0, 427.0, 269.0, 199.0, 145.0, 91.0, 74.0, 37.0, 33.0, 18.0, 9.0, 12.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.27685546875, -0.2683372497558594, -0.25981903076171875, -0.2513008117675781, -0.2427825927734375, -0.23426437377929688, -0.22574615478515625, -0.21722793579101562, -0.208709716796875, -0.20019149780273438, -0.19167327880859375, -0.18315505981445312, -0.1746368408203125, -0.16611862182617188, -0.15760040283203125, -0.14908218383789062, -0.14056396484375, -0.13204574584960938, -0.12352752685546875, -0.11500930786132812, -0.1064910888671875, -0.09797286987304688, -0.08945465087890625, -0.08093643188476562, -0.072418212890625, -0.06389999389648438, -0.05538177490234375, -0.046863555908203125, -0.0383453369140625, -0.029827117919921875, -0.02130889892578125, -0.012790679931640625, -0.0042724609375, 0.004245758056640625, 0.01276397705078125, 0.021282196044921875, 0.0298004150390625, 0.038318634033203125, 0.04683685302734375, 0.055355072021484375, 0.063873291015625, 0.07239151000976562, 0.08090972900390625, 0.08942794799804688, 0.0979461669921875, 0.10646438598632812, 0.11498260498046875, 0.12350082397460938, 0.13201904296875, 0.14053726196289062, 0.14905548095703125, 0.15757369995117188, 0.1660919189453125, 0.17461013793945312, 0.18312835693359375, 0.19164657592773438, 0.200164794921875, 0.20868301391601562, 0.21720123291015625, 0.22571945190429688, 0.2342376708984375, 0.24275588989257812, 0.25127410888671875, 0.2597923278808594, 0.268310546875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 7.0, 5.0, 5.0, 14.0, 14.0, 14.0, 15.0, 18.0, 22.0, 28.0, 37.0, 37.0, 33.0, 62.0, 50.0, 51.0, 49.0, 67.0, 47.0, 54.0, 50.0, 48.0, 42.0, 36.0, 40.0, 24.0, 30.0, 20.0, 17.0, 15.0, 7.0, 6.0, 3.0, 8.0, 2.0, 9.0, 3.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013875961303710938, -0.0001340322196483612, -0.00012930482625961304, -0.00012457743287086487, -0.0001198500394821167, -0.00011512264609336853, -0.00011039525270462036, -0.00010566785931587219, -0.00010094046592712402, -9.621307253837585e-05, -9.148567914962769e-05, -8.675828576087952e-05, -8.203089237213135e-05, -7.730349898338318e-05, -7.257610559463501e-05, -6.784871220588684e-05, -6.312131881713867e-05, -5.83939254283905e-05, -5.3666532039642334e-05, -4.8939138650894165e-05, -4.4211745262145996e-05, -3.948435187339783e-05, -3.475695848464966e-05, -3.002956509590149e-05, -2.530217170715332e-05, -2.057477831840515e-05, -1.5847384929656982e-05, -1.1119991540908813e-05, -6.3925981521606445e-06, -1.6652047634124756e-06, 3.0621886253356934e-06, 7.789582014083862e-06, 1.2516975402832031e-05, 1.72443687915802e-05, 2.197176218032837e-05, 2.6699155569076538e-05, 3.142654895782471e-05, 3.6153942346572876e-05, 4.0881335735321045e-05, 4.5608729124069214e-05, 5.033612251281738e-05, 5.506351590156555e-05, 5.979090929031372e-05, 6.451830267906189e-05, 6.924569606781006e-05, 7.397308945655823e-05, 7.87004828453064e-05, 8.342787623405457e-05, 8.815526962280273e-05, 9.28826630115509e-05, 9.761005640029907e-05, 0.00010233744978904724, 0.00010706484317779541, 0.00011179223656654358, 0.00011651962995529175, 0.00012124702334403992, 0.00012597441673278809, 0.00013070181012153625, 0.00013542920351028442, 0.0001401565968990326, 0.00014488399028778076, 0.00014961138367652893, 0.0001543387770652771, 0.00015906617045402527, 0.00016379356384277344]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 2.0, 2.0, 5.0, 3.0, 12.0, 6.0, 13.0, 5.0, 9.0, 16.0, 12.0, 36.0, 44.0, 64.0, 67.0, 101.0, 162.0, 187.0, 282.0, 483.0, 999.0, 80256.0, 957159.0, 6674.0, 659.0, 392.0, 249.0, 173.0, 119.0, 82.0, 63.0, 59.0, 33.0, 26.0, 26.0, 16.0, 13.0, 14.0, 11.0, 10.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0032215118408203125, -0.0031276047229766846, -0.0030336976051330566, -0.0029397904872894287, -0.0028458833694458008, -0.002751976251602173, -0.002658069133758545, -0.002564162015914917, -0.002470254898071289, -0.002376347780227661, -0.002282440662384033, -0.0021885335445404053, -0.0020946264266967773, -0.0020007193088531494, -0.0019068121910095215, -0.0018129050731658936, -0.0017189979553222656, -0.0016250908374786377, -0.0015311837196350098, -0.0014372766017913818, -0.001343369483947754, -0.001249462366104126, -0.001155555248260498, -0.0010616481304168701, -0.0009677410125732422, -0.0008738338947296143, -0.0007799267768859863, -0.0006860196590423584, -0.0005921125411987305, -0.0004982054233551025, -0.0004042983055114746, -0.0003103911876678467, -0.00021648406982421875, -0.00012257695198059082, -2.866983413696289e-05, 6.523728370666504e-05, 0.00015914440155029297, 0.0002530515193939209, 0.00034695863723754883, 0.00044086575508117676, 0.0005347728729248047, 0.0006286799907684326, 0.0007225871086120605, 0.0008164942264556885, 0.0009104013442993164, 0.0010043084621429443, 0.0010982155799865723, 0.0011921226978302002, 0.0012860298156738281, 0.001379936933517456, 0.001473844051361084, 0.001567751169204712, 0.0016616582870483398, 0.0017555654048919678, 0.0018494725227355957, 0.0019433796405792236, 0.0020372867584228516, 0.0021311938762664795, 0.0022251009941101074, 0.0023190081119537354, 0.0024129152297973633, 0.002506822347640991, 0.002600729465484619, 0.002694636583328247, 0.002788543701171875]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 10.0, 65.0, 299.0, 409.0, 196.0, 30.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004159118980169296, -0.0004017203173134476, -0.00038752873660996556, -0.00037333715590648353, -0.0003591455752030015, -0.00034495399449951947, -0.00033076241379603744, -0.00031657086219638586, -0.00030237925238907337, -0.00028818767168559134, -0.0002739960909821093, -0.0002598045102786273, -0.00024561292957514524, -0.0002314213488716632, -0.0002172297827200964, -0.00020303820201661438, -0.00018884663586504757, -0.00017465505516156554, -0.0001604634744580835, -0.00014627189375460148, -0.00013208031305111945, -0.00011788873962359503, -0.00010369716619607061, -8.950558549258858e-05, -7.531400478910655e-05, -6.112242408562452e-05, -4.693084702012129e-05, -3.2739269954618067e-05, -1.8547689251136035e-05, -4.356108547654003e-06, 9.835464879870415e-06, 2.4027045583352447e-05, 3.821862628683448e-05, 5.241020699031651e-05, 6.660178769379854e-05, 8.079336112132296e-05, 9.498494182480499e-05, 0.00010917652252828702, 0.00012336809595581144, 0.00013755967665929347, 0.0001517512573627755, 0.00016594283806625754, 0.00018013441876973957, 0.00019432598492130637, 0.0002085175656247884, 0.00022270914632827044, 0.00023690072703175247, 0.0002510923077352345, 0.00026528388843871653, 0.00027947546914219856, 0.0002936670498456806, 0.0003078586305491626, 0.00032205021125264466, 0.0003362417919561267, 0.00035043334355577826, 0.00036462495336309075, 0.00037881650496274233, 0.00039300808566622436, 0.0004071996663697064, 0.0004213912470731884, 0.00043558282777667046, 0.0004497744084801525, 0.0004639659891836345, 0.0004781575407832861, 0.0004923491505905986]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 9.0, 5.0, 12.0, 15.0, 21.0, 20.0, 22.0, 34.0, 40.0, 36.0, 38.0, 41.0, 40.0, 37.0, 43.0, 43.0, 47.0, 35.0, 39.0, 50.0, 48.0, 35.0, 39.0, 35.0, 34.0, 26.0, 21.0, 24.0, 18.0, 20.0, 15.0, 11.0, 14.0, 10.0, 5.0, 1.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.690357208251953e-05, -8.42418521642685e-05, -8.158013224601746e-05, -7.891841232776642e-05, -7.625669240951538e-05, -7.359497249126434e-05, -7.09332525730133e-05, -6.827153265476227e-05, -6.560981273651123e-05, -6.294809281826019e-05, -6.0286372900009155e-05, -5.762465298175812e-05, -5.496293306350708e-05, -5.230121314525604e-05, -4.9639493227005005e-05, -4.697777330875397e-05, -4.431605339050293e-05, -4.165433347225189e-05, -3.8992613554000854e-05, -3.633089363574982e-05, -3.366917371749878e-05, -3.100745379924774e-05, -2.8345733880996704e-05, -2.5684013962745667e-05, -2.302229404449463e-05, -2.036057412624359e-05, -1.7698854207992554e-05, -1.5037134289741516e-05, -1.2375414371490479e-05, -9.713694453239441e-06, -7.051974534988403e-06, -4.390254616737366e-06, -1.7285346984863281e-06, 9.331852197647095e-07, 3.594905138015747e-06, 6.256625056266785e-06, 8.918344974517822e-06, 1.158006489276886e-05, 1.4241784811019897e-05, 1.6903504729270935e-05, 1.9565224647521973e-05, 2.222694456577301e-05, 2.4888664484024048e-05, 2.7550384402275085e-05, 3.0212104320526123e-05, 3.287382423877716e-05, 3.55355441570282e-05, 3.8197264075279236e-05, 4.0858983993530273e-05, 4.352070391178131e-05, 4.618242383003235e-05, 4.8844143748283386e-05, 5.1505863666534424e-05, 5.416758358478546e-05, 5.68293035030365e-05, 5.949102342128754e-05, 6.215274333953857e-05, 6.481446325778961e-05, 6.747618317604065e-05, 7.013790309429169e-05, 7.279962301254272e-05, 7.546134293079376e-05, 7.81230628490448e-05, 8.078478276729584e-05, 8.344650268554688e-05]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 5.0, 10.0, 5.0, 11.0, 7.0, 10.0, 10.0, 16.0, 12.0, 15.0, 15.0, 18.0, 11.0, 22.0, 33.0, 27.0, 34.0, 41.0, 36.0, 32.0, 40.0, 52.0, 35.0, 39.0, 30.0, 36.0, 42.0, 40.0, 40.0, 28.0, 34.0, 22.0, 23.0, 26.0, 21.0, 25.0, 19.0, 15.0, 9.0, 12.0, 8.0, 7.0, 4.0, 4.0, 8.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0], "bins": [-1.669921875, -1.621978759765625, -1.57403564453125, -1.526092529296875, -1.4781494140625, -1.430206298828125, -1.38226318359375, -1.334320068359375, -1.286376953125, -1.238433837890625, -1.19049072265625, -1.142547607421875, -1.0946044921875, -1.046661376953125, -0.99871826171875, -0.950775146484375, -0.90283203125, -0.854888916015625, -0.80694580078125, -0.759002685546875, -0.7110595703125, -0.663116455078125, -0.61517333984375, -0.567230224609375, -0.519287109375, -0.471343994140625, -0.42340087890625, -0.375457763671875, -0.3275146484375, -0.279571533203125, -0.23162841796875, -0.183685302734375, -0.1357421875, -0.087799072265625, -0.03985595703125, 0.008087158203125, 0.0560302734375, 0.103973388671875, 0.15191650390625, 0.199859619140625, 0.247802734375, 0.295745849609375, 0.34368896484375, 0.391632080078125, 0.4395751953125, 0.487518310546875, 0.53546142578125, 0.583404541015625, 0.63134765625, 0.679290771484375, 0.72723388671875, 0.775177001953125, 0.8231201171875, 0.871063232421875, 0.91900634765625, 0.966949462890625, 1.014892578125, 1.062835693359375, 1.11077880859375, 1.158721923828125, 1.2066650390625, 1.254608154296875, 1.30255126953125, 1.350494384765625, 1.3984375]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 5.0, 3.0, 7.0, 7.0, 12.0, 16.0, 24.0, 20.0, 42.0, 54.0, 84.0, 110.0, 183.0, 287.0, 433.0, 708.0, 1186.0, 1847.0, 3170.0, 5639.0, 10444.0, 21015.0, 43724.0, 91790.0, 175495.0, 250345.0, 209469.0, 118205.0, 57007.0, 26961.0, 13308.0, 7014.0, 3871.0, 2297.0, 1350.0, 877.0, 528.0, 336.0, 231.0, 156.0, 96.0, 60.0, 46.0, 25.0, 22.0, 16.0, 7.0, 8.0, 7.0, 10.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.2685546875, -1.229736328125, -1.19091796875, -1.152099609375, -1.11328125, -1.074462890625, -1.03564453125, -0.996826171875, -0.9580078125, -0.919189453125, -0.88037109375, -0.841552734375, -0.802734375, -0.763916015625, -0.72509765625, -0.686279296875, -0.6474609375, -0.608642578125, -0.56982421875, -0.531005859375, -0.4921875, -0.453369140625, -0.41455078125, -0.375732421875, -0.3369140625, -0.298095703125, -0.25927734375, -0.220458984375, -0.181640625, -0.142822265625, -0.10400390625, -0.065185546875, -0.0263671875, 0.012451171875, 0.05126953125, 0.090087890625, 0.12890625, 0.167724609375, 0.20654296875, 0.245361328125, 0.2841796875, 0.322998046875, 0.36181640625, 0.400634765625, 0.439453125, 0.478271484375, 0.51708984375, 0.555908203125, 0.5947265625, 0.633544921875, 0.67236328125, 0.711181640625, 0.75, 0.788818359375, 0.82763671875, 0.866455078125, 0.9052734375, 0.944091796875, 0.98291015625, 1.021728515625, 1.060546875, 1.099365234375, 1.13818359375, 1.177001953125, 1.2158203125]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 6.0, 5.0, 10.0, 9.0, 10.0, 14.0, 14.0, 14.0, 14.0, 18.0, 22.0, 18.0, 30.0, 34.0, 36.0, 42.0, 36.0, 39.0, 80.0, 170.0, 336.0, 1387.0, 185.0, 90.0, 57.0, 50.0, 36.0, 36.0, 35.0, 21.0, 31.0, 18.0, 26.0, 24.0, 13.0, 13.0, 13.0, 15.0, 7.0, 8.0, 5.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.84765625, -5.6761474609375, -5.504638671875, -5.3331298828125, -5.16162109375, -4.9901123046875, -4.818603515625, -4.6470947265625, -4.4755859375, -4.3040771484375, -4.132568359375, -3.9610595703125, -3.78955078125, -3.6180419921875, -3.446533203125, -3.2750244140625, -3.103515625, -2.9320068359375, -2.760498046875, -2.5889892578125, -2.41748046875, -2.2459716796875, -2.074462890625, -1.9029541015625, -1.7314453125, -1.5599365234375, -1.388427734375, -1.2169189453125, -1.04541015625, -0.8739013671875, -0.702392578125, -0.5308837890625, -0.359375, -0.1878662109375, -0.016357421875, 0.1551513671875, 0.32666015625, 0.4981689453125, 0.669677734375, 0.8411865234375, 1.0126953125, 1.1842041015625, 1.355712890625, 1.5272216796875, 1.69873046875, 1.8702392578125, 2.041748046875, 2.2132568359375, 2.384765625, 2.5562744140625, 2.727783203125, 2.8992919921875, 3.07080078125, 3.2423095703125, 3.413818359375, 3.5853271484375, 3.7568359375, 3.9283447265625, 4.099853515625, 4.2713623046875, 4.44287109375, 4.6143798828125, 4.785888671875, 4.9573974609375, 5.12890625]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 1.0, 5.0, 3.0, 3.0, 9.0, 14.0, 15.0, 11.0, 17.0, 19.0, 24.0, 30.0, 47.0, 62.0, 72.0, 94.0, 123.0, 225.0, 454.0, 1225.0, 8544.0, 469153.0, 2633216.0, 28648.0, 2122.0, 631.0, 267.0, 187.0, 118.0, 87.0, 62.0, 38.0, 32.0, 33.0, 24.0, 23.0, 17.0, 14.0, 12.0, 5.0, 6.0, 4.0, 5.0, 2.0, 5.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4921875, -9.1778564453125, -8.863525390625, -8.5491943359375, -8.23486328125, -7.9205322265625, -7.606201171875, -7.2918701171875, -6.9775390625, -6.6632080078125, -6.348876953125, -6.0345458984375, -5.72021484375, -5.4058837890625, -5.091552734375, -4.7772216796875, -4.462890625, -4.1485595703125, -3.834228515625, -3.5198974609375, -3.20556640625, -2.8912353515625, -2.576904296875, -2.2625732421875, -1.9482421875, -1.6339111328125, -1.319580078125, -1.0052490234375, -0.69091796875, -0.3765869140625, -0.062255859375, 0.2520751953125, 0.56640625, 0.8807373046875, 1.195068359375, 1.5093994140625, 1.82373046875, 2.1380615234375, 2.452392578125, 2.7667236328125, 3.0810546875, 3.3953857421875, 3.709716796875, 4.0240478515625, 4.33837890625, 4.6527099609375, 4.967041015625, 5.2813720703125, 5.595703125, 5.9100341796875, 6.224365234375, 6.5386962890625, 6.85302734375, 7.1673583984375, 7.481689453125, 7.7960205078125, 8.1103515625, 8.4246826171875, 8.739013671875, 9.0533447265625, 9.36767578125, 9.6820068359375, 9.996337890625, 10.3106689453125, 10.625]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 9.0, 125.0, 449.0, 360.0, 64.0, 9.0, 0.0, 0.0, 0.0, 2.0], "bins": [-72.02841186523438, -70.76129913330078, -69.49418640136719, -68.2270736694336, -66.95996856689453, -65.69285583496094, -64.42574310302734, -63.15863037109375, -61.891517639160156, -60.62440490722656, -59.357295989990234, -58.09018325805664, -56.82307052612305, -55.55595779418945, -54.288848876953125, -53.02173614501953, -51.75462341308594, -50.487510681152344, -49.220401763916016, -47.95328903198242, -46.68617630004883, -45.419063568115234, -44.151954650878906, -42.88484191894531, -41.617733001708984, -40.35062026977539, -39.08351135253906, -37.81639862060547, -36.549285888671875, -35.28217315673828, -34.01506423950195, -32.74795150756836, -31.4808349609375, -30.21372413635254, -28.946611404418945, -27.679500579833984, -26.41238784790039, -25.14527702331543, -23.87816619873047, -22.611053466796875, -21.343942642211914, -20.076831817626953, -18.80971908569336, -17.5426082611084, -16.275495529174805, -15.008384704589844, -13.741272926330566, -12.474161148071289, -11.207049369812012, -9.939937591552734, -8.672825813293457, -7.405714511871338, -6.1386027336120605, -4.871490955352783, -3.604379653930664, -2.3372678756713867, -1.0701560974121094, 0.19695556163787842, 1.4640672206878662, 2.7311787605285645, 3.998290538787842, 5.265402317047119, 6.532513618469238, 7.799625396728516, 9.066737174987793]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 7.0, 3.0, 4.0, 4.0, 10.0, 6.0, 8.0, 8.0, 10.0, 12.0, 20.0, 26.0, 19.0, 32.0, 28.0, 35.0, 27.0, 38.0, 35.0, 33.0, 58.0, 57.0, 48.0, 55.0, 53.0, 52.0, 45.0, 36.0, 49.0, 28.0, 30.0, 19.0, 25.0, 20.0, 16.0, 5.0, 14.0, 10.0, 10.0, 8.0, 5.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.34966278076172, -22.683855056762695, -22.018049240112305, -21.35224151611328, -20.68643569946289, -20.020627975463867, -19.354822158813477, -18.689014434814453, -18.023208618164062, -17.35740089416504, -16.69159507751465, -16.025787353515625, -15.359981536865234, -14.694174766540527, -14.02836799621582, -13.362560272216797, -12.69675350189209, -12.030946731567383, -11.365139961242676, -10.699333190917969, -10.033526420593262, -9.367719650268555, -8.701911926269531, -8.03610610961914, -7.370298862457275, -6.704492092132568, -6.038685321807861, -5.372878074645996, -4.707071304321289, -4.041264533996582, -3.375457763671875, -2.709650993347168, -2.043844223022461, -1.378037452697754, -0.7122305631637573, -0.04642367362976074, 0.6193830966949463, 1.2851898670196533, 1.9509968757629395, 2.6168036460876465, 3.2826104164123535, 3.9484171867370605, 4.614223957061768, 5.280031204223633, 5.94583797454834, 6.611644744873047, 7.277451515197754, 7.943258285522461, 8.609065055847168, 9.274871826171875, 9.940678596496582, 10.606485366821289, 11.272292137145996, 11.938098907470703, 12.603906631469727, 13.269712448120117, 13.93552017211914, 14.601326942443848, 15.267133712768555, 15.932940483093262, 16.59874725341797, 17.264554977416992, 17.930360794067383, 18.596168518066406, 19.261974334716797]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 7.0, 3.0, 6.0, 10.0, 5.0, 9.0, 6.0, 10.0, 17.0, 16.0, 17.0, 11.0, 19.0, 23.0, 23.0, 23.0, 32.0, 33.0, 33.0, 38.0, 38.0, 51.0, 44.0, 44.0, 42.0, 37.0, 31.0, 43.0, 32.0, 23.0, 44.0, 30.0, 26.0, 30.0, 27.0, 17.0, 19.0, 19.0, 14.0, 13.0, 10.0, 9.0, 6.0, 3.0, 3.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-1.8212890625, -1.768798828125, -1.71630859375, -1.663818359375, -1.611328125, -1.558837890625, -1.50634765625, -1.453857421875, -1.4013671875, -1.348876953125, -1.29638671875, -1.243896484375, -1.19140625, -1.138916015625, -1.08642578125, -1.033935546875, -0.9814453125, -0.928955078125, -0.87646484375, -0.823974609375, -0.771484375, -0.718994140625, -0.66650390625, -0.614013671875, -0.5615234375, -0.509033203125, -0.45654296875, -0.404052734375, -0.3515625, -0.299072265625, -0.24658203125, -0.194091796875, -0.1416015625, -0.089111328125, -0.03662109375, 0.015869140625, 0.068359375, 0.120849609375, 0.17333984375, 0.225830078125, 0.2783203125, 0.330810546875, 0.38330078125, 0.435791015625, 0.48828125, 0.540771484375, 0.59326171875, 0.645751953125, 0.6982421875, 0.750732421875, 0.80322265625, 0.855712890625, 0.908203125, 0.960693359375, 1.01318359375, 1.065673828125, 1.1181640625, 1.170654296875, 1.22314453125, 1.275634765625, 1.328125, 1.380615234375, 1.43310546875, 1.485595703125, 1.5380859375]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 6.0, 8.0, 5.0, 4.0, 9.0, 4.0, 6.0, 9.0, 14.0, 13.0, 14.0, 16.0, 30.0, 29.0, 32.0, 54.0, 89.0, 113.0, 172.0, 373.0, 990.0, 3548.0, 18383.0, 149730.0, 1502618.0, 2180789.0, 298345.0, 30909.0, 5402.0, 1369.0, 509.0, 225.0, 136.0, 80.0, 51.0, 47.0, 36.0, 34.0, 18.0, 18.0, 13.0, 7.0, 10.0, 11.0, 3.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-4.609375, -4.47027587890625, -4.3311767578125, -4.19207763671875, -4.052978515625, -3.91387939453125, -3.7747802734375, -3.63568115234375, -3.49658203125, -3.35748291015625, -3.2183837890625, -3.07928466796875, -2.940185546875, -2.80108642578125, -2.6619873046875, -2.52288818359375, -2.3837890625, -2.24468994140625, -2.1055908203125, -1.96649169921875, -1.827392578125, -1.68829345703125, -1.5491943359375, -1.41009521484375, -1.27099609375, -1.13189697265625, -0.9927978515625, -0.85369873046875, -0.714599609375, -0.57550048828125, -0.4364013671875, -0.29730224609375, -0.158203125, -0.01910400390625, 0.1199951171875, 0.25909423828125, 0.398193359375, 0.53729248046875, 0.6763916015625, 0.81549072265625, 0.95458984375, 1.09368896484375, 1.2327880859375, 1.37188720703125, 1.510986328125, 1.65008544921875, 1.7891845703125, 1.92828369140625, 2.0673828125, 2.20648193359375, 2.3455810546875, 2.48468017578125, 2.623779296875, 2.76287841796875, 2.9019775390625, 3.04107666015625, 3.18017578125, 3.31927490234375, 3.4583740234375, 3.59747314453125, 3.736572265625, 3.87567138671875, 4.0147705078125, 4.15386962890625, 4.29296875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 5.0, 4.0, 5.0, 6.0, 6.0, 14.0, 14.0, 25.0, 41.0, 50.0, 56.0, 80.0, 119.0, 185.0, 248.0, 312.0, 425.0, 491.0, 475.0, 375.0, 308.0, 236.0, 184.0, 126.0, 91.0, 57.0, 46.0, 22.0, 28.0, 14.0, 11.0, 8.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0859375, -4.9266357421875, -4.767333984375, -4.6080322265625, -4.44873046875, -4.2894287109375, -4.130126953125, -3.9708251953125, -3.8115234375, -3.6522216796875, -3.492919921875, -3.3336181640625, -3.17431640625, -3.0150146484375, -2.855712890625, -2.6964111328125, -2.537109375, -2.3778076171875, -2.218505859375, -2.0592041015625, -1.89990234375, -1.7406005859375, -1.581298828125, -1.4219970703125, -1.2626953125, -1.1033935546875, -0.944091796875, -0.7847900390625, -0.62548828125, -0.4661865234375, -0.306884765625, -0.1475830078125, 0.01171875, 0.1710205078125, 0.330322265625, 0.4896240234375, 0.64892578125, 0.8082275390625, 0.967529296875, 1.1268310546875, 1.2861328125, 1.4454345703125, 1.604736328125, 1.7640380859375, 1.92333984375, 2.0826416015625, 2.241943359375, 2.4012451171875, 2.560546875, 2.7198486328125, 2.879150390625, 3.0384521484375, 3.19775390625, 3.3570556640625, 3.516357421875, 3.6756591796875, 3.8349609375, 3.9942626953125, 4.153564453125, 4.3128662109375, 4.47216796875, 4.6314697265625, 4.790771484375, 4.9500732421875, 5.109375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 6.0, 12.0, 8.0, 17.0, 18.0, 40.0, 54.0, 102.0, 120.0, 215.0, 416.0, 1050.0, 4953.0, 71356.0, 2616572.0, 1456444.0, 37808.0, 3313.0, 861.0, 341.0, 188.0, 123.0, 84.0, 46.0, 42.0, 30.0, 20.0, 10.0, 7.0, 7.0, 1.0, 4.0, 4.0, 4.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.203125, -9.8238525390625, -9.444580078125, -9.0653076171875, -8.68603515625, -8.3067626953125, -7.927490234375, -7.5482177734375, -7.1689453125, -6.7896728515625, -6.410400390625, -6.0311279296875, -5.65185546875, -5.2725830078125, -4.893310546875, -4.5140380859375, -4.134765625, -3.7554931640625, -3.376220703125, -2.9969482421875, -2.61767578125, -2.2384033203125, -1.859130859375, -1.4798583984375, -1.1005859375, -0.7213134765625, -0.342041015625, 0.0372314453125, 0.41650390625, 0.7957763671875, 1.175048828125, 1.5543212890625, 1.93359375, 2.3128662109375, 2.692138671875, 3.0714111328125, 3.45068359375, 3.8299560546875, 4.209228515625, 4.5885009765625, 4.9677734375, 5.3470458984375, 5.726318359375, 6.1055908203125, 6.48486328125, 6.8641357421875, 7.243408203125, 7.6226806640625, 8.001953125, 8.3812255859375, 8.760498046875, 9.1397705078125, 9.51904296875, 9.8983154296875, 10.277587890625, 10.6568603515625, 11.0361328125, 11.4154052734375, 11.794677734375, 12.1739501953125, 12.55322265625, 12.9324951171875, 13.311767578125, 13.6910400390625, 14.0703125]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 8.0, 26.0, 33.0, 78.0, 105.0, 153.0, 168.0, 138.0, 125.0, 86.0, 51.0, 23.0, 11.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-13.65777587890625, -12.658008575439453, -11.658241271972656, -10.65847396850586, -9.658706665039062, -8.658939361572266, -7.659172534942627, -6.65940523147583, -5.659637928009033, -4.659870624542236, -3.6601033210754395, -2.6603362560272217, -1.6605689525604248, -0.660801887512207, 0.33896541595458984, 1.3387327194213867, 2.3385000228881836, 3.3382673263549805, 4.338034629821777, 5.337801933288574, 6.337569236755371, 7.33733606338501, 8.337102890014648, 9.336870193481445, 10.336637496948242, 11.336404800415039, 12.336172103881836, 13.335939407348633, 14.33570671081543, 15.335474014282227, 16.335241317749023, 17.33500862121582, 18.334775924682617, 19.334543228149414, 20.33431053161621, 21.334077835083008, 22.333845138549805, 23.3336124420166, 24.3333797454834, 25.333147048950195, 26.332914352416992, 27.33268165588379, 28.332448959350586, 29.332216262817383, 30.33198356628418, 31.331750869750977, 32.33151626586914, 33.33128356933594, 34.331050872802734, 35.33081817626953, 36.33058547973633, 37.330352783203125, 38.33012008666992, 39.32988739013672, 40.329654693603516, 41.32942199707031, 42.32918930053711, 43.328956604003906, 44.3287239074707, 45.3284912109375, 46.3282585144043, 47.328025817871094, 48.32779312133789, 49.32756042480469, 50.327327728271484]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 2.0, 4.0, 8.0, 4.0, 5.0, 4.0, 4.0, 13.0, 7.0, 20.0, 14.0, 15.0, 18.0, 26.0, 23.0, 26.0, 30.0, 35.0, 34.0, 40.0, 42.0, 46.0, 40.0, 46.0, 42.0, 47.0, 45.0, 41.0, 36.0, 32.0, 31.0, 31.0, 28.0, 25.0, 25.0, 32.0, 17.0, 10.0, 10.0, 9.0, 14.0, 6.0, 8.0, 2.0, 2.0, 6.0, 3.0, 2.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.956981658935547, -13.46343994140625, -12.969898223876953, -12.476357460021973, -11.982815742492676, -11.489274024963379, -10.995733261108398, -10.502191543579102, -10.008649826049805, -9.515108108520508, -9.021566390991211, -8.52802562713623, -8.034483909606934, -7.540942192077637, -7.047400951385498, -6.553859710693359, -6.0603179931640625, -5.566776275634766, -5.073235034942627, -4.579693794250488, -4.086152076721191, -3.5926105976104736, -3.099069118499756, -2.605527639389038, -2.1119861602783203, -1.6184446811676025, -1.1249032020568848, -0.631361722946167, -0.13782024383544922, 0.35572123527526855, 0.8492627143859863, 1.342804193496704, 1.8363456726074219, 2.3298871517181396, 2.8234286308288574, 3.316970109939575, 3.810511589050293, 4.30405330657959, 4.7975945472717285, 5.291135787963867, 5.784677505493164, 6.278219223022461, 6.7717604637146, 7.265301704406738, 7.758843421936035, 8.252385139465332, 8.745925903320312, 9.23946762084961, 9.733009338378906, 10.226551055908203, 10.7200927734375, 11.21363353729248, 11.707175254821777, 12.200716972351074, 12.694257736206055, 13.187799453735352, 13.681341171264648, 14.174882888793945, 14.668424606323242, 15.161965370178223, 15.65550708770752, 16.1490478515625, 16.642589569091797, 17.136131286621094, 17.62967300415039]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 8.0, 4.0, 4.0, 7.0, 5.0, 6.0, 4.0, 12.0, 11.0, 15.0, 10.0, 22.0, 13.0, 15.0, 15.0, 26.0, 23.0, 21.0, 32.0, 35.0, 34.0, 38.0, 45.0, 42.0, 46.0, 44.0, 49.0, 42.0, 34.0, 39.0, 31.0, 25.0, 34.0, 27.0, 27.0, 17.0, 23.0, 19.0, 18.0, 18.0, 14.0, 11.0, 11.0, 8.0, 4.0, 5.0, 5.0, 4.0, 2.0, 4.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.572265625, -1.5201416015625, -1.468017578125, -1.4158935546875, -1.36376953125, -1.3116455078125, -1.259521484375, -1.2073974609375, -1.1552734375, -1.1031494140625, -1.051025390625, -0.9989013671875, -0.94677734375, -0.8946533203125, -0.842529296875, -0.7904052734375, -0.73828125, -0.6861572265625, -0.634033203125, -0.5819091796875, -0.52978515625, -0.4776611328125, -0.425537109375, -0.3734130859375, -0.3212890625, -0.2691650390625, -0.217041015625, -0.1649169921875, -0.11279296875, -0.0606689453125, -0.008544921875, 0.0435791015625, 0.095703125, 0.1478271484375, 0.199951171875, 0.2520751953125, 0.30419921875, 0.3563232421875, 0.408447265625, 0.4605712890625, 0.5126953125, 0.5648193359375, 0.616943359375, 0.6690673828125, 0.72119140625, 0.7733154296875, 0.825439453125, 0.8775634765625, 0.9296875, 0.9818115234375, 1.033935546875, 1.0860595703125, 1.13818359375, 1.1903076171875, 1.242431640625, 1.2945556640625, 1.3466796875, 1.3988037109375, 1.450927734375, 1.5030517578125, 1.55517578125, 1.6072998046875, 1.659423828125, 1.7115478515625, 1.763671875]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 1.0, 8.0, 13.0, 12.0, 15.0, 26.0, 40.0, 68.0, 106.0, 124.0, 193.0, 326.0, 435.0, 618.0, 834.0, 1183.0, 1702.0, 2553.0, 3679.0, 5353.0, 7847.0, 11582.0, 17610.0, 26781.0, 41993.0, 68393.0, 123064.0, 260443.0, 204910.0, 101747.0, 58728.0, 36425.0, 23472.0, 15467.0, 10435.0, 6842.0, 4816.0, 3306.0, 2267.0, 1573.0, 1078.0, 729.0, 540.0, 379.0, 273.0, 192.0, 120.0, 88.0, 58.0, 42.0, 30.0, 17.0, 14.0, 9.0, 7.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.306884765625, -0.29724884033203125, -0.2876129150390625, -0.27797698974609375, -0.268341064453125, -0.25870513916015625, -0.2490692138671875, -0.23943328857421875, -0.22979736328125, -0.22016143798828125, -0.2105255126953125, -0.20088958740234375, -0.191253662109375, -0.18161773681640625, -0.1719818115234375, -0.16234588623046875, -0.1527099609375, -0.14307403564453125, -0.1334381103515625, -0.12380218505859375, -0.114166259765625, -0.10453033447265625, -0.0948944091796875, -0.08525848388671875, -0.07562255859375, -0.06598663330078125, -0.0563507080078125, -0.04671478271484375, -0.037078857421875, -0.02744293212890625, -0.0178070068359375, -0.00817108154296875, 0.00146484375, 0.01110076904296875, 0.0207366943359375, 0.03037261962890625, 0.040008544921875, 0.04964447021484375, 0.0592803955078125, 0.06891632080078125, 0.07855224609375, 0.08818817138671875, 0.0978240966796875, 0.10746002197265625, 0.117095947265625, 0.12673187255859375, 0.1363677978515625, 0.14600372314453125, 0.1556396484375, 0.16527557373046875, 0.1749114990234375, 0.18454742431640625, 0.194183349609375, 0.20381927490234375, 0.2134552001953125, 0.22309112548828125, 0.23272705078125, 0.24236297607421875, 0.2519989013671875, 0.26163482666015625, 0.271270751953125, 0.28090667724609375, 0.2905426025390625, 0.30017852783203125, 0.309814453125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 3.0, 5.0, 6.0, 4.0, 12.0, 10.0, 12.0, 14.0, 16.0, 7.0, 16.0, 24.0, 21.0, 36.0, 28.0, 28.0, 26.0, 36.0, 24.0, 29.0, 29.0, 35.0, 30.0, 1053.0, 41.0, 34.0, 34.0, 34.0, 33.0, 32.0, 17.0, 33.0, 32.0, 25.0, 29.0, 24.0, 11.0, 33.0, 19.0, 18.0, 12.0, 11.0, 11.0, 7.0, 9.0, 12.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.9716796875, -0.9411544799804688, -0.9106292724609375, -0.8801040649414062, -0.849578857421875, -0.8190536499023438, -0.7885284423828125, -0.7580032348632812, -0.72747802734375, -0.6969528198242188, -0.6664276123046875, -0.6359024047851562, -0.605377197265625, -0.5748519897460938, -0.5443267822265625, -0.5138015747070312, -0.4832763671875, -0.45275115966796875, -0.4222259521484375, -0.39170074462890625, -0.361175537109375, -0.33065032958984375, -0.3001251220703125, -0.26959991455078125, -0.23907470703125, -0.20854949951171875, -0.1780242919921875, -0.14749908447265625, -0.116973876953125, -0.08644866943359375, -0.0559234619140625, -0.02539825439453125, 0.005126953125, 0.03565216064453125, 0.0661773681640625, 0.09670257568359375, 0.127227783203125, 0.15775299072265625, 0.1882781982421875, 0.21880340576171875, 0.24932861328125, 0.27985382080078125, 0.3103790283203125, 0.34090423583984375, 0.371429443359375, 0.40195465087890625, 0.4324798583984375, 0.46300506591796875, 0.4935302734375, 0.5240554809570312, 0.5545806884765625, 0.5851058959960938, 0.615631103515625, 0.6461563110351562, 0.6766815185546875, 0.7072067260742188, 0.73773193359375, 0.7682571411132812, 0.7987823486328125, 0.8293075561523438, 0.859832763671875, 0.8903579711914062, 0.9208831787109375, 0.9514083862304688, 0.98193359375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 7.0, 11.0, 12.0, 13.0, 33.0, 53.0, 69.0, 100.0, 154.0, 242.0, 337.0, 497.0, 675.0, 1068.0, 1527.0, 2198.0, 3210.0, 4756.0, 6877.0, 10084.0, 15034.0, 22642.0, 34203.0, 54086.0, 88535.0, 159527.0, 1307727.0, 149491.0, 83884.0, 51114.0, 32801.0, 21511.0, 14145.0, 9527.0, 6458.0, 4467.0, 3145.0, 2153.0, 1540.0, 1057.0, 714.0, 502.0, 318.0, 229.0, 125.0, 98.0, 63.0, 55.0, 21.0, 16.0, 13.0, 5.0, 6.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.2646484375, -0.25623321533203125, -0.2478179931640625, -0.23940277099609375, -0.230987548828125, -0.22257232666015625, -0.2141571044921875, -0.20574188232421875, -0.19732666015625, -0.18891143798828125, -0.1804962158203125, -0.17208099365234375, -0.163665771484375, -0.15525054931640625, -0.1468353271484375, -0.13842010498046875, -0.1300048828125, -0.12158966064453125, -0.1131744384765625, -0.10475921630859375, -0.096343994140625, -0.08792877197265625, -0.0795135498046875, -0.07109832763671875, -0.06268310546875, -0.05426788330078125, -0.0458526611328125, -0.03743743896484375, -0.029022216796875, -0.02060699462890625, -0.0121917724609375, -0.00377655029296875, 0.004638671875, 0.01305389404296875, 0.0214691162109375, 0.02988433837890625, 0.038299560546875, 0.04671478271484375, 0.0551300048828125, 0.06354522705078125, 0.07196044921875, 0.08037567138671875, 0.0887908935546875, 0.09720611572265625, 0.105621337890625, 0.11403656005859375, 0.1224517822265625, 0.13086700439453125, 0.1392822265625, 0.14769744873046875, 0.1561126708984375, 0.16452789306640625, 0.172943115234375, 0.18135833740234375, 0.1897735595703125, 0.19818878173828125, 0.20660400390625, 0.21501922607421875, 0.2234344482421875, 0.23184967041015625, 0.240264892578125, 0.24868011474609375, 0.2570953369140625, 0.26551055908203125, 0.27392578125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 5.0, 2.0, 2.0, 8.0, 4.0, 11.0, 8.0, 10.0, 7.0, 10.0, 16.0, 17.0, 17.0, 17.0, 28.0, 44.0, 53.0, 45.0, 41.0, 64.0, 60.0, 59.0, 67.0, 48.0, 55.0, 36.0, 44.0, 43.0, 33.0, 23.0, 29.0, 19.0, 17.0, 13.0, 3.0, 5.0, 5.0, 9.0, 6.0, 8.0, 0.0, 4.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.00022685527801513672, -0.000220518559217453, -0.0002141818404197693, -0.00020784512162208557, -0.00020150840282440186, -0.00019517168402671814, -0.00018883496522903442, -0.0001824982464313507, -0.000176161527633667, -0.00016982480883598328, -0.00016348809003829956, -0.00015715137124061584, -0.00015081465244293213, -0.0001444779336452484, -0.0001381412148475647, -0.00013180449604988098, -0.00012546777725219727, -0.00011913105845451355, -0.00011279433965682983, -0.00010645762085914612, -0.0001001209020614624, -9.378418326377869e-05, -8.744746446609497e-05, -8.111074566841125e-05, -7.477402687072754e-05, -6.843730807304382e-05, -6.210058927536011e-05, -5.576387047767639e-05, -4.9427151679992676e-05, -4.309043288230896e-05, -3.6753714084625244e-05, -3.041699528694153e-05, -2.4080276489257812e-05, -1.7743557691574097e-05, -1.1406838893890381e-05, -5.070120096206665e-06, 1.2665987014770508e-06, 7.603317499160767e-06, 1.3940036296844482e-05, 2.0276755094528198e-05, 2.6613473892211914e-05, 3.295019268989563e-05, 3.9286911487579346e-05, 4.562363028526306e-05, 5.196034908294678e-05, 5.829706788063049e-05, 6.463378667831421e-05, 7.097050547599792e-05, 7.730722427368164e-05, 8.364394307136536e-05, 8.998066186904907e-05, 9.631738066673279e-05, 0.0001026540994644165, 0.00010899081826210022, 0.00011532753705978394, 0.00012166425585746765, 0.00012800097465515137, 0.00013433769345283508, 0.0001406744122505188, 0.00014701113104820251, 0.00015334784984588623, 0.00015968456864356995, 0.00016602128744125366, 0.00017235800623893738, 0.0001786947250366211]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 5.0, 3.0, 2.0, 1.0, 3.0, 4.0, 5.0, 8.0, 5.0, 9.0, 13.0, 11.0, 19.0, 25.0, 31.0, 40.0, 55.0, 56.0, 81.0, 83.0, 115.0, 187.0, 223.0, 356.0, 491.0, 1668.0, 133911.0, 899980.0, 8834.0, 794.0, 425.0, 295.0, 189.0, 144.0, 108.0, 67.0, 47.0, 58.0, 40.0, 26.0, 22.0, 24.0, 24.0, 19.0, 15.0, 16.0, 6.0, 9.0, 2.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00284576416015625, -0.00274503231048584, -0.0026443004608154297, -0.0025435686111450195, -0.0024428367614746094, -0.0023421049118041992, -0.002241373062133789, -0.002140641212463379, -0.0020399093627929688, -0.0019391775131225586, -0.0018384456634521484, -0.0017377138137817383, -0.0016369819641113281, -0.001536250114440918, -0.0014355182647705078, -0.0013347864151000977, -0.0012340545654296875, -0.0011333227157592773, -0.0010325908660888672, -0.000931859016418457, -0.0008311271667480469, -0.0007303953170776367, -0.0006296634674072266, -0.0005289316177368164, -0.00042819976806640625, -0.0003274679183959961, -0.00022673606872558594, -0.00012600421905517578, -2.5272369384765625e-05, 7.545948028564453e-05, 0.0001761913299560547, 0.00027692317962646484, 0.000377655029296875, 0.00047838687896728516, 0.0005791187286376953, 0.0006798505783081055, 0.0007805824279785156, 0.0008813142776489258, 0.000982046127319336, 0.001082777976989746, 0.0011835098266601562, 0.0012842416763305664, 0.0013849735260009766, 0.0014857053756713867, 0.0015864372253417969, 0.001687169075012207, 0.0017879009246826172, 0.0018886327743530273, 0.0019893646240234375, 0.0020900964736938477, 0.002190828323364258, 0.002291560173034668, 0.002392292022705078, 0.0024930238723754883, 0.0025937557220458984, 0.0026944875717163086, 0.0027952194213867188, 0.002895951271057129, 0.002996683120727539, 0.0030974149703979492, 0.0031981468200683594, 0.0032988786697387695, 0.0033996105194091797, 0.00350034236907959, 0.00360107421875]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 17.0, 39.0, 84.0, 172.0, 225.0, 210.0, 136.0, 67.0, 37.0, 14.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00040207267738878727, -0.00039331018342636526, -0.0003845477185677737, -0.0003757852246053517, -0.0003670227306429297, -0.00035826023668050766, -0.0003494977718219161, -0.0003407352778594941, -0.0003319727838970721, -0.00032321028993465006, -0.0003144478250760585, -0.0003056853311136365, -0.0002969228371512145, -0.00028816034318879247, -0.0002793978783302009, -0.0002706353843677789, -0.0002618728904053569, -0.00025311039644293487, -0.0002443479315843433, -0.0002355854376219213, -0.0002268229436594993, -0.0002180604642489925, -0.00020929798483848572, -0.0002005354908760637, -0.00019177302601747215, -0.00018301054660696536, -0.00017424805264454335, -0.00016548557323403656, -0.00015672307927161455, -0.00014796059986110777, -0.00013919812045060098, -0.00013043562648817897, -0.00012167311797384173, -0.00011291063128737733, -0.00010414814460091293, -9.538566519040614e-05, -8.662317122798413e-05, -7.786069181747735e-05, -6.909820513101295e-05, -6.033571844454855e-05, -5.157323175808415e-05, -4.281074507161975e-05, -3.404825838515535e-05, -2.5285775336669758e-05, -1.652328865020536e-05, -7.76080196374096e-06, 1.0016810847446322e-06, 9.764167771209031e-06, 1.852665445767343e-05, 2.728914114413783e-05, 3.605162783060223e-05, 4.481411087908782e-05, 5.357659756555222e-05, 6.233908061403781e-05, 7.110156730050221e-05, 7.986405398696661e-05, 8.862654067343101e-05, 9.738902735989541e-05, 0.00010615151404635981, 0.0001149140007328242, 0.000123676480143331, 0.000132438974105753, 0.0001412014535162598, 0.0001499639474786818, 0.0001587264268891886]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 0.0, 2.0, 3.0, 4.0, 6.0, 8.0, 8.0, 15.0, 13.0, 13.0, 20.0, 22.0, 15.0, 26.0, 33.0, 24.0, 28.0, 55.0, 35.0, 35.0, 37.0, 43.0, 42.0, 29.0, 35.0, 27.0, 41.0, 37.0, 32.0, 33.0, 21.0, 35.0, 35.0, 22.0, 24.0, 31.0, 16.0, 20.0, 16.0, 13.0, 12.0, 6.0, 2.0, 7.0, 3.0, 9.0, 1.0, 4.0, 2.0, 6.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.00010120868682861328, -9.79127362370491e-05, -9.461678564548492e-05, -9.132083505392075e-05, -8.802488446235657e-05, -8.472893387079239e-05, -8.143298327922821e-05, -7.813703268766403e-05, -7.484108209609985e-05, -7.154513150453568e-05, -6.82491809129715e-05, -6.495323032140732e-05, -6.165727972984314e-05, -5.836132913827896e-05, -5.506537854671478e-05, -5.1769427955150604e-05, -4.8473477363586426e-05, -4.517752677202225e-05, -4.188157618045807e-05, -3.858562558889389e-05, -3.528967499732971e-05, -3.1993724405765533e-05, -2.8697773814201355e-05, -2.5401823222637177e-05, -2.2105872631072998e-05, -1.880992203950882e-05, -1.551397144794464e-05, -1.2218020856380463e-05, -8.922070264816284e-06, -5.626119673252106e-06, -2.3301690816879272e-06, 9.657815098762512e-07, 4.26173210144043e-06, 7.557682693004608e-06, 1.0853633284568787e-05, 1.4149583876132965e-05, 1.7445534467697144e-05, 2.0741485059261322e-05, 2.40374356508255e-05, 2.733338624238968e-05, 3.062933683395386e-05, 3.3925287425518036e-05, 3.7221238017082214e-05, 4.051718860864639e-05, 4.381313920021057e-05, 4.710908979177475e-05, 5.040504038333893e-05, 5.370099097490311e-05, 5.6996941566467285e-05, 6.0292892158031464e-05, 6.358884274959564e-05, 6.688479334115982e-05, 7.0180743932724e-05, 7.347669452428818e-05, 7.677264511585236e-05, 8.006859570741653e-05, 8.336454629898071e-05, 8.666049689054489e-05, 8.995644748210907e-05, 9.325239807367325e-05, 9.654834866523743e-05, 9.98442992568016e-05, 0.00010314024984836578, 0.00010643620043992996, 0.00010973215103149414]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 8.0, 4.0, 4.0, 7.0, 5.0, 6.0, 4.0, 12.0, 11.0, 15.0, 10.0, 22.0, 13.0, 15.0, 15.0, 26.0, 23.0, 21.0, 32.0, 35.0, 34.0, 38.0, 45.0, 42.0, 46.0, 44.0, 49.0, 42.0, 34.0, 39.0, 31.0, 25.0, 34.0, 27.0, 27.0, 17.0, 23.0, 19.0, 18.0, 18.0, 14.0, 11.0, 11.0, 8.0, 4.0, 5.0, 5.0, 4.0, 2.0, 4.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.572265625, -1.5201416015625, -1.468017578125, -1.4158935546875, -1.36376953125, -1.3116455078125, -1.259521484375, -1.2073974609375, -1.1552734375, -1.1031494140625, -1.051025390625, -0.9989013671875, -0.94677734375, -0.8946533203125, -0.842529296875, -0.7904052734375, -0.73828125, -0.6861572265625, -0.634033203125, -0.5819091796875, -0.52978515625, -0.4776611328125, -0.425537109375, -0.3734130859375, -0.3212890625, -0.2691650390625, -0.217041015625, -0.1649169921875, -0.11279296875, -0.0606689453125, -0.008544921875, 0.0435791015625, 0.095703125, 0.1478271484375, 0.199951171875, 0.2520751953125, 0.30419921875, 0.3563232421875, 0.408447265625, 0.4605712890625, 0.5126953125, 0.5648193359375, 0.616943359375, 0.6690673828125, 0.72119140625, 0.7733154296875, 0.825439453125, 0.8775634765625, 0.9296875, 0.9818115234375, 1.033935546875, 1.0860595703125, 1.13818359375, 1.1903076171875, 1.242431640625, 1.2945556640625, 1.3466796875, 1.3988037109375, 1.450927734375, 1.5030517578125, 1.55517578125, 1.6072998046875, 1.659423828125, 1.7115478515625, 1.763671875]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 5.0, 12.0, 10.0, 14.0, 17.0, 26.0, 29.0, 49.0, 60.0, 90.0, 123.0, 178.0, 277.0, 388.0, 587.0, 981.0, 1692.0, 2917.0, 5442.0, 10368.0, 22412.0, 56867.0, 184221.0, 455573.0, 197669.0, 60898.0, 23707.0, 10616.0, 5503.0, 3035.0, 1821.0, 1071.0, 624.0, 402.0, 263.0, 174.0, 121.0, 98.0, 59.0, 45.0, 30.0, 25.0, 15.0, 11.0, 12.0, 8.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.251953125, -2.175689697265625, -2.09942626953125, -2.023162841796875, -1.9468994140625, -1.870635986328125, -1.79437255859375, -1.718109130859375, -1.641845703125, -1.565582275390625, -1.48931884765625, -1.413055419921875, -1.3367919921875, -1.260528564453125, -1.18426513671875, -1.108001708984375, -1.03173828125, -0.955474853515625, -0.87921142578125, -0.802947998046875, -0.7266845703125, -0.650421142578125, -0.57415771484375, -0.497894287109375, -0.421630859375, -0.345367431640625, -0.26910400390625, -0.192840576171875, -0.1165771484375, -0.040313720703125, 0.03594970703125, 0.112213134765625, 0.1884765625, 0.264739990234375, 0.34100341796875, 0.417266845703125, 0.4935302734375, 0.569793701171875, 0.64605712890625, 0.722320556640625, 0.798583984375, 0.874847412109375, 0.95111083984375, 1.027374267578125, 1.1036376953125, 1.179901123046875, 1.25616455078125, 1.332427978515625, 1.40869140625, 1.484954833984375, 1.56121826171875, 1.637481689453125, 1.7137451171875, 1.790008544921875, 1.86627197265625, 1.942535400390625, 2.018798828125, 2.095062255859375, 2.17132568359375, 2.247589111328125, 2.3238525390625, 2.400115966796875, 2.47637939453125, 2.552642822265625, 2.62890625]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 3.0, 7.0, 5.0, 5.0, 6.0, 10.0, 15.0, 10.0, 12.0, 16.0, 14.0, 15.0, 14.0, 25.0, 20.0, 31.0, 42.0, 43.0, 44.0, 43.0, 73.0, 110.0, 182.0, 1392.0, 296.0, 129.0, 79.0, 54.0, 42.0, 47.0, 30.0, 30.0, 27.0, 20.0, 23.0, 21.0, 26.0, 25.0, 9.0, 15.0, 11.0, 5.0, 8.0, 6.0, 4.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.76171875, -5.5743408203125, -5.386962890625, -5.1995849609375, -5.01220703125, -4.8248291015625, -4.637451171875, -4.4500732421875, -4.2626953125, -4.0753173828125, -3.887939453125, -3.7005615234375, -3.51318359375, -3.3258056640625, -3.138427734375, -2.9510498046875, -2.763671875, -2.5762939453125, -2.388916015625, -2.2015380859375, -2.01416015625, -1.8267822265625, -1.639404296875, -1.4520263671875, -1.2646484375, -1.0772705078125, -0.889892578125, -0.7025146484375, -0.51513671875, -0.3277587890625, -0.140380859375, 0.0469970703125, 0.234375, 0.4217529296875, 0.609130859375, 0.7965087890625, 0.98388671875, 1.1712646484375, 1.358642578125, 1.5460205078125, 1.7333984375, 1.9207763671875, 2.108154296875, 2.2955322265625, 2.48291015625, 2.6702880859375, 2.857666015625, 3.0450439453125, 3.232421875, 3.4197998046875, 3.607177734375, 3.7945556640625, 3.98193359375, 4.1693115234375, 4.356689453125, 4.5440673828125, 4.7314453125, 4.9188232421875, 5.106201171875, 5.2935791015625, 5.48095703125, 5.6683349609375, 5.855712890625, 6.0430908203125, 6.23046875]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 7.0, 2.0, 7.0, 11.0, 21.0, 38.0, 39.0, 73.0, 117.0, 181.0, 374.0, 1246.0, 36173.0, 3093095.0, 12571.0, 943.0, 320.0, 165.0, 98.0, 66.0, 48.0, 34.0, 20.0, 22.0, 15.0, 6.0, 2.0, 3.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.5625, -25.790283203125, -25.01806640625, -24.245849609375, -23.4736328125, -22.701416015625, -21.92919921875, -21.156982421875, -20.384765625, -19.612548828125, -18.84033203125, -18.068115234375, -17.2958984375, -16.523681640625, -15.75146484375, -14.979248046875, -14.20703125, -13.434814453125, -12.66259765625, -11.890380859375, -11.1181640625, -10.345947265625, -9.57373046875, -8.801513671875, -8.029296875, -7.257080078125, -6.48486328125, -5.712646484375, -4.9404296875, -4.168212890625, -3.39599609375, -2.623779296875, -1.8515625, -1.079345703125, -0.30712890625, 0.465087890625, 1.2373046875, 2.009521484375, 2.78173828125, 3.553955078125, 4.326171875, 5.098388671875, 5.87060546875, 6.642822265625, 7.4150390625, 8.187255859375, 8.95947265625, 9.731689453125, 10.50390625, 11.276123046875, 12.04833984375, 12.820556640625, 13.5927734375, 14.364990234375, 15.13720703125, 15.909423828125, 16.681640625, 17.453857421875, 18.22607421875, 18.998291015625, 19.7705078125, 20.542724609375, 21.31494140625, 22.087158203125, 22.859375]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 10.0, 144.0, 560.0, 282.0, 19.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-102.21324920654297, -100.40779113769531, -98.60233306884766, -96.796875, -94.99141693115234, -93.18595886230469, -91.38050079345703, -89.57504272460938, -87.76958465576172, -85.96412658691406, -84.1586685180664, -82.35321044921875, -80.5477523803711, -78.74229431152344, -76.93683624267578, -75.13137817382812, -73.32592010498047, -71.52046203613281, -69.71500396728516, -67.9095458984375, -66.10408782958984, -64.29862976074219, -62.49317169189453, -60.687713623046875, -58.882259368896484, -57.07680130004883, -55.27134323120117, -53.465885162353516, -51.66042709350586, -49.8549690246582, -48.04951095581055, -46.24405288696289, -44.43859100341797, -42.63313293457031, -40.827674865722656, -39.022216796875, -37.216758728027344, -35.41130065917969, -33.60584259033203, -31.800384521484375, -29.994930267333984, -28.189472198486328, -26.384014129638672, -24.578556060791016, -22.77309799194336, -20.967639923095703, -19.162181854248047, -17.35672378540039, -15.551265716552734, -13.745807647705078, -11.940349578857422, -10.134891510009766, -8.32943344116211, -6.5239763259887695, -4.718518257141113, -2.913060188293457, -1.1076021194458008, 0.6978558301925659, 2.5033137798309326, 4.30877161026001, 6.114229679107666, 7.919687271118164, 9.72514533996582, 11.530603408813477, 13.336061477661133]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 7.0, 11.0, 10.0, 9.0, 8.0, 9.0, 15.0, 9.0, 10.0, 24.0, 15.0, 31.0, 19.0, 37.0, 16.0, 27.0, 30.0, 23.0, 31.0, 32.0, 32.0, 41.0, 32.0, 41.0, 44.0, 43.0, 36.0, 38.0, 25.0, 42.0, 27.0, 30.0, 26.0, 19.0, 21.0, 24.0, 18.0, 16.0, 19.0, 6.0, 9.0, 9.0, 7.0, 4.0, 9.0, 4.0, 5.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-17.81233024597168, -17.27786636352539, -16.7434024810791, -16.208938598632812, -15.674473762512207, -15.140008926391602, -14.605545043945312, -14.071081161499023, -13.536617279052734, -13.002153396606445, -12.46768856048584, -11.93322467803955, -11.398760795593262, -10.864295959472656, -10.329832077026367, -9.795368194580078, -9.260903358459473, -8.726439476013184, -8.191974639892578, -7.657510757446289, -7.123046875, -6.588582515716553, -6.0541181564331055, -5.519654273986816, -4.985189914703369, -4.450725555419922, -3.916261672973633, -3.3817973136901855, -2.8473331928253174, -2.312869071960449, -1.778404712677002, -1.2439405918121338, -0.7094764709472656, -0.17501229047775269, 0.35945188999176025, 0.893916130065918, 1.4283802509307861, 1.9628443717956543, 2.4973087310791016, 3.0317728519439697, 3.566236972808838, 4.100701332092285, 4.635165214538574, 5.1696295738220215, 5.704093933105469, 6.238557815551758, 6.773022174835205, 7.307486534118652, 7.841950416564941, 8.37641429901123, 8.910879135131836, 9.445343017578125, 9.979806900024414, 10.514270782470703, 11.048735618591309, 11.583199501037598, 12.117664337158203, 12.652128219604492, 13.186593055725098, 13.721056938171387, 14.255520820617676, 14.789985656738281, 15.32444953918457, 15.85891342163086, 16.39337730407715]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 1.0, 4.0, 2.0, 7.0, 4.0, 6.0, 6.0, 6.0, 6.0, 9.0, 12.0, 13.0, 12.0, 13.0, 10.0, 16.0, 27.0, 29.0, 32.0, 22.0, 25.0, 28.0, 31.0, 40.0, 40.0, 35.0, 40.0, 40.0, 39.0, 35.0, 33.0, 33.0, 35.0, 46.0, 29.0, 24.0, 19.0, 31.0, 25.0, 23.0, 14.0, 17.0, 11.0, 13.0, 13.0, 14.0, 6.0, 5.0, 9.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-1.6435546875, -1.5915069580078125, -1.539459228515625, -1.4874114990234375, -1.43536376953125, -1.3833160400390625, -1.331268310546875, -1.2792205810546875, -1.2271728515625, -1.1751251220703125, -1.123077392578125, -1.0710296630859375, -1.01898193359375, -0.9669342041015625, -0.914886474609375, -0.8628387451171875, -0.810791015625, -0.7587432861328125, -0.706695556640625, -0.6546478271484375, -0.60260009765625, -0.5505523681640625, -0.498504638671875, -0.4464569091796875, -0.3944091796875, -0.3423614501953125, -0.290313720703125, -0.2382659912109375, -0.18621826171875, -0.1341705322265625, -0.082122802734375, -0.0300750732421875, 0.02197265625, 0.0740203857421875, 0.126068115234375, 0.1781158447265625, 0.23016357421875, 0.2822113037109375, 0.334259033203125, 0.3863067626953125, 0.4383544921875, 0.4904022216796875, 0.542449951171875, 0.5944976806640625, 0.64654541015625, 0.6985931396484375, 0.750640869140625, 0.8026885986328125, 0.854736328125, 0.9067840576171875, 0.958831787109375, 1.0108795166015625, 1.06292724609375, 1.1149749755859375, 1.167022705078125, 1.2190704345703125, 1.2711181640625, 1.3231658935546875, 1.375213623046875, 1.4272613525390625, 1.47930908203125, 1.5313568115234375, 1.583404541015625, 1.6354522705078125, 1.6875]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 3.0, 7.0, 8.0, 6.0, 6.0, 17.0, 14.0, 17.0, 28.0, 36.0, 46.0, 74.0, 99.0, 139.0, 222.0, 333.0, 559.0, 1021.0, 2093.0, 4759.0, 11658.0, 32405.0, 101002.0, 333404.0, 909759.0, 1400407.0, 902799.0, 336663.0, 102817.0, 32302.0, 11773.0, 4868.0, 2208.0, 1127.0, 540.0, 329.0, 216.0, 149.0, 96.0, 84.0, 58.0, 30.0, 23.0, 24.0, 13.0, 15.0, 13.0, 3.0, 4.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.27734375, -2.207275390625, -2.13720703125, -2.067138671875, -1.9970703125, -1.927001953125, -1.85693359375, -1.786865234375, -1.716796875, -1.646728515625, -1.57666015625, -1.506591796875, -1.4365234375, -1.366455078125, -1.29638671875, -1.226318359375, -1.15625, -1.086181640625, -1.01611328125, -0.946044921875, -0.8759765625, -0.805908203125, -0.73583984375, -0.665771484375, -0.595703125, -0.525634765625, -0.45556640625, -0.385498046875, -0.3154296875, -0.245361328125, -0.17529296875, -0.105224609375, -0.03515625, 0.034912109375, 0.10498046875, 0.175048828125, 0.2451171875, 0.315185546875, 0.38525390625, 0.455322265625, 0.525390625, 0.595458984375, 0.66552734375, 0.735595703125, 0.8056640625, 0.875732421875, 0.94580078125, 1.015869140625, 1.0859375, 1.156005859375, 1.22607421875, 1.296142578125, 1.3662109375, 1.436279296875, 1.50634765625, 1.576416015625, 1.646484375, 1.716552734375, 1.78662109375, 1.856689453125, 1.9267578125, 1.996826171875, 2.06689453125, 2.136962890625, 2.20703125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 4.0, 2.0, 3.0, 7.0, 5.0, 12.0, 11.0, 7.0, 10.0, 19.0, 25.0, 47.0, 45.0, 69.0, 98.0, 130.0, 170.0, 216.0, 263.0, 356.0, 395.0, 406.0, 337.0, 271.0, 259.0, 208.0, 188.0, 137.0, 94.0, 65.0, 49.0, 51.0, 30.0, 24.0, 24.0, 18.0, 7.0, 4.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.046875, -3.91400146484375, -3.7811279296875, -3.64825439453125, -3.515380859375, -3.38250732421875, -3.2496337890625, -3.11676025390625, -2.98388671875, -2.85101318359375, -2.7181396484375, -2.58526611328125, -2.452392578125, -2.31951904296875, -2.1866455078125, -2.05377197265625, -1.9208984375, -1.78802490234375, -1.6551513671875, -1.52227783203125, -1.389404296875, -1.25653076171875, -1.1236572265625, -0.99078369140625, -0.85791015625, -0.72503662109375, -0.5921630859375, -0.45928955078125, -0.326416015625, -0.19354248046875, -0.0606689453125, 0.07220458984375, 0.205078125, 0.33795166015625, 0.4708251953125, 0.60369873046875, 0.736572265625, 0.86944580078125, 1.0023193359375, 1.13519287109375, 1.26806640625, 1.40093994140625, 1.5338134765625, 1.66668701171875, 1.799560546875, 1.93243408203125, 2.0653076171875, 2.19818115234375, 2.3310546875, 2.46392822265625, 2.5968017578125, 2.72967529296875, 2.862548828125, 2.99542236328125, 3.1282958984375, 3.26116943359375, 3.39404296875, 3.52691650390625, 3.6597900390625, 3.79266357421875, 3.925537109375, 4.05841064453125, 4.1912841796875, 4.32415771484375, 4.45703125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 6.0, 5.0, 7.0, 11.0, 25.0, 25.0, 42.0, 48.0, 60.0, 67.0, 115.0, 218.0, 460.0, 1619.0, 12262.0, 310012.0, 3470945.0, 381343.0, 14146.0, 1695.0, 510.0, 221.0, 130.0, 96.0, 61.0, 41.0, 23.0, 19.0, 19.0, 18.0, 9.0, 12.0, 4.0, 0.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.46875, -11.10498046875, -10.7412109375, -10.37744140625, -10.013671875, -9.64990234375, -9.2861328125, -8.92236328125, -8.55859375, -8.19482421875, -7.8310546875, -7.46728515625, -7.103515625, -6.73974609375, -6.3759765625, -6.01220703125, -5.6484375, -5.28466796875, -4.9208984375, -4.55712890625, -4.193359375, -3.82958984375, -3.4658203125, -3.10205078125, -2.73828125, -2.37451171875, -2.0107421875, -1.64697265625, -1.283203125, -0.91943359375, -0.5556640625, -0.19189453125, 0.171875, 0.53564453125, 0.8994140625, 1.26318359375, 1.626953125, 1.99072265625, 2.3544921875, 2.71826171875, 3.08203125, 3.44580078125, 3.8095703125, 4.17333984375, 4.537109375, 4.90087890625, 5.2646484375, 5.62841796875, 5.9921875, 6.35595703125, 6.7197265625, 7.08349609375, 7.447265625, 7.81103515625, 8.1748046875, 8.53857421875, 8.90234375, 9.26611328125, 9.6298828125, 9.99365234375, 10.357421875, 10.72119140625, 11.0849609375, 11.44873046875, 11.8125]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 8.0, 22.0, 68.0, 182.0, 252.0, 216.0, 158.0, 75.0, 23.0, 8.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.831392288208008, -13.320860862731934, -11.81032943725586, -10.299797058105469, -8.789265632629395, -7.27873420715332, -5.76820182800293, -4.2576704025268555, -2.7471389770507812, -1.236607313156128, 0.2739243507385254, 1.7844562530517578, 3.294987678527832, 4.805519104003906, 6.316051483154297, 7.826582908630371, 9.337114334106445, 10.84764575958252, 12.358177185058594, 13.868709564208984, 15.379240989685059, 16.889772415161133, 18.400304794311523, 19.91083526611328, 21.421367645263672, 22.931900024414062, 24.44243049621582, 25.95296287536621, 27.46349334716797, 28.97402572631836, 30.48455810546875, 31.99509048461914, 33.50562286376953, 35.01615524291992, 36.52668762207031, 38.03721618652344, 39.54774856567383, 41.05828094482422, 42.56881332397461, 44.079345703125, 45.589874267578125, 47.100406646728516, 48.610939025878906, 50.12146759033203, 51.63199996948242, 53.14253234863281, 54.6530647277832, 56.163597106933594, 57.674129486083984, 59.184661865234375, 60.695194244384766, 62.205726623535156, 63.71625518798828, 65.22679138183594, 66.73731994628906, 68.24784851074219, 69.75838470458984, 71.26891326904297, 72.77944946289062, 74.28997802734375, 75.8005142211914, 77.31104278564453, 78.82157897949219, 80.33210754394531, 81.84263610839844]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 4.0, 10.0, 4.0, 5.0, 11.0, 14.0, 8.0, 19.0, 15.0, 20.0, 27.0, 27.0, 26.0, 23.0, 49.0, 39.0, 50.0, 43.0, 52.0, 37.0, 45.0, 49.0, 47.0, 36.0, 38.0, 32.0, 31.0, 29.0, 33.0, 30.0, 23.0, 27.0, 19.0, 22.0, 7.0, 10.0, 8.0, 6.0, 13.0, 7.0, 6.0, 3.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.446765899658203, -16.941373825073242, -16.43597984313965, -15.930586814880371, -15.425193786621094, -14.919801712036133, -14.414408683776855, -13.909015655517578, -13.4036226272583, -12.898229598999023, -12.392836570739746, -11.887443542480469, -11.382051467895508, -10.876657485961914, -10.371265411376953, -9.865872383117676, -9.360479354858398, -8.855086326599121, -8.349693298339844, -7.844300746917725, -7.338907718658447, -6.83351469039917, -6.328122138977051, -5.822729110717773, -5.317336082458496, -4.811943054199219, -4.306550025939941, -3.8011574745178223, -3.295764446258545, -2.7903714179992676, -2.2849786281585693, -1.779585838317871, -1.2741947174072266, -0.7688018083572388, -0.263408899307251, 0.24198400974273682, 0.7473769187927246, 1.252769947052002, 1.7581627368927002, 2.2635555267333984, 2.768948554992676, 3.274341583251953, 3.7797343730926514, 4.28512716293335, 4.790520191192627, 5.295913219451904, 5.801305770874023, 6.306698799133301, 6.812091827392578, 7.3174848556518555, 7.822877883911133, 8.32827091217041, 8.833663940429688, 9.339056015014648, 9.844449043273926, 10.349842071533203, 10.85523509979248, 11.360628128051758, 11.866021156311035, 12.371414184570312, 12.876806259155273, 13.382200241088867, 13.887592315673828, 14.392985343933105, 14.898378372192383]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 1.0, 5.0, 4.0, 7.0, 7.0, 10.0, 15.0, 8.0, 5.0, 8.0, 15.0, 19.0, 21.0, 22.0, 33.0, 20.0, 27.0, 33.0, 26.0, 45.0, 44.0, 44.0, 38.0, 32.0, 44.0, 39.0, 38.0, 38.0, 40.0, 43.0, 31.0, 31.0, 38.0, 25.0, 23.0, 25.0, 8.0, 12.0, 16.0, 13.0, 13.0, 6.0, 8.0, 5.0, 7.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7421875, -1.6841278076171875, -1.626068115234375, -1.5680084228515625, -1.50994873046875, -1.4518890380859375, -1.393829345703125, -1.3357696533203125, -1.2777099609375, -1.2196502685546875, -1.161590576171875, -1.1035308837890625, -1.04547119140625, -0.9874114990234375, -0.929351806640625, -0.8712921142578125, -0.813232421875, -0.7551727294921875, -0.697113037109375, -0.6390533447265625, -0.58099365234375, -0.5229339599609375, -0.464874267578125, -0.4068145751953125, -0.3487548828125, -0.2906951904296875, -0.232635498046875, -0.1745758056640625, -0.11651611328125, -0.0584564208984375, -0.000396728515625, 0.0576629638671875, 0.11572265625, 0.1737823486328125, 0.231842041015625, 0.2899017333984375, 0.34796142578125, 0.4060211181640625, 0.464080810546875, 0.5221405029296875, 0.5802001953125, 0.6382598876953125, 0.696319580078125, 0.7543792724609375, 0.81243896484375, 0.8704986572265625, 0.928558349609375, 0.9866180419921875, 1.044677734375, 1.1027374267578125, 1.160797119140625, 1.2188568115234375, 1.27691650390625, 1.3349761962890625, 1.393035888671875, 1.4510955810546875, 1.5091552734375, 1.5672149658203125, 1.625274658203125, 1.6833343505859375, 1.74139404296875, 1.7994537353515625, 1.857513427734375, 1.9155731201171875, 1.9736328125]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 7.0, 4.0, 8.0, 14.0, 24.0, 29.0, 43.0, 66.0, 99.0, 149.0, 187.0, 312.0, 417.0, 672.0, 968.0, 1361.0, 2032.0, 2893.0, 4263.0, 6013.0, 9129.0, 13329.0, 20393.0, 31397.0, 51219.0, 87215.0, 165808.0, 283212.0, 150000.0, 80975.0, 47764.0, 29522.0, 19304.0, 12575.0, 8542.0, 5955.0, 3961.0, 2736.0, 1875.0, 1274.0, 880.0, 601.0, 449.0, 273.0, 213.0, 137.0, 96.0, 60.0, 39.0, 28.0, 14.0, 10.0, 13.0, 6.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.323486328125, -0.31319427490234375, -0.3029022216796875, -0.29261016845703125, -0.282318115234375, -0.27202606201171875, -0.2617340087890625, -0.25144195556640625, -0.24114990234375, -0.23085784912109375, -0.2205657958984375, -0.21027374267578125, -0.199981689453125, -0.18968963623046875, -0.1793975830078125, -0.16910552978515625, -0.1588134765625, -0.14852142333984375, -0.1382293701171875, -0.12793731689453125, -0.117645263671875, -0.10735321044921875, -0.0970611572265625, -0.08676910400390625, -0.07647705078125, -0.06618499755859375, -0.0558929443359375, -0.04560089111328125, -0.035308837890625, -0.02501678466796875, -0.0147247314453125, -0.00443267822265625, 0.005859375, 0.01615142822265625, 0.0264434814453125, 0.03673553466796875, 0.047027587890625, 0.05731964111328125, 0.0676116943359375, 0.07790374755859375, 0.08819580078125, 0.09848785400390625, 0.1087799072265625, 0.11907196044921875, 0.129364013671875, 0.13965606689453125, 0.1499481201171875, 0.16024017333984375, 0.1705322265625, 0.18082427978515625, 0.1911163330078125, 0.20140838623046875, 0.211700439453125, 0.22199249267578125, 0.2322845458984375, 0.24257659912109375, 0.25286865234375, 0.26316070556640625, 0.2734527587890625, 0.28374481201171875, 0.294036865234375, 0.30432891845703125, 0.3146209716796875, 0.32491302490234375, 0.335205078125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 6.0, 5.0, 4.0, 4.0, 8.0, 2.0, 9.0, 10.0, 10.0, 14.0, 18.0, 27.0, 15.0, 21.0, 25.0, 32.0, 34.0, 38.0, 35.0, 29.0, 34.0, 39.0, 31.0, 1072.0, 51.0, 49.0, 36.0, 44.0, 41.0, 37.0, 34.0, 20.0, 30.0, 26.0, 22.0, 22.0, 12.0, 13.0, 16.0, 9.0, 12.0, 9.0, 7.0, 4.0, 8.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.2392578125, -1.2024078369140625, -1.165557861328125, -1.1287078857421875, -1.09185791015625, -1.0550079345703125, -1.018157958984375, -0.9813079833984375, -0.9444580078125, -0.9076080322265625, -0.870758056640625, -0.8339080810546875, -0.79705810546875, -0.7602081298828125, -0.723358154296875, -0.6865081787109375, -0.649658203125, -0.6128082275390625, -0.575958251953125, -0.5391082763671875, -0.50225830078125, -0.4654083251953125, -0.428558349609375, -0.3917083740234375, -0.3548583984375, -0.3180084228515625, -0.281158447265625, -0.2443084716796875, -0.20745849609375, -0.1706085205078125, -0.133758544921875, -0.0969085693359375, -0.06005859375, -0.0232086181640625, 0.013641357421875, 0.0504913330078125, 0.08734130859375, 0.1241912841796875, 0.161041259765625, 0.1978912353515625, 0.2347412109375, 0.2715911865234375, 0.308441162109375, 0.3452911376953125, 0.38214111328125, 0.4189910888671875, 0.455841064453125, 0.4926910400390625, 0.529541015625, 0.5663909912109375, 0.603240966796875, 0.6400909423828125, 0.67694091796875, 0.7137908935546875, 0.750640869140625, 0.7874908447265625, 0.8243408203125, 0.8611907958984375, 0.898040771484375, 0.9348907470703125, 0.97174072265625, 1.0085906982421875, 1.045440673828125, 1.0822906494140625, 1.119140625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 6.0, 6.0, 4.0, 16.0, 13.0, 26.0, 37.0, 50.0, 76.0, 99.0, 144.0, 244.0, 358.0, 489.0, 737.0, 1093.0, 1660.0, 2400.0, 3477.0, 5183.0, 7527.0, 11576.0, 17713.0, 28041.0, 45921.0, 80403.0, 155560.0, 1348125.0, 168058.0, 84978.0, 48978.0, 29454.0, 18487.0, 11909.0, 7697.0, 5224.0, 3497.0, 2412.0, 1745.0, 1183.0, 800.0, 545.0, 401.0, 258.0, 191.0, 118.0, 78.0, 47.0, 37.0, 27.0, 14.0, 9.0, 6.0, 0.0, 4.0, 0.0, 2.0, 2.0], "bins": [-0.33544921875, -0.3254508972167969, -0.31545257568359375, -0.3054542541503906, -0.2954559326171875, -0.2854576110839844, -0.27545928955078125, -0.2654609680175781, -0.255462646484375, -0.24546432495117188, -0.23546600341796875, -0.22546768188476562, -0.2154693603515625, -0.20547103881835938, -0.19547271728515625, -0.18547439575195312, -0.17547607421875, -0.16547775268554688, -0.15547943115234375, -0.14548110961914062, -0.1354827880859375, -0.12548446655273438, -0.11548614501953125, -0.10548782348632812, -0.095489501953125, -0.08549118041992188, -0.07549285888671875, -0.06549453735351562, -0.0554962158203125, -0.045497894287109375, -0.03549957275390625, -0.025501251220703125, -0.0155029296875, -0.005504608154296875, 0.00449371337890625, 0.014492034912109375, 0.0244903564453125, 0.034488677978515625, 0.04448699951171875, 0.054485321044921875, 0.064483642578125, 0.07448196411132812, 0.08448028564453125, 0.09447860717773438, 0.1044769287109375, 0.11447525024414062, 0.12447357177734375, 0.13447189331054688, 0.14447021484375, 0.15446853637695312, 0.16446685791015625, 0.17446517944335938, 0.1844635009765625, 0.19446182250976562, 0.20446014404296875, 0.21445846557617188, 0.224456787109375, 0.23445510864257812, 0.24445343017578125, 0.2544517517089844, 0.2644500732421875, 0.2744483947753906, 0.28444671630859375, 0.2944450378417969, 0.304443359375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 8.0, 5.0, 8.0, 9.0, 12.0, 22.0, 18.0, 17.0, 30.0, 46.0, 44.0, 62.0, 56.0, 57.0, 45.0, 59.0, 75.0, 57.0, 45.0, 44.0, 38.0, 44.0, 44.0, 34.0, 32.0, 23.0, 17.0, 4.0, 10.0, 5.0, 6.0, 2.0, 7.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00025653839111328125, -0.00024934113025665283, -0.00024214386940002441, -0.000234946608543396, -0.00022774934768676758, -0.00022055208683013916, -0.00021335482597351074, -0.00020615756511688232, -0.0001989603042602539, -0.0001917630434036255, -0.00018456578254699707, -0.00017736852169036865, -0.00017017126083374023, -0.00016297399997711182, -0.0001557767391204834, -0.00014857947826385498, -0.00014138221740722656, -0.00013418495655059814, -0.00012698769569396973, -0.00011979043483734131, -0.00011259317398071289, -0.00010539591312408447, -9.819865226745605e-05, -9.100139141082764e-05, -8.380413055419922e-05, -7.66068696975708e-05, -6.940960884094238e-05, -6.221234798431396e-05, -5.501508712768555e-05, -4.781782627105713e-05, -4.062056541442871e-05, -3.342330455780029e-05, -2.6226043701171875e-05, -1.9028782844543457e-05, -1.1831521987915039e-05, -4.634261131286621e-06, 2.562999725341797e-06, 9.760260581970215e-06, 1.6957521438598633e-05, 2.415478229522705e-05, 3.135204315185547e-05, 3.854930400848389e-05, 4.5746564865112305e-05, 5.294382572174072e-05, 6.014108657836914e-05, 6.733834743499756e-05, 7.453560829162598e-05, 8.17328691482544e-05, 8.893013000488281e-05, 9.612739086151123e-05, 0.00010332465171813965, 0.00011052191257476807, 0.00011771917343139648, 0.0001249164342880249, 0.00013211369514465332, 0.00013931095600128174, 0.00014650821685791016, 0.00015370547771453857, 0.000160902738571167, 0.0001680999994277954, 0.00017529726028442383, 0.00018249452114105225, 0.00018969178199768066, 0.00019688904285430908, 0.0002040863037109375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 2.0, 4.0, 8.0, 10.0, 7.0, 14.0, 18.0, 19.0, 36.0, 56.0, 56.0, 76.0, 97.0, 162.0, 245.0, 448.0, 727.0, 5406.0, 984683.0, 54058.0, 986.0, 477.0, 336.0, 191.0, 108.0, 93.0, 63.0, 41.0, 30.0, 17.0, 17.0, 15.0, 14.0, 8.0, 6.0, 3.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0036182403564453125, -0.003487497568130493, -0.003356754779815674, -0.0032260119915008545, -0.003095269203186035, -0.002964526414871216, -0.0028337836265563965, -0.002703040838241577, -0.002572298049926758, -0.0024415552616119385, -0.002310812473297119, -0.0021800696849823, -0.0020493268966674805, -0.0019185841083526611, -0.0017878413200378418, -0.0016570985317230225, -0.0015263557434082031, -0.0013956129550933838, -0.0012648701667785645, -0.0011341273784637451, -0.0010033845901489258, -0.0008726418018341064, -0.0007418990135192871, -0.0006111562252044678, -0.00048041343688964844, -0.0003496706485748291, -0.00021892786026000977, -8.818507194519043e-05, 4.2557716369628906e-05, 0.00017330050468444824, 0.0003040432929992676, 0.0004347860813140869, 0.0005655288696289062, 0.0006962716579437256, 0.0008270144462585449, 0.0009577572345733643, 0.0010885000228881836, 0.001219242811203003, 0.0013499855995178223, 0.0014807283878326416, 0.001611471176147461, 0.0017422139644622803, 0.0018729567527770996, 0.002003699541091919, 0.0021344423294067383, 0.0022651851177215576, 0.002395927906036377, 0.0025266706943511963, 0.0026574134826660156, 0.002788156270980835, 0.0029188990592956543, 0.0030496418476104736, 0.003180384635925293, 0.0033111274242401123, 0.0034418702125549316, 0.003572613000869751, 0.0037033557891845703, 0.0038340985774993896, 0.003964841365814209, 0.004095584154129028, 0.004226326942443848, 0.004357069730758667, 0.004487812519073486, 0.004618555307388306, 0.004749298095703125]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 7.0, 16.0, 60.0, 96.0, 145.0, 174.0, 171.0, 154.0, 101.0, 49.0, 18.0, 10.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00023732439149171114, -0.00022992145386524498, -0.00022251851623877883, -0.00021511557861231267, -0.00020771264098584652, -0.00020030970335938036, -0.0001929067657329142, -0.00018550382810644805, -0.0001781008904799819, -0.00017069795285351574, -0.0001632950152270496, -0.00015589207760058343, -0.00014848913997411728, -0.00014108620234765112, -0.00013368326472118497, -0.00012628032709471881, -0.00011887740402016789, -0.00011147446639370173, -0.00010407152876723558, -9.666859114076942e-05, -8.926565351430327e-05, -8.186271588783711e-05, -7.445978553732857e-05, -6.705684791086242e-05, -5.965391028439626e-05, -5.2250972657930106e-05, -4.484803503146395e-05, -3.74451010429766e-05, -3.0042163416510448e-05, -2.2639225790044293e-05, -1.5236291801556945e-05, -7.83335417509079e-06, -4.304311005398631e-07, 6.97250561643159e-06, 1.4375442333403043e-05, 2.1778378140879795e-05, 2.918131576734595e-05, 3.6584253393812105e-05, 4.398718738229945e-05, 5.139012500876561e-05, 5.879306263523176e-05, 6.619600026169792e-05, 7.359893788816407e-05, 8.100186823867261e-05, 8.840480586513877e-05, 9.580774349160492e-05, 0.00010321068111807108, 0.00011061361874453723, 0.00011801655637100339, 0.00012541949399746954, 0.0001328224316239357, 0.00014022536925040185, 0.000147628306876868, 0.00015503124450333416, 0.00016243418212980032, 0.00016983711975626647, 0.00017724005738273263, 0.00018464299500919878, 0.00019204593263566494, 0.0001994488702621311, 0.00020685180788859725, 0.0002142547455150634, 0.00022165768314152956, 0.00022906062076799572, 0.00023646354384254664]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 5.0, 7.0, 9.0, 7.0, 15.0, 14.0, 18.0, 17.0, 25.0, 23.0, 18.0, 15.0, 24.0, 32.0, 28.0, 32.0, 44.0, 39.0, 42.0, 40.0, 40.0, 40.0, 42.0, 41.0, 35.0, 34.0, 38.0, 38.0, 21.0, 26.0, 27.0, 22.0, 24.0, 15.0, 14.0, 24.0, 12.0, 9.0, 12.0, 7.0, 6.0, 6.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.00011795759201049805, -0.0001145070418715477, -0.00011105649173259735, -0.000107605941593647, -0.00010415539145469666, -0.00010070484131574631, -9.725429117679596e-05, -9.380374103784561e-05, -9.035319089889526e-05, -8.690264075994492e-05, -8.345209062099457e-05, -8.000154048204422e-05, -7.655099034309387e-05, -7.310044020414352e-05, -6.964989006519318e-05, -6.619933992624283e-05, -6.274878978729248e-05, -5.929823964834213e-05, -5.5847689509391785e-05, -5.239713937044144e-05, -4.894658923149109e-05, -4.549603909254074e-05, -4.204548895359039e-05, -3.8594938814640045e-05, -3.51443886756897e-05, -3.169383853673935e-05, -2.8243288397789e-05, -2.4792738258838654e-05, -2.1342188119888306e-05, -1.7891637980937958e-05, -1.444108784198761e-05, -1.0990537703037262e-05, -7.539987564086914e-06, -4.089437425136566e-06, -6.388872861862183e-07, 2.8116628527641296e-06, 6.2622129917144775e-06, 9.712763130664825e-06, 1.3163313269615173e-05, 1.661386340856552e-05, 2.006441354751587e-05, 2.3514963686466217e-05, 2.6965513825416565e-05, 3.0416063964366913e-05, 3.386661410331726e-05, 3.731716424226761e-05, 4.0767714381217957e-05, 4.4218264520168304e-05, 4.766881465911865e-05, 5.1119364798069e-05, 5.456991493701935e-05, 5.8020465075969696e-05, 6.147101521492004e-05, 6.492156535387039e-05, 6.837211549282074e-05, 7.182266563177109e-05, 7.527321577072144e-05, 7.872376590967178e-05, 8.217431604862213e-05, 8.562486618757248e-05, 8.907541632652283e-05, 9.252596646547318e-05, 9.597651660442352e-05, 9.942706674337387e-05, 0.00010287761688232422]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 1.0, 5.0, 4.0, 7.0, 7.0, 10.0, 15.0, 8.0, 5.0, 8.0, 15.0, 19.0, 21.0, 22.0, 33.0, 20.0, 27.0, 33.0, 26.0, 45.0, 44.0, 44.0, 38.0, 32.0, 44.0, 39.0, 38.0, 38.0, 40.0, 43.0, 31.0, 31.0, 38.0, 25.0, 23.0, 25.0, 8.0, 12.0, 16.0, 13.0, 13.0, 6.0, 8.0, 5.0, 7.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7421875, -1.6841278076171875, -1.626068115234375, -1.5680084228515625, -1.50994873046875, -1.4518890380859375, -1.393829345703125, -1.3357696533203125, -1.2777099609375, -1.2196502685546875, -1.161590576171875, -1.1035308837890625, -1.04547119140625, -0.9874114990234375, -0.929351806640625, -0.8712921142578125, -0.813232421875, -0.7551727294921875, -0.697113037109375, -0.6390533447265625, -0.58099365234375, -0.5229339599609375, -0.464874267578125, -0.4068145751953125, -0.3487548828125, -0.2906951904296875, -0.232635498046875, -0.1745758056640625, -0.11651611328125, -0.0584564208984375, -0.000396728515625, 0.0576629638671875, 0.11572265625, 0.1737823486328125, 0.231842041015625, 0.2899017333984375, 0.34796142578125, 0.4060211181640625, 0.464080810546875, 0.5221405029296875, 0.5802001953125, 0.6382598876953125, 0.696319580078125, 0.7543792724609375, 0.81243896484375, 0.8704986572265625, 0.928558349609375, 0.9866180419921875, 1.044677734375, 1.1027374267578125, 1.160797119140625, 1.2188568115234375, 1.27691650390625, 1.3349761962890625, 1.393035888671875, 1.4510955810546875, 1.5091552734375, 1.5672149658203125, 1.625274658203125, 1.6833343505859375, 1.74139404296875, 1.7994537353515625, 1.857513427734375, 1.9155731201171875, 1.9736328125]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 2.0, 3.0, 8.0, 4.0, 7.0, 4.0, 16.0, 13.0, 16.0, 21.0, 41.0, 59.0, 89.0, 108.0, 191.0, 292.0, 566.0, 854.0, 1601.0, 2894.0, 5706.0, 11125.0, 24271.0, 59467.0, 170982.0, 382467.0, 242565.0, 83470.0, 31876.0, 14371.0, 7031.0, 3684.0, 2058.0, 1082.0, 629.0, 342.0, 195.0, 119.0, 90.0, 80.0, 45.0, 33.0, 21.0, 20.0, 9.0, 12.0, 4.0, 4.0, 8.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0], "bins": [-2.2265625, -2.15625, -2.0859375, -2.015625, -1.9453125, -1.875, -1.8046875, -1.734375, -1.6640625, -1.59375, -1.5234375, -1.453125, -1.3828125, -1.3125, -1.2421875, -1.171875, -1.1015625, -1.03125, -0.9609375, -0.890625, -0.8203125, -0.75, -0.6796875, -0.609375, -0.5390625, -0.46875, -0.3984375, -0.328125, -0.2578125, -0.1875, -0.1171875, -0.046875, 0.0234375, 0.09375, 0.1640625, 0.234375, 0.3046875, 0.375, 0.4453125, 0.515625, 0.5859375, 0.65625, 0.7265625, 0.796875, 0.8671875, 0.9375, 1.0078125, 1.078125, 1.1484375, 1.21875, 1.2890625, 1.359375, 1.4296875, 1.5, 1.5703125, 1.640625, 1.7109375, 1.78125, 1.8515625, 1.921875, 1.9921875, 2.0625, 2.1328125, 2.203125, 2.2734375]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 7.0, 4.0, 9.0, 9.0, 10.0, 14.0, 17.0, 16.0, 25.0, 20.0, 35.0, 38.0, 34.0, 40.0, 62.0, 58.0, 68.0, 147.0, 324.0, 1398.0, 180.0, 88.0, 72.0, 55.0, 49.0, 29.0, 42.0, 31.0, 23.0, 31.0, 20.0, 18.0, 14.0, 13.0, 5.0, 8.0, 6.0, 5.0, 5.0, 6.0, 0.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.44140625, -7.2021484375, -6.962890625, -6.7236328125, -6.484375, -6.2451171875, -6.005859375, -5.7666015625, -5.52734375, -5.2880859375, -5.048828125, -4.8095703125, -4.5703125, -4.3310546875, -4.091796875, -3.8525390625, -3.61328125, -3.3740234375, -3.134765625, -2.8955078125, -2.65625, -2.4169921875, -2.177734375, -1.9384765625, -1.69921875, -1.4599609375, -1.220703125, -0.9814453125, -0.7421875, -0.5029296875, -0.263671875, -0.0244140625, 0.21484375, 0.4541015625, 0.693359375, 0.9326171875, 1.171875, 1.4111328125, 1.650390625, 1.8896484375, 2.12890625, 2.3681640625, 2.607421875, 2.8466796875, 3.0859375, 3.3251953125, 3.564453125, 3.8037109375, 4.04296875, 4.2822265625, 4.521484375, 4.7607421875, 5.0, 5.2392578125, 5.478515625, 5.7177734375, 5.95703125, 6.1962890625, 6.435546875, 6.6748046875, 6.9140625, 7.1533203125, 7.392578125, 7.6318359375, 7.87109375]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 6.0, 2.0, 7.0, 17.0, 31.0, 39.0, 60.0, 108.0, 201.0, 422.0, 1783.0, 2646260.0, 494612.0, 1340.0, 364.0, 170.0, 105.0, 58.0, 37.0, 30.0, 12.0, 17.0, 10.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-47.90625, -46.736083984375, -45.56591796875, -44.395751953125, -43.2255859375, -42.055419921875, -40.88525390625, -39.715087890625, -38.544921875, -37.374755859375, -36.20458984375, -35.034423828125, -33.8642578125, -32.694091796875, -31.52392578125, -30.353759765625, -29.18359375, -28.013427734375, -26.84326171875, -25.673095703125, -24.5029296875, -23.332763671875, -22.16259765625, -20.992431640625, -19.822265625, -18.652099609375, -17.48193359375, -16.311767578125, -15.1416015625, -13.971435546875, -12.80126953125, -11.631103515625, -10.4609375, -9.290771484375, -8.12060546875, -6.950439453125, -5.7802734375, -4.610107421875, -3.43994140625, -2.269775390625, -1.099609375, 0.070556640625, 1.24072265625, 2.410888671875, 3.5810546875, 4.751220703125, 5.92138671875, 7.091552734375, 8.26171875, 9.431884765625, 10.60205078125, 11.772216796875, 12.9423828125, 14.112548828125, 15.28271484375, 16.452880859375, 17.623046875, 18.793212890625, 19.96337890625, 21.133544921875, 22.3037109375, 23.473876953125, 24.64404296875, 25.814208984375, 26.984375]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [796.0, 218.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.200349807739258, 0.8117284774780273, 5.8238067626953125, 10.835885047912598, 15.847963333129883, 20.86004066467285, 25.872119903564453, 30.884199142456055, 35.896278381347656, 40.908355712890625, 45.920433044433594, 50.93251419067383, 55.9445915222168, 60.956668853759766, 65.96875, 70.98082733154297, 75.99290466308594, 81.0049819946289, 86.01705932617188, 91.02913665771484, 96.04121398925781, 101.05329895019531, 106.06537628173828, 111.07745361328125, 116.08953094482422, 121.10160827636719, 126.11368560791016, 131.12576293945312, 136.13784790039062, 141.14991760253906, 146.16200256347656, 151.174072265625, 156.1861572265625, 161.1982421875, 166.21031188964844, 171.22239685058594, 176.23446655273438, 181.24655151367188, 186.2586212158203, 191.2707061767578, 196.28277587890625, 201.29486083984375, 206.3069305419922, 211.3190155029297, 216.33108520507812, 221.34317016601562, 226.35523986816406, 231.36732482910156, 236.37940979003906, 241.39149475097656, 246.403564453125, 251.4156494140625, 256.427734375, 261.4397888183594, 266.4518737792969, 271.4639587402344, 276.4760437011719, 281.4881286621094, 286.5002136230469, 291.51226806640625, 296.52435302734375, 301.53643798828125, 306.54852294921875, 311.56060791015625, 316.5726623535156]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 4.0, 5.0, 6.0, 2.0, 4.0, 13.0, 11.0, 13.0, 18.0, 11.0, 15.0, 22.0, 25.0, 28.0, 22.0, 36.0, 37.0, 30.0, 39.0, 29.0, 39.0, 41.0, 39.0, 37.0, 35.0, 36.0, 33.0, 43.0, 38.0, 30.0, 34.0, 31.0, 24.0, 22.0, 24.0, 18.0, 17.0, 14.0, 12.0, 14.0, 12.0, 2.0, 11.0, 9.0, 4.0, 6.0, 3.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-18.929765701293945, -18.370332717895508, -17.81089973449707, -17.25146484375, -16.692031860351562, -16.132598876953125, -15.573165893554688, -15.01373291015625, -14.454298973083496, -13.894865989685059, -13.335432052612305, -12.775999069213867, -12.21656608581543, -11.657132148742676, -11.097699165344238, -10.538265228271484, -9.978832244873047, -9.41939926147461, -8.859965324401855, -8.300532341003418, -7.741098880767822, -7.181665420532227, -6.622232437133789, -6.062798976898193, -5.503365516662598, -4.943932056427002, -4.384498596191406, -3.8250656127929688, -3.265632152557373, -2.7061986923217773, -2.1467654705047607, -1.5873322486877441, -1.0278987884521484, -0.4684654474258423, 0.09096789360046387, 0.65040123462677, 1.2098345756530762, 1.7692680358886719, 2.3287012577056885, 2.888134479522705, 3.447567939758301, 4.0070013999938965, 4.566434860229492, 5.12586784362793, 5.685301303863525, 6.244734764099121, 6.804167747497559, 7.363601207733154, 7.92303466796875, 8.482467651367188, 9.041901588439941, 9.601334571838379, 10.160768508911133, 10.72020149230957, 11.279634475708008, 11.839067459106445, 12.3985013961792, 12.957934379577637, 13.51736831665039, 14.076801300048828, 14.636234283447266, 15.19566822052002, 15.755101203918457, 16.31453514099121, 16.87396812438965]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 3.0, 3.0, 2.0, 3.0, 4.0, 4.0, 6.0, 6.0, 12.0, 13.0, 11.0, 13.0, 14.0, 20.0, 12.0, 31.0, 16.0, 26.0, 24.0, 29.0, 28.0, 34.0, 45.0, 35.0, 38.0, 30.0, 37.0, 39.0, 46.0, 32.0, 36.0, 48.0, 38.0, 34.0, 32.0, 27.0, 34.0, 18.0, 20.0, 19.0, 18.0, 8.0, 12.0, 13.0, 9.0, 4.0, 7.0, 2.0, 5.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8095703125, -1.7487945556640625, -1.688018798828125, -1.6272430419921875, -1.56646728515625, -1.5056915283203125, -1.444915771484375, -1.3841400146484375, -1.3233642578125, -1.2625885009765625, -1.201812744140625, -1.1410369873046875, -1.08026123046875, -1.0194854736328125, -0.958709716796875, -0.8979339599609375, -0.837158203125, -0.7763824462890625, -0.715606689453125, -0.6548309326171875, -0.59405517578125, -0.5332794189453125, -0.472503662109375, -0.4117279052734375, -0.3509521484375, -0.2901763916015625, -0.229400634765625, -0.1686248779296875, -0.10784912109375, -0.0470733642578125, 0.013702392578125, 0.0744781494140625, 0.13525390625, 0.1960296630859375, 0.256805419921875, 0.3175811767578125, 0.37835693359375, 0.4391326904296875, 0.499908447265625, 0.5606842041015625, 0.6214599609375, 0.6822357177734375, 0.743011474609375, 0.8037872314453125, 0.86456298828125, 0.9253387451171875, 0.986114501953125, 1.0468902587890625, 1.107666015625, 1.1684417724609375, 1.229217529296875, 1.2899932861328125, 1.35076904296875, 1.4115447998046875, 1.472320556640625, 1.5330963134765625, 1.5938720703125, 1.6546478271484375, 1.715423583984375, 1.7761993408203125, 1.83697509765625, 1.8977508544921875, 1.958526611328125, 2.0193023681640625, 2.080078125]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 4.0, 6.0, 0.0, 4.0, 15.0, 13.0, 13.0, 9.0, 17.0, 15.0, 18.0, 27.0, 40.0, 36.0, 47.0, 63.0, 84.0, 77.0, 112.0, 202.0, 393.0, 1331.0, 15589.0, 944079.0, 3130760.0, 96166.0, 3589.0, 620.0, 260.0, 145.0, 106.0, 96.0, 59.0, 54.0, 43.0, 30.0, 29.0, 16.0, 19.0, 23.0, 21.0, 13.0, 9.0, 10.0, 5.0, 3.0, 4.0, 2.0, 7.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.578125, -8.29443359375, -8.0107421875, -7.72705078125, -7.443359375, -7.15966796875, -6.8759765625, -6.59228515625, -6.30859375, -6.02490234375, -5.7412109375, -5.45751953125, -5.173828125, -4.89013671875, -4.6064453125, -4.32275390625, -4.0390625, -3.75537109375, -3.4716796875, -3.18798828125, -2.904296875, -2.62060546875, -2.3369140625, -2.05322265625, -1.76953125, -1.48583984375, -1.2021484375, -0.91845703125, -0.634765625, -0.35107421875, -0.0673828125, 0.21630859375, 0.5, 0.78369140625, 1.0673828125, 1.35107421875, 1.634765625, 1.91845703125, 2.2021484375, 2.48583984375, 2.76953125, 3.05322265625, 3.3369140625, 3.62060546875, 3.904296875, 4.18798828125, 4.4716796875, 4.75537109375, 5.0390625, 5.32275390625, 5.6064453125, 5.89013671875, 6.173828125, 6.45751953125, 6.7412109375, 7.02490234375, 7.30859375, 7.59228515625, 7.8759765625, 8.15966796875, 8.443359375, 8.72705078125, 9.0107421875, 9.29443359375, 9.578125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 9.0, 9.0, 19.0, 26.0, 28.0, 45.0, 56.0, 88.0, 122.0, 178.0, 239.0, 341.0, 414.0, 480.0, 468.0, 407.0, 320.0, 231.0, 172.0, 137.0, 84.0, 61.0, 39.0, 35.0, 15.0, 15.0, 12.0, 7.0, 5.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.84375, -5.67138671875, -5.4990234375, -5.32666015625, -5.154296875, -4.98193359375, -4.8095703125, -4.63720703125, -4.46484375, -4.29248046875, -4.1201171875, -3.94775390625, -3.775390625, -3.60302734375, -3.4306640625, -3.25830078125, -3.0859375, -2.91357421875, -2.7412109375, -2.56884765625, -2.396484375, -2.22412109375, -2.0517578125, -1.87939453125, -1.70703125, -1.53466796875, -1.3623046875, -1.18994140625, -1.017578125, -0.84521484375, -0.6728515625, -0.50048828125, -0.328125, -0.15576171875, 0.0166015625, 0.18896484375, 0.361328125, 0.53369140625, 0.7060546875, 0.87841796875, 1.05078125, 1.22314453125, 1.3955078125, 1.56787109375, 1.740234375, 1.91259765625, 2.0849609375, 2.25732421875, 2.4296875, 2.60205078125, 2.7744140625, 2.94677734375, 3.119140625, 3.29150390625, 3.4638671875, 3.63623046875, 3.80859375, 3.98095703125, 4.1533203125, 4.32568359375, 4.498046875, 4.67041015625, 4.8427734375, 5.01513671875, 5.1875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 5.0, 17.0, 12.0, 23.0, 34.0, 56.0, 76.0, 96.0, 115.0, 206.0, 277.0, 506.0, 1288.0, 9381.0, 457966.0, 3587997.0, 129679.0, 4420.0, 909.0, 412.0, 247.0, 154.0, 97.0, 83.0, 63.0, 53.0, 32.0, 23.0, 12.0, 10.0, 15.0, 4.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.78125, -13.3272705078125, -12.873291015625, -12.4193115234375, -11.96533203125, -11.5113525390625, -11.057373046875, -10.6033935546875, -10.1494140625, -9.6954345703125, -9.241455078125, -8.7874755859375, -8.33349609375, -7.8795166015625, -7.425537109375, -6.9715576171875, -6.517578125, -6.0635986328125, -5.609619140625, -5.1556396484375, -4.70166015625, -4.2476806640625, -3.793701171875, -3.3397216796875, -2.8857421875, -2.4317626953125, -1.977783203125, -1.5238037109375, -1.06982421875, -0.6158447265625, -0.161865234375, 0.2921142578125, 0.74609375, 1.2000732421875, 1.654052734375, 2.1080322265625, 2.56201171875, 3.0159912109375, 3.469970703125, 3.9239501953125, 4.3779296875, 4.8319091796875, 5.285888671875, 5.7398681640625, 6.19384765625, 6.6478271484375, 7.101806640625, 7.5557861328125, 8.009765625, 8.4637451171875, 8.917724609375, 9.3717041015625, 9.82568359375, 10.2796630859375, 10.733642578125, 11.1876220703125, 11.6416015625, 12.0955810546875, 12.549560546875, 13.0035400390625, 13.45751953125, 13.9114990234375, 14.365478515625, 14.8194580078125, 15.2734375]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 74.0, 564.0, 351.0, 24.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-207.5766143798828, -202.94308471679688, -198.30955505371094, -193.676025390625, -189.04251098632812, -184.4089813232422, -179.77545166015625, -175.1419219970703, -170.50839233398438, -165.87486267089844, -161.2413330078125, -156.60780334472656, -151.97427368164062, -147.34075927734375, -142.7072296142578, -138.07369995117188, -133.44017028808594, -128.806640625, -124.17311096191406, -119.53958892822266, -114.90605926513672, -110.27252960205078, -105.63900756835938, -101.00547790527344, -96.3719482421875, -91.73841857910156, -87.10488891601562, -82.47136688232422, -77.83783721923828, -73.20430755615234, -68.57078552246094, -63.937255859375, -59.30372619628906, -54.670196533203125, -50.03667068481445, -45.40314483642578, -40.769615173339844, -36.136085510253906, -31.502559661865234, -26.869033813476562, -22.235504150390625, -17.60197639465332, -12.968448638916016, -8.334920883178711, -3.7013931274414062, 0.9321346282958984, 5.565662384033203, 10.199188232421875, 14.832717895507812, 19.466245651245117, 24.099773406982422, 28.733301162719727, 33.36682891845703, 38.00035858154297, 42.63388442993164, 47.26741027832031, 51.90093994140625, 56.53446960449219, 61.16799545288086, 65.80152130126953, 70.43505096435547, 75.0685806274414, 79.70210266113281, 84.33563232421875, 88.96916198730469]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 12.0, 5.0, 8.0, 13.0, 17.0, 17.0, 11.0, 15.0, 16.0, 23.0, 28.0, 20.0, 26.0, 24.0, 38.0, 32.0, 40.0, 41.0, 45.0, 46.0, 43.0, 37.0, 38.0, 38.0, 38.0, 38.0, 42.0, 26.0, 27.0, 25.0, 22.0, 18.0, 27.0, 15.0, 11.0, 17.0, 12.0, 8.0, 11.0, 6.0, 6.0, 3.0, 3.0, 2.0, 3.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.296612739562988, -13.795836448669434, -13.295059204101562, -12.794282913208008, -12.293505668640137, -11.792729377746582, -11.291952133178711, -10.791175842285156, -10.290399551391602, -9.789623260498047, -9.288846015930176, -8.788069725036621, -8.28729248046875, -7.786516189575195, -7.285739421844482, -6.7849626541137695, -6.284185409545898, -5.7834086418151855, -5.282631874084473, -4.781855583190918, -4.281078338623047, -3.780301809310913, -3.2795252799987793, -2.7787485122680664, -2.2779717445373535, -1.7771949768066406, -1.2764183282852173, -0.775641679763794, -0.27486491203308105, 0.22591185569763184, 0.7266883850097656, 1.2274651527404785, 1.7282428741455078, 2.2290196418762207, 2.7297964096069336, 3.2305729389190674, 3.7313497066497803, 4.232126235961914, 4.732903003692627, 5.23367977142334, 5.734456539154053, 6.235233306884766, 6.7360100746154785, 7.236786842346191, 7.737563133239746, 8.238340377807617, 8.739116668701172, 9.239892959594727, 9.740670204162598, 10.241446495056152, 10.742223739624023, 11.243000030517578, 11.74377727508545, 12.244553565979004, 12.745330810546875, 13.24610710144043, 13.746883392333984, 14.247659683227539, 14.74843692779541, 15.249213218688965, 15.749990463256836, 16.25076675415039, 16.751543045043945, 17.2523193359375, 17.753097534179688]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 5.0, 3.0, 11.0, 10.0, 6.0, 5.0, 16.0, 13.0, 16.0, 17.0, 19.0, 24.0, 20.0, 24.0, 34.0, 32.0, 37.0, 44.0, 30.0, 29.0, 40.0, 53.0, 49.0, 33.0, 31.0, 62.0, 40.0, 31.0, 32.0, 34.0, 34.0, 19.0, 24.0, 21.0, 19.0, 16.0, 13.0, 11.0, 7.0, 7.0, 5.0, 6.0, 5.0, 2.0, 0.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.88671875, -1.821563720703125, -1.75640869140625, -1.691253662109375, -1.6260986328125, -1.560943603515625, -1.49578857421875, -1.430633544921875, -1.365478515625, -1.300323486328125, -1.23516845703125, -1.170013427734375, -1.1048583984375, -1.039703369140625, -0.97454833984375, -0.909393310546875, -0.84423828125, -0.779083251953125, -0.71392822265625, -0.648773193359375, -0.5836181640625, -0.518463134765625, -0.45330810546875, -0.388153076171875, -0.322998046875, -0.257843017578125, -0.19268798828125, -0.127532958984375, -0.0623779296875, 0.002777099609375, 0.06793212890625, 0.133087158203125, 0.1982421875, 0.263397216796875, 0.32855224609375, 0.393707275390625, 0.4588623046875, 0.524017333984375, 0.58917236328125, 0.654327392578125, 0.719482421875, 0.784637451171875, 0.84979248046875, 0.914947509765625, 0.9801025390625, 1.045257568359375, 1.11041259765625, 1.175567626953125, 1.24072265625, 1.305877685546875, 1.37103271484375, 1.436187744140625, 1.5013427734375, 1.566497802734375, 1.63165283203125, 1.696807861328125, 1.761962890625, 1.827117919921875, 1.89227294921875, 1.957427978515625, 2.0225830078125, 2.087738037109375, 2.15289306640625, 2.218048095703125, 2.283203125]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 3.0, 8.0, 14.0, 24.0, 28.0, 40.0, 51.0, 109.0, 144.0, 200.0, 320.0, 452.0, 694.0, 942.0, 1425.0, 2012.0, 3074.0, 4442.0, 6586.0, 10091.0, 15605.0, 24442.0, 40073.0, 69895.0, 134757.0, 296781.0, 199650.0, 95370.0, 52828.0, 31236.0, 19591.0, 12445.0, 8223.0, 5515.0, 3688.0, 2412.0, 1752.0, 1139.0, 781.0, 555.0, 342.0, 281.0, 172.0, 112.0, 86.0, 64.0, 33.0, 28.0, 11.0, 11.0, 9.0, 8.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.41845703125, -0.40605926513671875, -0.3936614990234375, -0.38126373291015625, -0.368865966796875, -0.35646820068359375, -0.3440704345703125, -0.33167266845703125, -0.31927490234375, -0.30687713623046875, -0.2944793701171875, -0.28208160400390625, -0.269683837890625, -0.25728607177734375, -0.2448883056640625, -0.23249053955078125, -0.2200927734375, -0.20769500732421875, -0.1952972412109375, -0.18289947509765625, -0.170501708984375, -0.15810394287109375, -0.1457061767578125, -0.13330841064453125, -0.12091064453125, -0.10851287841796875, -0.0961151123046875, -0.08371734619140625, -0.071319580078125, -0.05892181396484375, -0.0465240478515625, -0.03412628173828125, -0.021728515625, -0.00933074951171875, 0.0030670166015625, 0.01546478271484375, 0.027862548828125, 0.04026031494140625, 0.0526580810546875, 0.06505584716796875, 0.07745361328125, 0.08985137939453125, 0.1022491455078125, 0.11464691162109375, 0.127044677734375, 0.13944244384765625, 0.1518402099609375, 0.16423797607421875, 0.1766357421875, 0.18903350830078125, 0.2014312744140625, 0.21382904052734375, 0.226226806640625, 0.23862457275390625, 0.2510223388671875, 0.26342010498046875, 0.27581787109375, 0.28821563720703125, 0.3006134033203125, 0.31301116943359375, 0.325408935546875, 0.33780670166015625, 0.3502044677734375, 0.36260223388671875, 0.375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 8.0, 3.0, 4.0, 17.0, 13.0, 17.0, 16.0, 15.0, 16.0, 24.0, 43.0, 33.0, 30.0, 30.0, 37.0, 31.0, 43.0, 45.0, 39.0, 1064.0, 31.0, 45.0, 33.0, 38.0, 57.0, 27.0, 40.0, 30.0, 31.0, 27.0, 20.0, 24.0, 14.0, 11.0, 21.0, 6.0, 7.0, 6.0, 11.0, 2.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.318359375, -1.2742919921875, -1.230224609375, -1.1861572265625, -1.14208984375, -1.0980224609375, -1.053955078125, -1.0098876953125, -0.9658203125, -0.9217529296875, -0.877685546875, -0.8336181640625, -0.78955078125, -0.7454833984375, -0.701416015625, -0.6573486328125, -0.61328125, -0.5692138671875, -0.525146484375, -0.4810791015625, -0.43701171875, -0.3929443359375, -0.348876953125, -0.3048095703125, -0.2607421875, -0.2166748046875, -0.172607421875, -0.1285400390625, -0.08447265625, -0.0404052734375, 0.003662109375, 0.0477294921875, 0.091796875, 0.1358642578125, 0.179931640625, 0.2239990234375, 0.26806640625, 0.3121337890625, 0.356201171875, 0.4002685546875, 0.4443359375, 0.4884033203125, 0.532470703125, 0.5765380859375, 0.62060546875, 0.6646728515625, 0.708740234375, 0.7528076171875, 0.796875, 0.8409423828125, 0.885009765625, 0.9290771484375, 0.97314453125, 1.0172119140625, 1.061279296875, 1.1053466796875, 1.1494140625, 1.1934814453125, 1.237548828125, 1.2816162109375, 1.32568359375, 1.3697509765625, 1.413818359375, 1.4578857421875, 1.501953125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 14.0, 19.0, 26.0, 32.0, 55.0, 75.0, 117.0, 163.0, 267.0, 330.0, 553.0, 757.0, 1044.0, 1630.0, 2485.0, 3699.0, 5658.0, 8495.0, 13580.0, 21556.0, 35388.0, 60776.0, 109978.0, 229462.0, 1309848.0, 120548.0, 66201.0, 38956.0, 23437.0, 14610.0, 9330.0, 5975.0, 3916.0, 2671.0, 1770.0, 1231.0, 813.0, 520.0, 361.0, 255.0, 164.0, 117.0, 82.0, 60.0, 33.0, 28.0, 12.0, 11.0, 11.0, 4.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.361083984375, -0.3490791320800781, -0.33707427978515625, -0.3250694274902344, -0.3130645751953125, -0.3010597229003906, -0.28905487060546875, -0.2770500183105469, -0.265045166015625, -0.2530403137207031, -0.24103546142578125, -0.22903060913085938, -0.2170257568359375, -0.20502090454101562, -0.19301605224609375, -0.18101119995117188, -0.16900634765625, -0.15700149536132812, -0.14499664306640625, -0.13299179077148438, -0.1209869384765625, -0.10898208618164062, -0.09697723388671875, -0.08497238159179688, -0.072967529296875, -0.060962677001953125, -0.04895782470703125, -0.036952972412109375, -0.0249481201171875, -0.012943267822265625, -0.00093841552734375, 0.011066436767578125, 0.0230712890625, 0.035076141357421875, 0.04708099365234375, 0.059085845947265625, 0.0710906982421875, 0.08309555053710938, 0.09510040283203125, 0.10710525512695312, 0.119110107421875, 0.13111495971679688, 0.14311981201171875, 0.15512466430664062, 0.1671295166015625, 0.17913436889648438, 0.19113922119140625, 0.20314407348632812, 0.21514892578125, 0.22715377807617188, 0.23915863037109375, 0.2511634826660156, 0.2631683349609375, 0.2751731872558594, 0.28717803955078125, 0.2991828918457031, 0.311187744140625, 0.3231925964355469, 0.33519744873046875, 0.3472023010253906, 0.3592071533203125, 0.3712120056152344, 0.38321685791015625, 0.3952217102050781, 0.4072265625]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 2.0, 2.0, 6.0, 6.0, 5.0, 5.0, 6.0, 7.0, 15.0, 21.0, 23.0, 24.0, 23.0, 21.0, 30.0, 39.0, 45.0, 46.0, 49.0, 56.0, 55.0, 71.0, 44.0, 59.0, 42.0, 36.0, 42.0, 33.0, 30.0, 22.0, 25.0, 21.0, 16.0, 15.0, 14.0, 7.0, 8.0, 11.0, 6.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.00023508071899414062, -0.00022794120013713837, -0.0002208016812801361, -0.00021366216242313385, -0.0002065226435661316, -0.00019938312470912933, -0.00019224360585212708, -0.00018510408699512482, -0.00017796456813812256, -0.0001708250492811203, -0.00016368553042411804, -0.00015654601156711578, -0.00014940649271011353, -0.00014226697385311127, -0.000135127454996109, -0.00012798793613910675, -0.00012084841728210449, -0.00011370889842510223, -0.00010656937956809998, -9.942986071109772e-05, -9.229034185409546e-05, -8.51508229970932e-05, -7.801130414009094e-05, -7.087178528308868e-05, -6.373226642608643e-05, -5.659274756908417e-05, -4.945322871208191e-05, -4.231370985507965e-05, -3.517419099807739e-05, -2.8034672141075134e-05, -2.0895153284072876e-05, -1.3755634427070618e-05, -6.616115570068359e-06, 5.234032869338989e-07, 7.662922143936157e-06, 1.4802441000938416e-05, 2.1941959857940674e-05, 2.9081478714942932e-05, 3.622099757194519e-05, 4.336051642894745e-05, 5.050003528594971e-05, 5.7639554142951965e-05, 6.477907299995422e-05, 7.191859185695648e-05, 7.905811071395874e-05, 8.6197629570961e-05, 9.333714842796326e-05, 0.00010047666728496552, 0.00010761618614196777, 0.00011475570499897003, 0.00012189522385597229, 0.00012903474271297455, 0.0001361742615699768, 0.00014331378042697906, 0.00015045329928398132, 0.00015759281814098358, 0.00016473233699798584, 0.0001718718558549881, 0.00017901137471199036, 0.00018615089356899261, 0.00019329041242599487, 0.00020042993128299713, 0.0002075694501399994, 0.00021470896899700165, 0.0002218484878540039]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 8.0, 7.0, 16.0, 12.0, 25.0, 19.0, 28.0, 41.0, 52.0, 81.0, 99.0, 133.0, 224.0, 350.0, 603.0, 1453.0, 307681.0, 733709.0, 2137.0, 673.0, 385.0, 247.0, 172.0, 106.0, 68.0, 57.0, 46.0, 35.0, 22.0, 13.0, 10.0, 11.0, 12.0, 2.0, 2.0, 4.0, 4.0, 1.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004329681396484375, -0.004185795783996582, -0.004041910171508789, -0.003898024559020996, -0.003754138946533203, -0.00361025333404541, -0.003466367721557617, -0.0033224821090698242, -0.0031785964965820312, -0.0030347108840942383, -0.0028908252716064453, -0.0027469396591186523, -0.0026030540466308594, -0.0024591684341430664, -0.0023152828216552734, -0.0021713972091674805, -0.0020275115966796875, -0.0018836259841918945, -0.0017397403717041016, -0.0015958547592163086, -0.0014519691467285156, -0.0013080835342407227, -0.0011641979217529297, -0.0010203123092651367, -0.0008764266967773438, -0.0007325410842895508, -0.0005886554718017578, -0.00044476985931396484, -0.0003008842468261719, -0.0001569986343383789, -1.3113021850585938e-05, 0.00013077259063720703, 0.000274658203125, 0.00041854381561279297, 0.0005624294281005859, 0.0007063150405883789, 0.0008502006530761719, 0.0009940862655639648, 0.0011379718780517578, 0.0012818574905395508, 0.0014257431030273438, 0.0015696287155151367, 0.0017135143280029297, 0.0018573999404907227, 0.0020012855529785156, 0.0021451711654663086, 0.0022890567779541016, 0.0024329423904418945, 0.0025768280029296875, 0.0027207136154174805, 0.0028645992279052734, 0.0030084848403930664, 0.0031523704528808594, 0.0032962560653686523, 0.0034401416778564453, 0.0035840272903442383, 0.0037279129028320312, 0.0038717985153198242, 0.004015684127807617, 0.00415956974029541, 0.004303455352783203, 0.004447340965270996, 0.004591226577758789, 0.004735112190246582, 0.004878997802734375]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 10.0, 29.0, 69.0, 129.0, 166.0, 217.0, 169.0, 114.0, 68.0, 24.0, 14.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002702518249861896, -0.00026107270969077945, -0.0002518935943953693, -0.00024271449365187436, -0.00023353539290837944, -0.00022435627761296928, -0.00021517716231755912, -0.00020599804702214897, -0.00019681894627865404, -0.00018763983098324388, -0.00017846073023974895, -0.0001692816149443388, -0.00016010249964892864, -0.00015092339890543371, -0.00014174428361002356, -0.00013256518286652863, -0.00012338606757111847, -0.00011420695955166593, -0.00010502785153221339, -9.584873623680323e-05, -8.666962821735069e-05, -7.749052019789815e-05, -6.8311404902488e-05, -5.913229688303545e-05, -4.995318886358291e-05, -4.077408084413037e-05, -3.159496918669902e-05, -2.2415859348257072e-05, -1.3236749509815127e-05, -4.057641490362585e-06, 5.1214701670687646e-06, 1.4300581824500114e-05, 2.3479689843952656e-05, 3.26587978634052e-05, 4.183790952083655e-05, 5.1017021178267896e-05, 6.019612919772044e-05, 6.937523721717298e-05, 7.855435251258314e-05, 8.773346053203568e-05, 9.691256855148822e-05, 0.00010609167657094076, 0.0001152707845903933, 0.00012444989988580346, 0.00013362901518121362, 0.00014280811592470855, 0.0001519872312201187, 0.00016116633196361363, 0.00017034544725902379, 0.00017952456255443394, 0.00018870366329792887, 0.00019788277859333903, 0.00020706187933683395, 0.0002162409946322441, 0.00022542010992765427, 0.00023459922522306442, 0.00024377832596655935, 0.0002529574267100543, 0.00026213654200546443, 0.0002713156573008746, 0.00028049477259628475, 0.00028967385878786445, 0.0002988529740832746, 0.00030803208937868476, 0.0003172112046740949]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 6.0, 6.0, 3.0, 8.0, 3.0, 4.0, 13.0, 5.0, 7.0, 14.0, 21.0, 26.0, 8.0, 19.0, 20.0, 27.0, 19.0, 32.0, 21.0, 28.0, 21.0, 37.0, 42.0, 34.0, 35.0, 39.0, 40.0, 35.0, 32.0, 32.0, 42.0, 37.0, 34.0, 22.0, 27.0, 27.0, 10.0, 23.0, 21.0, 19.0, 21.0, 15.0, 8.0, 11.0, 15.0, 11.0, 4.0, 3.0, 7.0, 7.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.00011897087097167969, -0.0001154458150267601, -0.00011192075908184052, -0.00010839570313692093, -0.00010487064719200134, -0.00010134559124708176, -9.782053530216217e-05, -9.429547935724258e-05, -9.0770423412323e-05, -8.724536746740341e-05, -8.372031152248383e-05, -8.019525557756424e-05, -7.667019963264465e-05, -7.314514368772507e-05, -6.962008774280548e-05, -6.60950317978859e-05, -6.256997585296631e-05, -5.904491990804672e-05, -5.5519863963127136e-05, -5.199480801820755e-05, -4.8469752073287964e-05, -4.494469612836838e-05, -4.141964018344879e-05, -3.7894584238529205e-05, -3.436952829360962e-05, -3.084447234869003e-05, -2.7319416403770447e-05, -2.379436045885086e-05, -2.0269304513931274e-05, -1.6744248569011688e-05, -1.3219192624092102e-05, -9.694136679172516e-06, -6.16908073425293e-06, -2.6440247893333435e-06, 8.810311555862427e-07, 4.406087100505829e-06, 7.931143045425415e-06, 1.1456198990345001e-05, 1.4981254935264587e-05, 1.8506310880184174e-05, 2.203136682510376e-05, 2.5556422770023346e-05, 2.9081478714942932e-05, 3.260653465986252e-05, 3.6131590604782104e-05, 3.965664654970169e-05, 4.318170249462128e-05, 4.670675843954086e-05, 5.023181438446045e-05, 5.3756870329380035e-05, 5.728192627429962e-05, 6.080698221921921e-05, 6.43320381641388e-05, 6.785709410905838e-05, 7.138215005397797e-05, 7.490720599889755e-05, 7.843226194381714e-05, 8.195731788873672e-05, 8.548237383365631e-05, 8.90074297785759e-05, 9.253248572349548e-05, 9.605754166841507e-05, 9.958259761333466e-05, 0.00010310765355825424, 0.00010663270950317383]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 5.0, 3.0, 11.0, 10.0, 6.0, 5.0, 16.0, 13.0, 16.0, 17.0, 19.0, 24.0, 20.0, 24.0, 34.0, 32.0, 37.0, 44.0, 30.0, 29.0, 40.0, 53.0, 49.0, 33.0, 31.0, 62.0, 40.0, 31.0, 32.0, 34.0, 34.0, 19.0, 24.0, 21.0, 19.0, 16.0, 13.0, 11.0, 7.0, 7.0, 5.0, 6.0, 5.0, 2.0, 0.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.88671875, -1.821563720703125, -1.75640869140625, -1.691253662109375, -1.6260986328125, -1.560943603515625, -1.49578857421875, -1.430633544921875, -1.365478515625, -1.300323486328125, -1.23516845703125, -1.170013427734375, -1.1048583984375, -1.039703369140625, -0.97454833984375, -0.909393310546875, -0.84423828125, -0.779083251953125, -0.71392822265625, -0.648773193359375, -0.5836181640625, -0.518463134765625, -0.45330810546875, -0.388153076171875, -0.322998046875, -0.257843017578125, -0.19268798828125, -0.127532958984375, -0.0623779296875, 0.002777099609375, 0.06793212890625, 0.133087158203125, 0.1982421875, 0.263397216796875, 0.32855224609375, 0.393707275390625, 0.4588623046875, 0.524017333984375, 0.58917236328125, 0.654327392578125, 0.719482421875, 0.784637451171875, 0.84979248046875, 0.914947509765625, 0.9801025390625, 1.045257568359375, 1.11041259765625, 1.175567626953125, 1.24072265625, 1.305877685546875, 1.37103271484375, 1.436187744140625, 1.5013427734375, 1.566497802734375, 1.63165283203125, 1.696807861328125, 1.761962890625, 1.827117919921875, 1.89227294921875, 1.957427978515625, 2.0225830078125, 2.087738037109375, 2.15289306640625, 2.218048095703125, 2.283203125]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 6.0, 4.0, 5.0, 6.0, 16.0, 12.0, 12.0, 19.0, 32.0, 58.0, 77.0, 110.0, 184.0, 276.0, 443.0, 773.0, 1291.0, 2583.0, 4604.0, 8163.0, 14784.0, 26778.0, 48868.0, 97813.0, 218782.0, 302176.0, 160426.0, 73923.0, 38330.0, 21185.0, 11916.0, 6485.0, 3614.0, 1970.0, 1077.0, 633.0, 382.0, 229.0, 151.0, 112.0, 64.0, 45.0, 36.0, 28.0, 15.0, 17.0, 14.0, 4.0, 7.0, 7.0, 3.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-1.7490234375, -1.69488525390625, -1.6407470703125, -1.58660888671875, -1.532470703125, -1.47833251953125, -1.4241943359375, -1.37005615234375, -1.31591796875, -1.26177978515625, -1.2076416015625, -1.15350341796875, -1.099365234375, -1.04522705078125, -0.9910888671875, -0.93695068359375, -0.8828125, -0.82867431640625, -0.7745361328125, -0.72039794921875, -0.666259765625, -0.61212158203125, -0.5579833984375, -0.50384521484375, -0.44970703125, -0.39556884765625, -0.3414306640625, -0.28729248046875, -0.233154296875, -0.17901611328125, -0.1248779296875, -0.07073974609375, -0.0166015625, 0.03753662109375, 0.0916748046875, 0.14581298828125, 0.199951171875, 0.25408935546875, 0.3082275390625, 0.36236572265625, 0.41650390625, 0.47064208984375, 0.5247802734375, 0.57891845703125, 0.633056640625, 0.68719482421875, 0.7413330078125, 0.79547119140625, 0.849609375, 0.90374755859375, 0.9578857421875, 1.01202392578125, 1.066162109375, 1.12030029296875, 1.1744384765625, 1.22857666015625, 1.28271484375, 1.33685302734375, 1.3909912109375, 1.44512939453125, 1.499267578125, 1.55340576171875, 1.6075439453125, 1.66168212890625, 1.7158203125]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 3.0, 5.0, 9.0, 6.0, 7.0, 15.0, 16.0, 13.0, 19.0, 19.0, 24.0, 22.0, 32.0, 41.0, 39.0, 35.0, 41.0, 55.0, 65.0, 147.0, 363.0, 1406.0, 174.0, 69.0, 52.0, 48.0, 38.0, 41.0, 39.0, 26.0, 26.0, 21.0, 22.0, 20.0, 16.0, 13.0, 11.0, 8.0, 9.0, 9.0, 7.0, 6.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-8.7578125, -8.50787353515625, -8.2579345703125, -8.00799560546875, -7.758056640625, -7.50811767578125, -7.2581787109375, -7.00823974609375, -6.75830078125, -6.50836181640625, -6.2584228515625, -6.00848388671875, -5.758544921875, -5.50860595703125, -5.2586669921875, -5.00872802734375, -4.7587890625, -4.50885009765625, -4.2589111328125, -4.00897216796875, -3.759033203125, -3.50909423828125, -3.2591552734375, -3.00921630859375, -2.75927734375, -2.50933837890625, -2.2593994140625, -2.00946044921875, -1.759521484375, -1.50958251953125, -1.2596435546875, -1.00970458984375, -0.759765625, -0.50982666015625, -0.2598876953125, -0.00994873046875, 0.239990234375, 0.48992919921875, 0.7398681640625, 0.98980712890625, 1.23974609375, 1.48968505859375, 1.7396240234375, 1.98956298828125, 2.239501953125, 2.48944091796875, 2.7393798828125, 2.98931884765625, 3.2392578125, 3.48919677734375, 3.7391357421875, 3.98907470703125, 4.239013671875, 4.48895263671875, 4.7388916015625, 4.98883056640625, 5.23876953125, 5.48870849609375, 5.7386474609375, 5.98858642578125, 6.238525390625, 6.48846435546875, 6.7384033203125, 6.98834228515625, 7.23828125]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 3.0, 2.0, 8.0, 10.0, 5.0, 13.0, 13.0, 15.0, 17.0, 28.0, 33.0, 45.0, 69.0, 83.0, 125.0, 227.0, 397.0, 922.0, 11733.0, 3095074.0, 34483.0, 1208.0, 427.0, 229.0, 148.0, 87.0, 74.0, 44.0, 32.0, 29.0, 34.0, 14.0, 13.0, 8.0, 5.0, 9.0, 7.0, 4.0, 5.0, 3.0, 5.0, 0.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-28.59375, -27.716552734375, -26.83935546875, -25.962158203125, -25.0849609375, -24.207763671875, -23.33056640625, -22.453369140625, -21.576171875, -20.698974609375, -19.82177734375, -18.944580078125, -18.0673828125, -17.190185546875, -16.31298828125, -15.435791015625, -14.55859375, -13.681396484375, -12.80419921875, -11.927001953125, -11.0498046875, -10.172607421875, -9.29541015625, -8.418212890625, -7.541015625, -6.663818359375, -5.78662109375, -4.909423828125, -4.0322265625, -3.155029296875, -2.27783203125, -1.400634765625, -0.5234375, 0.353759765625, 1.23095703125, 2.108154296875, 2.9853515625, 3.862548828125, 4.73974609375, 5.616943359375, 6.494140625, 7.371337890625, 8.24853515625, 9.125732421875, 10.0029296875, 10.880126953125, 11.75732421875, 12.634521484375, 13.51171875, 14.388916015625, 15.26611328125, 16.143310546875, 17.0205078125, 17.897705078125, 18.77490234375, 19.652099609375, 20.529296875, 21.406494140625, 22.28369140625, 23.160888671875, 24.0380859375, 24.915283203125, 25.79248046875, 26.669677734375, 27.546875]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 6.0, 10.0, 25.0, 33.0, 60.0, 99.0, 115.0, 149.0, 142.0, 133.0, 91.0, 72.0, 38.0, 16.0, 8.0, 3.0, 3.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.52664566040039, -14.085351943969727, -13.644058227539062, -13.202764511108398, -12.761470794677734, -12.32017707824707, -11.878883361816406, -11.437589645385742, -10.996295928955078, -10.555002212524414, -10.11370849609375, -9.672414779663086, -9.231121063232422, -8.789827346801758, -8.348533630371094, -7.9072394371032715, -7.465945243835449, -7.024651527404785, -6.583357810974121, -6.142064094543457, -5.700770378112793, -5.259476661682129, -4.818182468414307, -4.376888751983643, -3.9355950355529785, -3.4943013191223145, -3.0530076026916504, -2.6117136478424072, -2.170419931411743, -1.729126214981079, -1.287832260131836, -0.8465385437011719, -0.4052457809448242, 0.03604799509048462, 0.47734177112579346, 0.9186356067657471, 1.3599293231964111, 1.8012230396270752, 2.2425169944763184, 2.6838107109069824, 3.1251044273376465, 3.5663981437683105, 4.007691860198975, 4.448986053466797, 4.890279769897461, 5.331573486328125, 5.772867202758789, 6.214160919189453, 6.655454635620117, 7.096748352050781, 7.538042068481445, 7.979335784912109, 8.420629501342773, 8.861923217773438, 9.303216934204102, 9.744510650634766, 10.18580436706543, 10.627098083496094, 11.068391799926758, 11.509685516357422, 11.950979232788086, 12.39227294921875, 12.833566665649414, 13.274860382080078, 13.716155052185059]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 4.0, 7.0, 6.0, 15.0, 10.0, 7.0, 22.0, 23.0, 19.0, 22.0, 24.0, 34.0, 23.0, 30.0, 32.0, 33.0, 26.0, 39.0, 35.0, 41.0, 36.0, 36.0, 38.0, 35.0, 31.0, 34.0, 30.0, 36.0, 34.0, 24.0, 29.0, 24.0, 21.0, 27.0, 26.0, 25.0, 9.0, 9.0, 10.0, 12.0, 7.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-22.539243698120117, -21.860074996948242, -21.180908203125, -20.501739501953125, -19.82257080078125, -19.143402099609375, -18.4642333984375, -17.785066604614258, -17.105897903442383, -16.426729202270508, -15.74756145477295, -15.06839370727539, -14.389225006103516, -13.71005630493164, -13.030888557434082, -12.351720809936523, -11.672552108764648, -10.993383407592773, -10.314215660095215, -9.635047912597656, -8.955879211425781, -8.276710510253906, -7.597542762756348, -6.918374538421631, -6.239206314086914, -5.560038089752197, -4.8808698654174805, -4.201701641082764, -3.522533416748047, -2.84336519241333, -2.1641969680786133, -1.4850287437438965, -0.8058586120605469, -0.12669038772583008, 0.5524778366088867, 1.2316460609436035, 1.9108142852783203, 2.589982509613037, 3.269150733947754, 3.9483189582824707, 4.6274871826171875, 5.306655406951904, 5.985823631286621, 6.664991855621338, 7.344160079956055, 8.02332878112793, 8.702496528625488, 9.381664276123047, 10.060832977294922, 10.740001678466797, 11.419169425964355, 12.098337173461914, 12.777505874633789, 13.456674575805664, 14.135842323303223, 14.815010070800781, 15.494178771972656, 16.17334747314453, 16.852516174316406, 17.53168296813965, 18.210851669311523, 18.8900203704834, 19.56918716430664, 20.248355865478516, 20.92752456665039]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [5.0, 1.0, 1.0, 3.0, 4.0, 5.0, 3.0, 3.0, 5.0, 12.0, 12.0, 9.0, 10.0, 14.0, 15.0, 16.0, 22.0, 21.0, 19.0, 28.0, 33.0, 25.0, 38.0, 33.0, 30.0, 45.0, 38.0, 46.0, 30.0, 43.0, 38.0, 50.0, 48.0, 40.0, 35.0, 25.0, 32.0, 29.0, 18.0, 17.0, 17.0, 16.0, 17.0, 13.0, 6.0, 12.0, 7.0, 8.0, 4.0, 2.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.9931640625, -1.9227142333984375, -1.852264404296875, -1.7818145751953125, -1.71136474609375, -1.6409149169921875, -1.570465087890625, -1.5000152587890625, -1.4295654296875, -1.3591156005859375, -1.288665771484375, -1.2182159423828125, -1.14776611328125, -1.0773162841796875, -1.006866455078125, -0.9364166259765625, -0.865966796875, -0.7955169677734375, -0.725067138671875, -0.6546173095703125, -0.58416748046875, -0.5137176513671875, -0.443267822265625, -0.3728179931640625, -0.3023681640625, -0.2319183349609375, -0.161468505859375, -0.0910186767578125, -0.02056884765625, 0.0498809814453125, 0.120330810546875, 0.1907806396484375, 0.26123046875, 0.3316802978515625, 0.402130126953125, 0.4725799560546875, 0.54302978515625, 0.6134796142578125, 0.683929443359375, 0.7543792724609375, 0.8248291015625, 0.8952789306640625, 0.965728759765625, 1.0361785888671875, 1.10662841796875, 1.1770782470703125, 1.247528076171875, 1.3179779052734375, 1.388427734375, 1.4588775634765625, 1.529327392578125, 1.5997772216796875, 1.67022705078125, 1.7406768798828125, 1.811126708984375, 1.8815765380859375, 1.9520263671875, 2.0224761962890625, 2.092926025390625, 2.1633758544921875, 2.23382568359375, 2.3042755126953125, 2.374725341796875, 2.4451751708984375, 2.515625]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 4.0, 8.0, 16.0, 15.0, 14.0, 23.0, 21.0, 37.0, 48.0, 95.0, 152.0, 236.0, 398.0, 991.0, 2955.0, 13246.0, 90253.0, 644746.0, 2020426.0, 1185892.0, 200123.0, 26597.0, 5053.0, 1457.0, 618.0, 296.0, 173.0, 119.0, 89.0, 54.0, 38.0, 18.0, 17.0, 18.0, 7.0, 12.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.40625, -4.271484375, -4.13671875, -4.001953125, -3.8671875, -3.732421875, -3.59765625, -3.462890625, -3.328125, -3.193359375, -3.05859375, -2.923828125, -2.7890625, -2.654296875, -2.51953125, -2.384765625, -2.25, -2.115234375, -1.98046875, -1.845703125, -1.7109375, -1.576171875, -1.44140625, -1.306640625, -1.171875, -1.037109375, -0.90234375, -0.767578125, -0.6328125, -0.498046875, -0.36328125, -0.228515625, -0.09375, 0.041015625, 0.17578125, 0.310546875, 0.4453125, 0.580078125, 0.71484375, 0.849609375, 0.984375, 1.119140625, 1.25390625, 1.388671875, 1.5234375, 1.658203125, 1.79296875, 1.927734375, 2.0625, 2.197265625, 2.33203125, 2.466796875, 2.6015625, 2.736328125, 2.87109375, 3.005859375, 3.140625, 3.275390625, 3.41015625, 3.544921875, 3.6796875, 3.814453125, 3.94921875, 4.083984375, 4.21875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 3.0, 10.0, 13.0, 16.0, 28.0, 54.0, 58.0, 91.0, 162.0, 232.0, 310.0, 431.0, 513.0, 535.0, 490.0, 369.0, 271.0, 171.0, 109.0, 66.0, 61.0, 26.0, 24.0, 15.0, 5.0, 5.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.21875, -5.99774169921875, -5.7767333984375, -5.55572509765625, -5.334716796875, -5.11370849609375, -4.8927001953125, -4.67169189453125, -4.45068359375, -4.22967529296875, -4.0086669921875, -3.78765869140625, -3.566650390625, -3.34564208984375, -3.1246337890625, -2.90362548828125, -2.6826171875, -2.46160888671875, -2.2406005859375, -2.01959228515625, -1.798583984375, -1.57757568359375, -1.3565673828125, -1.13555908203125, -0.91455078125, -0.69354248046875, -0.4725341796875, -0.25152587890625, -0.030517578125, 0.19049072265625, 0.4114990234375, 0.63250732421875, 0.853515625, 1.07452392578125, 1.2955322265625, 1.51654052734375, 1.737548828125, 1.95855712890625, 2.1795654296875, 2.40057373046875, 2.62158203125, 2.84259033203125, 3.0635986328125, 3.28460693359375, 3.505615234375, 3.72662353515625, 3.9476318359375, 4.16864013671875, 4.3896484375, 4.61065673828125, 4.8316650390625, 5.05267333984375, 5.273681640625, 5.49468994140625, 5.7156982421875, 5.93670654296875, 6.15771484375, 6.37872314453125, 6.5997314453125, 6.82073974609375, 7.041748046875, 7.26275634765625, 7.4837646484375, 7.70477294921875, 7.92578125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 6.0, 7.0, 7.0, 9.0, 17.0, 16.0, 30.0, 41.0, 75.0, 72.0, 124.0, 165.0, 284.0, 550.0, 1624.0, 16959.0, 1029131.0, 3072042.0, 68404.0, 2931.0, 776.0, 362.0, 191.0, 128.0, 82.0, 78.0, 55.0, 43.0, 29.0, 17.0, 11.0, 7.0, 4.0, 7.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.21875, -14.7735595703125, -14.328369140625, -13.8831787109375, -13.43798828125, -12.9927978515625, -12.547607421875, -12.1024169921875, -11.6572265625, -11.2120361328125, -10.766845703125, -10.3216552734375, -9.87646484375, -9.4312744140625, -8.986083984375, -8.5408935546875, -8.095703125, -7.6505126953125, -7.205322265625, -6.7601318359375, -6.31494140625, -5.8697509765625, -5.424560546875, -4.9793701171875, -4.5341796875, -4.0889892578125, -3.643798828125, -3.1986083984375, -2.75341796875, -2.3082275390625, -1.863037109375, -1.4178466796875, -0.97265625, -0.5274658203125, -0.082275390625, 0.3629150390625, 0.80810546875, 1.2532958984375, 1.698486328125, 2.1436767578125, 2.5888671875, 3.0340576171875, 3.479248046875, 3.9244384765625, 4.36962890625, 4.8148193359375, 5.260009765625, 5.7052001953125, 6.150390625, 6.5955810546875, 7.040771484375, 7.4859619140625, 7.93115234375, 8.3763427734375, 8.821533203125, 9.2667236328125, 9.7119140625, 10.1571044921875, 10.602294921875, 11.0474853515625, 11.49267578125, 11.9378662109375, 12.383056640625, 12.8282470703125, 13.2734375]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 17.0, 26.0, 71.0, 124.0, 202.0, 229.0, 168.0, 88.0, 57.0, 21.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.436946868896484, -42.96480178833008, -41.49265670776367, -40.0205078125, -38.548362731933594, -37.07621765136719, -35.60407257080078, -34.131927490234375, -32.65978240966797, -31.187637329101562, -29.715490341186523, -28.243345260620117, -26.77120018005371, -25.299053192138672, -23.826908111572266, -22.35476303100586, -20.88261604309082, -19.410470962524414, -17.938323974609375, -16.46617889404297, -14.994033813476562, -13.52188777923584, -12.049741744995117, -10.577596664428711, -9.105450630187988, -7.633305072784424, -6.161159515380859, -4.689013481140137, -3.2168679237365723, -1.7447223663330078, -0.27257633209228516, 1.199568748474121, 2.6717147827148438, 4.143860340118408, 5.616005897521973, 7.088151931762695, 8.560297012329102, 10.032443046569824, 11.504589080810547, 12.976734161376953, 14.448880195617676, 15.921026229858398, 17.393171310424805, 18.865318298339844, 20.33746337890625, 21.809608459472656, 23.281753540039062, 24.75389862060547, 26.226045608520508, 27.698190689086914, 29.170337677001953, 30.64248275756836, 32.114627838134766, 33.58677291870117, 35.058921813964844, 36.53106689453125, 38.003211975097656, 39.47535705566406, 40.94750213623047, 42.419647216796875, 43.89179611206055, 45.36394119262695, 46.83608627319336, 48.308231353759766, 49.78037643432617]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 6.0, 0.0, 0.0, 4.0, 3.0, 3.0, 0.0, 7.0, 8.0, 5.0, 11.0, 14.0, 15.0, 12.0, 16.0, 20.0, 24.0, 29.0, 25.0, 31.0, 34.0, 44.0, 38.0, 32.0, 24.0, 33.0, 38.0, 33.0, 42.0, 45.0, 39.0, 25.0, 43.0, 35.0, 30.0, 32.0, 23.0, 32.0, 19.0, 14.0, 12.0, 15.0, 17.0, 14.0, 17.0, 12.0, 10.0, 5.0, 7.0, 6.0, 1.0, 3.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-16.432432174682617, -15.915843963623047, -15.399256706237793, -14.882668495178223, -14.366081237792969, -13.849493026733398, -13.332904815673828, -12.816316604614258, -12.299729347229004, -11.783141136169434, -11.26655387878418, -10.74996566772461, -10.233377456665039, -9.716790199279785, -9.200201988220215, -8.683614730834961, -8.16702651977539, -7.6504387855529785, -7.133851051330566, -6.617262840270996, -6.100675106048584, -5.584087371826172, -5.067499160766602, -4.5509114265441895, -4.034323692321777, -3.5177359580993652, -3.001147985458374, -2.484560012817383, -1.9679722785949707, -1.4513845443725586, -0.9347965717315674, -0.41820859909057617, 0.09837722778320312, 0.6149650812149048, 1.1315529346466064, 1.648140788078308, 2.1647286415100098, 2.681316375732422, 3.197904348373413, 3.7144923210144043, 4.231080055236816, 4.7476677894592285, 5.264255523681641, 5.780843734741211, 6.297431468963623, 6.814019203186035, 7.3306074142456055, 7.847195148468018, 8.36378288269043, 8.88037109375, 9.396958351135254, 9.913546562194824, 10.430133819580078, 10.946722030639648, 11.463310241699219, 11.979898452758789, 12.496485710144043, 13.013073921203613, 13.529661178588867, 14.046249389648438, 14.562837600708008, 15.079424858093262, 15.596013069152832, 16.112600326538086, 16.629188537597656]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 0.0, 3.0, 4.0, 4.0, 6.0, 8.0, 8.0, 8.0, 14.0, 13.0, 17.0, 11.0, 21.0, 11.0, 19.0, 21.0, 24.0, 23.0, 29.0, 38.0, 31.0, 40.0, 51.0, 42.0, 49.0, 41.0, 33.0, 44.0, 33.0, 46.0, 50.0, 25.0, 29.0, 32.0, 22.0, 22.0, 26.0, 16.0, 17.0, 15.0, 14.0, 10.0, 5.0, 8.0, 9.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.0234375, -1.95208740234375, -1.8807373046875, -1.80938720703125, -1.738037109375, -1.66668701171875, -1.5953369140625, -1.52398681640625, -1.45263671875, -1.38128662109375, -1.3099365234375, -1.23858642578125, -1.167236328125, -1.09588623046875, -1.0245361328125, -0.95318603515625, -0.8818359375, -0.81048583984375, -0.7391357421875, -0.66778564453125, -0.596435546875, -0.52508544921875, -0.4537353515625, -0.38238525390625, -0.31103515625, -0.23968505859375, -0.1683349609375, -0.09698486328125, -0.025634765625, 0.04571533203125, 0.1170654296875, 0.18841552734375, 0.259765625, 0.33111572265625, 0.4024658203125, 0.47381591796875, 0.545166015625, 0.61651611328125, 0.6878662109375, 0.75921630859375, 0.83056640625, 0.90191650390625, 0.9732666015625, 1.04461669921875, 1.115966796875, 1.18731689453125, 1.2586669921875, 1.33001708984375, 1.4013671875, 1.47271728515625, 1.5440673828125, 1.61541748046875, 1.686767578125, 1.75811767578125, 1.8294677734375, 1.90081787109375, 1.97216796875, 2.04351806640625, 2.1148681640625, 2.18621826171875, 2.257568359375, 2.32891845703125, 2.4002685546875, 2.47161865234375, 2.54296875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 7.0, 6.0, 23.0, 30.0, 54.0, 62.0, 77.0, 136.0, 201.0, 294.0, 395.0, 549.0, 863.0, 1257.0, 1806.0, 2674.0, 3805.0, 5484.0, 8146.0, 11627.0, 17505.0, 26208.0, 40953.0, 68879.0, 124148.0, 260479.0, 206517.0, 101634.0, 57913.0, 35290.0, 22923.0, 15102.0, 10488.0, 7073.0, 4935.0, 3467.0, 2332.0, 1625.0, 1204.0, 747.0, 521.0, 325.0, 257.0, 194.0, 126.0, 72.0, 55.0, 37.0, 25.0, 12.0, 8.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.391845703125, -0.37953948974609375, -0.3672332763671875, -0.35492706298828125, -0.342620849609375, -0.33031463623046875, -0.3180084228515625, -0.30570220947265625, -0.29339599609375, -0.28108978271484375, -0.2687835693359375, -0.25647735595703125, -0.244171142578125, -0.23186492919921875, -0.2195587158203125, -0.20725250244140625, -0.1949462890625, -0.18264007568359375, -0.1703338623046875, -0.15802764892578125, -0.145721435546875, -0.13341522216796875, -0.1211090087890625, -0.10880279541015625, -0.09649658203125, -0.08419036865234375, -0.0718841552734375, -0.05957794189453125, -0.047271728515625, -0.03496551513671875, -0.0226593017578125, -0.01035308837890625, 0.001953125, 0.01425933837890625, 0.0265655517578125, 0.03887176513671875, 0.051177978515625, 0.06348419189453125, 0.0757904052734375, 0.08809661865234375, 0.10040283203125, 0.11270904541015625, 0.1250152587890625, 0.13732147216796875, 0.149627685546875, 0.16193389892578125, 0.1742401123046875, 0.18654632568359375, 0.1988525390625, 0.21115875244140625, 0.2234649658203125, 0.23577117919921875, 0.248077392578125, 0.26038360595703125, 0.2726898193359375, 0.28499603271484375, 0.29730224609375, 0.30960845947265625, 0.3219146728515625, 0.33422088623046875, 0.346527099609375, 0.35883331298828125, 0.3711395263671875, 0.38344573974609375, 0.395751953125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 0.0, 3.0, 3.0, 3.0, 2.0, 4.0, 5.0, 5.0, 2.0, 4.0, 18.0, 12.0, 15.0, 11.0, 20.0, 23.0, 22.0, 20.0, 27.0, 17.0, 30.0, 41.0, 34.0, 27.0, 28.0, 43.0, 38.0, 40.0, 1063.0, 42.0, 48.0, 27.0, 33.0, 29.0, 27.0, 30.0, 24.0, 33.0, 31.0, 18.0, 15.0, 17.0, 14.0, 11.0, 16.0, 12.0, 13.0, 10.0, 5.0, 5.0, 1.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0], "bins": [-1.40234375, -1.3595123291015625, -1.316680908203125, -1.2738494873046875, -1.23101806640625, -1.1881866455078125, -1.145355224609375, -1.1025238037109375, -1.0596923828125, -1.0168609619140625, -0.974029541015625, -0.9311981201171875, -0.88836669921875, -0.8455352783203125, -0.802703857421875, -0.7598724365234375, -0.717041015625, -0.6742095947265625, -0.631378173828125, -0.5885467529296875, -0.54571533203125, -0.5028839111328125, -0.460052490234375, -0.4172210693359375, -0.3743896484375, -0.3315582275390625, -0.288726806640625, -0.2458953857421875, -0.20306396484375, -0.1602325439453125, -0.117401123046875, -0.0745697021484375, -0.03173828125, 0.0110931396484375, 0.053924560546875, 0.0967559814453125, 0.13958740234375, 0.1824188232421875, 0.225250244140625, 0.2680816650390625, 0.3109130859375, 0.3537445068359375, 0.396575927734375, 0.4394073486328125, 0.48223876953125, 0.5250701904296875, 0.567901611328125, 0.6107330322265625, 0.653564453125, 0.6963958740234375, 0.739227294921875, 0.7820587158203125, 0.82489013671875, 0.8677215576171875, 0.910552978515625, 0.9533843994140625, 0.9962158203125, 1.0390472412109375, 1.081878662109375, 1.1247100830078125, 1.16754150390625, 1.2103729248046875, 1.253204345703125, 1.2960357666015625, 1.3388671875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 7.0, 1.0, 6.0, 7.0, 12.0, 15.0, 29.0, 38.0, 58.0, 78.0, 114.0, 180.0, 223.0, 338.0, 537.0, 650.0, 1030.0, 1518.0, 2065.0, 3145.0, 4553.0, 6539.0, 9904.0, 14499.0, 22395.0, 35776.0, 57815.0, 100816.0, 205360.0, 1316894.0, 123325.0, 68614.0, 41938.0, 26310.0, 16901.0, 11258.0, 7738.0, 5136.0, 3486.0, 2381.0, 1664.0, 1194.0, 796.0, 509.0, 439.0, 272.0, 199.0, 122.0, 104.0, 57.0, 30.0, 22.0, 21.0, 13.0, 6.0, 2.0, 8.0, 1.0, 1.0, 1.0], "bins": [-0.40380859375, -0.391632080078125, -0.37945556640625, -0.367279052734375, -0.3551025390625, -0.342926025390625, -0.33074951171875, -0.318572998046875, -0.306396484375, -0.294219970703125, -0.28204345703125, -0.269866943359375, -0.2576904296875, -0.245513916015625, -0.23333740234375, -0.221160888671875, -0.208984375, -0.196807861328125, -0.18463134765625, -0.172454833984375, -0.1602783203125, -0.148101806640625, -0.13592529296875, -0.123748779296875, -0.111572265625, -0.099395751953125, -0.08721923828125, -0.075042724609375, -0.0628662109375, -0.050689697265625, -0.03851318359375, -0.026336669921875, -0.01416015625, -0.001983642578125, 0.01019287109375, 0.022369384765625, 0.0345458984375, 0.046722412109375, 0.05889892578125, 0.071075439453125, 0.083251953125, 0.095428466796875, 0.10760498046875, 0.119781494140625, 0.1319580078125, 0.144134521484375, 0.15631103515625, 0.168487548828125, 0.1806640625, 0.192840576171875, 0.20501708984375, 0.217193603515625, 0.2293701171875, 0.241546630859375, 0.25372314453125, 0.265899658203125, 0.278076171875, 0.290252685546875, 0.30242919921875, 0.314605712890625, 0.3267822265625, 0.338958740234375, 0.35113525390625, 0.363311767578125, 0.37548828125]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 4.0, 7.0, 7.0, 14.0, 13.0, 18.0, 26.0, 26.0, 34.0, 35.0, 58.0, 57.0, 65.0, 76.0, 74.0, 79.0, 64.0, 61.0, 51.0, 36.0, 36.0, 34.0, 23.0, 19.0, 22.0, 11.0, 11.0, 11.0, 8.0, 7.0, 4.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00031113624572753906, -0.00030126050114631653, -0.000291384756565094, -0.00028150901198387146, -0.0002716332674026489, -0.0002617575228214264, -0.00025188177824020386, -0.00024200603365898132, -0.0002321302890777588, -0.00022225454449653625, -0.00021237879991531372, -0.0002025030553340912, -0.00019262731075286865, -0.00018275156617164612, -0.00017287582159042358, -0.00016300007700920105, -0.00015312433242797852, -0.00014324858784675598, -0.00013337284326553345, -0.0001234970986843109, -0.00011362135410308838, -0.00010374560952186584, -9.386986494064331e-05, -8.399412035942078e-05, -7.411837577819824e-05, -6.424263119697571e-05, -5.4366886615753174e-05, -4.449114203453064e-05, -3.4615397453308105e-05, -2.473965287208557e-05, -1.4863908290863037e-05, -4.988163709640503e-06, 4.887580871582031e-06, 1.4763325452804565e-05, 2.46390700340271e-05, 3.4514814615249634e-05, 4.439055919647217e-05, 5.42663037776947e-05, 6.414204835891724e-05, 7.401779294013977e-05, 8.38935375213623e-05, 9.376928210258484e-05, 0.00010364502668380737, 0.00011352077126502991, 0.00012339651584625244, 0.00013327226042747498, 0.0001431480050086975, 0.00015302374958992004, 0.00016289949417114258, 0.0001727752387523651, 0.00018265098333358765, 0.00019252672791481018, 0.00020240247249603271, 0.00021227821707725525, 0.00022215396165847778, 0.00023202970623970032, 0.00024190545082092285, 0.0002517811954021454, 0.0002616569399833679, 0.00027153268456459045, 0.000281408429145813, 0.0002912841737270355, 0.00030115991830825806, 0.0003110356628894806, 0.0003209114074707031]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 4.0, 5.0, 9.0, 13.0, 12.0, 16.0, 39.0, 27.0, 65.0, 57.0, 87.0, 125.0, 213.0, 452.0, 1031.0, 49079.0, 993322.0, 2454.0, 617.0, 338.0, 212.0, 127.0, 71.0, 50.0, 35.0, 27.0, 14.0, 13.0, 13.0, 5.0, 6.0, 5.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.006374359130859375, -0.0061827898025512695, -0.005991220474243164, -0.005799651145935059, -0.005608081817626953, -0.005416512489318848, -0.005224943161010742, -0.005033373832702637, -0.004841804504394531, -0.004650235176086426, -0.00445866584777832, -0.004267096519470215, -0.004075527191162109, -0.003883957862854004, -0.0036923885345458984, -0.003500819206237793, -0.0033092498779296875, -0.003117680549621582, -0.0029261112213134766, -0.002734541893005371, -0.0025429725646972656, -0.00235140323638916, -0.0021598339080810547, -0.0019682645797729492, -0.0017766952514648438, -0.0015851259231567383, -0.0013935565948486328, -0.0012019872665405273, -0.0010104179382324219, -0.0008188486099243164, -0.0006272792816162109, -0.00043570995330810547, -0.000244140625, -5.257129669189453e-05, 0.00013899803161621094, 0.0003305673599243164, 0.0005221366882324219, 0.0007137060165405273, 0.0009052753448486328, 0.0010968446731567383, 0.0012884140014648438, 0.0014799833297729492, 0.0016715526580810547, 0.0018631219863891602, 0.0020546913146972656, 0.002246260643005371, 0.0024378299713134766, 0.002629399299621582, 0.0028209686279296875, 0.003012537956237793, 0.0032041072845458984, 0.003395676612854004, 0.0035872459411621094, 0.003778815269470215, 0.00397038459777832, 0.004161953926086426, 0.004353523254394531, 0.004545092582702637, 0.004736661911010742, 0.004928231239318848, 0.005119800567626953, 0.005311369895935059, 0.005502939224243164, 0.0056945085525512695, 0.005886077880859375]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 31.0, 171.0, 409.0, 312.0, 78.0, 8.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.001052223495207727, -0.001031066058203578, -0.0010099085047841072, -0.0009887510677799582, -0.0009675935725681484, -0.0009464360773563385, -0.0009252786403521895, -0.0009041211451403797, -0.0008829636499285698, -0.0008618061547167599, -0.000840648717712611, -0.0008194912225008011, -0.0007983337272889912, -0.0007771762320771813, -0.0007560187950730324, -0.0007348612998612225, -0.0007137038628570735, -0.0006925463676452637, -0.0006713889306411147, -0.0006502314354293048, -0.000629073940217495, -0.000607916503213346, -0.0005867590080015361, -0.0005656015127897263, -0.0005444440757855773, -0.0005232865805737674, -0.0005021291435696185, -0.0004809716483578086, -0.0004598141531459987, -0.0004386566870380193, -0.0004174992209300399, -0.00039634172571823, -0.00037518423050642014, -0.0003540267643984407, -0.00033286926918663085, -0.00031171180307865143, -0.00029055430786684155, -0.00026939684175886214, -0.0002482393756508827, -0.00022708189499098808, -0.00020592441433109343, -0.00018476693367119879, -0.00016360945301130414, -0.00014245198690332472, -0.00012129450624343008, -0.00010013702558353543, -7.897955947555602e-05, -5.782207881566137e-05, -3.6664598155766726e-05, -1.5507121133850887e-05, 5.650355888064951e-06, 2.6807829272001982e-05, 4.796530993189663e-05, 6.912279059179127e-05, 9.028025669977069e-05, 0.00011143773735966533, 0.00013259521801955998, 0.00015375269867945462, 0.00017491017933934927, 0.0001960676454473287, 0.00021722512610722333, 0.00023838260676711798, 0.0002595400728750974, 0.0002806975389830768, 0.0003018550341948867]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 9.0, 9.0, 13.0, 8.0, 11.0, 14.0, 16.0, 18.0, 24.0, 29.0, 19.0, 20.0, 35.0, 30.0, 48.0, 34.0, 42.0, 37.0, 54.0, 41.0, 46.0, 42.0, 46.0, 34.0, 46.0, 32.0, 41.0, 25.0, 20.0, 26.0, 11.0, 20.0, 20.0, 15.0, 17.0, 11.0, 6.0, 10.0, 8.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001252293586730957, -0.00012072548270225525, -0.0001162216067314148, -0.00011171773076057434, -0.00010721385478973389, -0.00010270997881889343, -9.820610284805298e-05, -9.370222687721252e-05, -8.919835090637207e-05, -8.469447493553162e-05, -8.019059896469116e-05, -7.568672299385071e-05, -7.118284702301025e-05, -6.66789710521698e-05, -6.217509508132935e-05, -5.767121911048889e-05, -5.316734313964844e-05, -4.8663467168807983e-05, -4.415959119796753e-05, -3.9655715227127075e-05, -3.515183925628662e-05, -3.064796328544617e-05, -2.6144087314605713e-05, -2.164021134376526e-05, -1.7136335372924805e-05, -1.263245940208435e-05, -8.128583431243896e-06, -3.6247074604034424e-06, 8.791685104370117e-07, 5.383044481277466e-06, 9.88692045211792e-06, 1.4390796422958374e-05, 1.8894672393798828e-05, 2.3398548364639282e-05, 2.7902424335479736e-05, 3.240630030632019e-05, 3.6910176277160645e-05, 4.14140522480011e-05, 4.591792821884155e-05, 5.042180418968201e-05, 5.492568016052246e-05, 5.9429556131362915e-05, 6.393343210220337e-05, 6.843730807304382e-05, 7.294118404388428e-05, 7.744506001472473e-05, 8.194893598556519e-05, 8.645281195640564e-05, 9.09566879272461e-05, 9.546056389808655e-05, 9.9964439868927e-05, 0.00010446831583976746, 0.00010897219181060791, 0.00011347606778144836, 0.00011797994375228882, 0.00012248381972312927, 0.00012698769569396973, 0.00013149157166481018, 0.00013599544763565063, 0.0001404993236064911, 0.00014500319957733154, 0.000149507075548172, 0.00015401095151901245, 0.0001585148274898529, 0.00016301870346069336]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 0.0, 3.0, 4.0, 4.0, 6.0, 8.0, 8.0, 8.0, 14.0, 13.0, 17.0, 11.0, 21.0, 11.0, 18.0, 22.0, 24.0, 23.0, 29.0, 38.0, 31.0, 40.0, 51.0, 42.0, 49.0, 41.0, 33.0, 44.0, 33.0, 46.0, 50.0, 25.0, 29.0, 32.0, 22.0, 22.0, 26.0, 16.0, 17.0, 15.0, 14.0, 10.0, 5.0, 8.0, 9.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.0234375, -1.95208740234375, -1.8807373046875, -1.80938720703125, -1.738037109375, -1.66668701171875, -1.5953369140625, -1.52398681640625, -1.45263671875, -1.38128662109375, -1.3099365234375, -1.23858642578125, -1.167236328125, -1.09588623046875, -1.0245361328125, -0.95318603515625, -0.8818359375, -0.81048583984375, -0.7391357421875, -0.66778564453125, -0.596435546875, -0.52508544921875, -0.4537353515625, -0.38238525390625, -0.31103515625, -0.23968505859375, -0.1683349609375, -0.09698486328125, -0.025634765625, 0.04571533203125, 0.1170654296875, 0.18841552734375, 0.259765625, 0.33111572265625, 0.4024658203125, 0.47381591796875, 0.545166015625, 0.61651611328125, 0.6878662109375, 0.75921630859375, 0.83056640625, 0.90191650390625, 0.9732666015625, 1.04461669921875, 1.115966796875, 1.18731689453125, 1.2586669921875, 1.33001708984375, 1.4013671875, 1.47271728515625, 1.5440673828125, 1.61541748046875, 1.686767578125, 1.75811767578125, 1.8294677734375, 1.90081787109375, 1.97216796875, 2.04351806640625, 2.1148681640625, 2.18621826171875, 2.257568359375, 2.32891845703125, 2.4002685546875, 2.47161865234375, 2.54296875]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 4.0, 8.0, 12.0, 29.0, 28.0, 46.0, 83.0, 109.0, 165.0, 272.0, 375.0, 746.0, 1437.0, 3049.0, 6783.0, 15015.0, 32352.0, 68894.0, 148818.0, 275635.0, 254427.0, 128304.0, 59757.0, 27843.0, 12853.0, 5893.0, 2642.0, 1285.0, 675.0, 381.0, 212.0, 150.0, 82.0, 59.0, 49.0, 25.0, 19.0, 18.0, 8.0, 9.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.16015625, -2.087921142578125, -2.01568603515625, -1.943450927734375, -1.8712158203125, -1.798980712890625, -1.72674560546875, -1.654510498046875, -1.582275390625, -1.510040283203125, -1.43780517578125, -1.365570068359375, -1.2933349609375, -1.221099853515625, -1.14886474609375, -1.076629638671875, -1.00439453125, -0.932159423828125, -0.85992431640625, -0.787689208984375, -0.7154541015625, -0.643218994140625, -0.57098388671875, -0.498748779296875, -0.426513671875, -0.354278564453125, -0.28204345703125, -0.209808349609375, -0.1375732421875, -0.065338134765625, 0.00689697265625, 0.079132080078125, 0.1513671875, 0.223602294921875, 0.29583740234375, 0.368072509765625, 0.4403076171875, 0.512542724609375, 0.58477783203125, 0.657012939453125, 0.729248046875, 0.801483154296875, 0.87371826171875, 0.945953369140625, 1.0181884765625, 1.090423583984375, 1.16265869140625, 1.234893798828125, 1.30712890625, 1.379364013671875, 1.45159912109375, 1.523834228515625, 1.5960693359375, 1.668304443359375, 1.74053955078125, 1.812774658203125, 1.885009765625, 1.957244873046875, 2.02947998046875, 2.101715087890625, 2.1739501953125, 2.246185302734375, 2.31842041015625, 2.390655517578125, 2.462890625]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 2.0, 8.0, 6.0, 14.0, 11.0, 11.0, 12.0, 16.0, 30.0, 31.0, 38.0, 45.0, 57.0, 68.0, 85.0, 141.0, 411.0, 1477.0, 168.0, 81.0, 57.0, 64.0, 43.0, 44.0, 33.0, 27.0, 24.0, 10.0, 9.0, 6.0, 5.0, 6.0, 2.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-15.359375, -14.9559326171875, -14.552490234375, -14.1490478515625, -13.74560546875, -13.3421630859375, -12.938720703125, -12.5352783203125, -12.1318359375, -11.7283935546875, -11.324951171875, -10.9215087890625, -10.51806640625, -10.1146240234375, -9.711181640625, -9.3077392578125, -8.904296875, -8.5008544921875, -8.097412109375, -7.6939697265625, -7.29052734375, -6.8870849609375, -6.483642578125, -6.0802001953125, -5.6767578125, -5.2733154296875, -4.869873046875, -4.4664306640625, -4.06298828125, -3.6595458984375, -3.256103515625, -2.8526611328125, -2.44921875, -2.0457763671875, -1.642333984375, -1.2388916015625, -0.83544921875, -0.4320068359375, -0.028564453125, 0.3748779296875, 0.7783203125, 1.1817626953125, 1.585205078125, 1.9886474609375, 2.39208984375, 2.7955322265625, 3.198974609375, 3.6024169921875, 4.005859375, 4.4093017578125, 4.812744140625, 5.2161865234375, 5.61962890625, 6.0230712890625, 6.426513671875, 6.8299560546875, 7.2333984375, 7.6368408203125, 8.040283203125, 8.4437255859375, 8.84716796875, 9.2506103515625, 9.654052734375, 10.0574951171875, 10.4609375]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 3.0, 5.0, 5.0, 11.0, 8.0, 12.0, 18.0, 20.0, 29.0, 26.0, 61.0, 77.0, 118.0, 189.0, 336.0, 622.0, 3461.0, 2998112.0, 140093.0, 1213.0, 485.0, 263.0, 147.0, 97.0, 68.0, 52.0, 45.0, 30.0, 27.0, 15.0, 18.0, 17.0, 5.0, 5.0, 6.0, 3.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.390625, -26.328857421875, -25.26708984375, -24.205322265625, -23.1435546875, -22.081787109375, -21.02001953125, -19.958251953125, -18.896484375, -17.834716796875, -16.77294921875, -15.711181640625, -14.6494140625, -13.587646484375, -12.52587890625, -11.464111328125, -10.40234375, -9.340576171875, -8.27880859375, -7.217041015625, -6.1552734375, -5.093505859375, -4.03173828125, -2.969970703125, -1.908203125, -0.846435546875, 0.21533203125, 1.277099609375, 2.3388671875, 3.400634765625, 4.46240234375, 5.524169921875, 6.5859375, 7.647705078125, 8.70947265625, 9.771240234375, 10.8330078125, 11.894775390625, 12.95654296875, 14.018310546875, 15.080078125, 16.141845703125, 17.20361328125, 18.265380859375, 19.3271484375, 20.388916015625, 21.45068359375, 22.512451171875, 23.57421875, 24.635986328125, 25.69775390625, 26.759521484375, 27.8212890625, 28.883056640625, 29.94482421875, 31.006591796875, 32.068359375, 33.130126953125, 34.19189453125, 35.253662109375, 36.3154296875, 37.377197265625, 38.43896484375, 39.500732421875, 40.5625]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 10.0, 38.0, 109.0, 222.0, 303.0, 203.0, 93.0, 28.0, 10.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.79438591003418, -28.78071403503418, -27.76704216003418, -26.75337028503418, -25.73969841003418, -24.72602653503418, -23.712352752685547, -22.698680877685547, -21.685009002685547, -20.671337127685547, -19.657665252685547, -18.643993377685547, -17.630321502685547, -16.616649627685547, -15.60297679901123, -14.58930492401123, -13.575634002685547, -12.561962127685547, -11.548290252685547, -10.534618377685547, -9.520946502685547, -8.507274627685547, -7.4936017990112305, -6.4799299240112305, -5.4662580490112305, -4.4525861740112305, -3.4389140605926514, -2.4252419471740723, -1.4115700721740723, -0.39789819717407227, 0.6157741546630859, 1.629446029663086, 2.643115997314453, 3.656787872314453, 4.670459747314453, 5.684132099151611, 6.697803974151611, 7.711475849151611, 8.72514820098877, 9.73882007598877, 10.75249195098877, 11.76616382598877, 12.77983570098877, 13.793508529663086, 14.807180404663086, 15.820852279663086, 16.834524154663086, 17.848196029663086, 18.861867904663086, 19.875539779663086, 20.889211654663086, 21.902883529663086, 22.916555404663086, 23.930227279663086, 24.94390106201172, 25.95757293701172, 26.97124481201172, 27.98491668701172, 28.99858856201172, 30.01226043701172, 31.02593231201172, 32.03960418701172, 33.05327606201172, 34.06694793701172, 35.08061981201172]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 5.0, 5.0, 6.0, 5.0, 9.0, 11.0, 17.0, 18.0, 19.0, 20.0, 15.0, 26.0, 24.0, 23.0, 33.0, 35.0, 32.0, 37.0, 41.0, 38.0, 36.0, 36.0, 49.0, 51.0, 42.0, 35.0, 35.0, 32.0, 29.0, 23.0, 28.0, 24.0, 26.0, 26.0, 20.0, 19.0, 18.0, 14.0, 7.0, 5.0, 9.0, 3.0, 4.0, 4.0, 3.0, 6.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.522613525390625, -18.866973876953125, -18.211334228515625, -17.555696487426758, -16.900056838989258, -16.244417190551758, -15.588777542114258, -14.933137893676758, -14.277499198913574, -13.621859550476074, -12.96622085571289, -12.31058120727539, -11.65494155883789, -10.999302864074707, -10.343663215637207, -9.688024520874023, -9.032384872436523, -8.376745223999023, -7.72110652923584, -7.06546688079834, -6.409827709197998, -5.754188537597656, -5.098548889160156, -4.4429097175598145, -3.7872705459594727, -3.131631374359131, -2.47599196434021, -1.8203526735305786, -1.1647133827209473, -0.5090742111206055, 0.14656519889831543, 0.8022046089172363, 1.4578437805175781, 2.11348295211792, 2.769122362136841, 3.4247617721557617, 4.0804009437561035, 4.736040115356445, 5.391679763793945, 6.047318935394287, 6.702958106994629, 7.358597278594971, 8.014236450195312, 8.669876098632812, 9.325515747070312, 9.981154441833496, 10.636794090270996, 11.29243278503418, 11.94807243347168, 12.60371208190918, 13.259350776672363, 13.914990425109863, 14.570629119873047, 15.226268768310547, 15.881908416748047, 16.537548065185547, 17.193187713623047, 17.848827362060547, 18.504467010498047, 19.160104751586914, 19.815744400024414, 20.471384048461914, 21.127023696899414, 21.782663345336914, 22.43830108642578]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 1.0, 6.0, 4.0, 7.0, 5.0, 4.0, 12.0, 11.0, 6.0, 18.0, 16.0, 22.0, 12.0, 25.0, 20.0, 19.0, 27.0, 33.0, 33.0, 32.0, 43.0, 42.0, 26.0, 40.0, 49.0, 41.0, 49.0, 44.0, 32.0, 30.0, 22.0, 38.0, 39.0, 28.0, 26.0, 18.0, 13.0, 14.0, 16.0, 13.0, 9.0, 10.0, 12.0, 6.0, 10.0, 6.0, 1.0, 4.0, 2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0], "bins": [-2.412109375, -2.335784912109375, -2.25946044921875, -2.183135986328125, -2.1068115234375, -2.030487060546875, -1.95416259765625, -1.877838134765625, -1.801513671875, -1.725189208984375, -1.64886474609375, -1.572540283203125, -1.4962158203125, -1.419891357421875, -1.34356689453125, -1.267242431640625, -1.19091796875, -1.114593505859375, -1.03826904296875, -0.961944580078125, -0.8856201171875, -0.809295654296875, -0.73297119140625, -0.656646728515625, -0.580322265625, -0.503997802734375, -0.42767333984375, -0.351348876953125, -0.2750244140625, -0.198699951171875, -0.12237548828125, -0.046051025390625, 0.0302734375, 0.106597900390625, 0.18292236328125, 0.259246826171875, 0.3355712890625, 0.411895751953125, 0.48822021484375, 0.564544677734375, 0.640869140625, 0.717193603515625, 0.79351806640625, 0.869842529296875, 0.9461669921875, 1.022491455078125, 1.09881591796875, 1.175140380859375, 1.25146484375, 1.327789306640625, 1.40411376953125, 1.480438232421875, 1.5567626953125, 1.633087158203125, 1.70941162109375, 1.785736083984375, 1.862060546875, 1.938385009765625, 2.01470947265625, 2.091033935546875, 2.1673583984375, 2.243682861328125, 2.32000732421875, 2.396331787109375, 2.47265625]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 6.0, 7.0, 3.0, 5.0, 8.0, 12.0, 15.0, 9.0, 14.0, 20.0, 22.0, 20.0, 28.0, 25.0, 34.0, 60.0, 73.0, 144.0, 282.0, 643.0, 2787.0, 46087.0, 1621350.0, 2416521.0, 99917.0, 4383.0, 869.0, 357.0, 170.0, 98.0, 69.0, 50.0, 34.0, 21.0, 26.0, 11.0, 14.0, 9.0, 17.0, 7.0, 11.0, 11.0, 9.0, 6.0, 4.0, 3.0, 5.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-8.7109375, -8.4395751953125, -8.168212890625, -7.8968505859375, -7.62548828125, -7.3541259765625, -7.082763671875, -6.8114013671875, -6.5400390625, -6.2686767578125, -5.997314453125, -5.7259521484375, -5.45458984375, -5.1832275390625, -4.911865234375, -4.6405029296875, -4.369140625, -4.0977783203125, -3.826416015625, -3.5550537109375, -3.28369140625, -3.0123291015625, -2.740966796875, -2.4696044921875, -2.1982421875, -1.9268798828125, -1.655517578125, -1.3841552734375, -1.11279296875, -0.8414306640625, -0.570068359375, -0.2987060546875, -0.02734375, 0.2440185546875, 0.515380859375, 0.7867431640625, 1.05810546875, 1.3294677734375, 1.600830078125, 1.8721923828125, 2.1435546875, 2.4149169921875, 2.686279296875, 2.9576416015625, 3.22900390625, 3.5003662109375, 3.771728515625, 4.0430908203125, 4.314453125, 4.5858154296875, 4.857177734375, 5.1285400390625, 5.39990234375, 5.6712646484375, 5.942626953125, 6.2139892578125, 6.4853515625, 6.7567138671875, 7.028076171875, 7.2994384765625, 7.57080078125, 7.8421630859375, 8.113525390625, 8.3848876953125, 8.65625]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 5.0, 6.0, 7.0, 11.0, 15.0, 22.0, 30.0, 52.0, 67.0, 92.0, 126.0, 164.0, 234.0, 306.0, 385.0, 401.0, 478.0, 389.0, 350.0, 265.0, 189.0, 125.0, 90.0, 80.0, 55.0, 40.0, 24.0, 21.0, 10.0, 14.0, 5.0, 5.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-7.17578125, -6.9925537109375, -6.809326171875, -6.6260986328125, -6.44287109375, -6.2596435546875, -6.076416015625, -5.8931884765625, -5.7099609375, -5.5267333984375, -5.343505859375, -5.1602783203125, -4.97705078125, -4.7938232421875, -4.610595703125, -4.4273681640625, -4.244140625, -4.0609130859375, -3.877685546875, -3.6944580078125, -3.51123046875, -3.3280029296875, -3.144775390625, -2.9615478515625, -2.7783203125, -2.5950927734375, -2.411865234375, -2.2286376953125, -2.04541015625, -1.8621826171875, -1.678955078125, -1.4957275390625, -1.3125, -1.1292724609375, -0.946044921875, -0.7628173828125, -0.57958984375, -0.3963623046875, -0.213134765625, -0.0299072265625, 0.1533203125, 0.3365478515625, 0.519775390625, 0.7030029296875, 0.88623046875, 1.0694580078125, 1.252685546875, 1.4359130859375, 1.619140625, 1.8023681640625, 1.985595703125, 2.1688232421875, 2.35205078125, 2.5352783203125, 2.718505859375, 2.9017333984375, 3.0849609375, 3.2681884765625, 3.451416015625, 3.6346435546875, 3.81787109375, 4.0010986328125, 4.184326171875, 4.3675537109375, 4.55078125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 2.0, 8.0, 3.0, 10.0, 14.0, 10.0, 22.0, 28.0, 47.0, 41.0, 68.0, 90.0, 106.0, 147.0, 203.0, 303.0, 574.0, 2231.0, 40027.0, 2164632.0, 1947216.0, 34738.0, 2103.0, 578.0, 307.0, 219.0, 153.0, 91.0, 83.0, 57.0, 59.0, 37.0, 21.0, 11.0, 12.0, 10.0, 9.0, 7.0, 7.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.265625, -10.83203125, -10.3984375, -9.96484375, -9.53125, -9.09765625, -8.6640625, -8.23046875, -7.796875, -7.36328125, -6.9296875, -6.49609375, -6.0625, -5.62890625, -5.1953125, -4.76171875, -4.328125, -3.89453125, -3.4609375, -3.02734375, -2.59375, -2.16015625, -1.7265625, -1.29296875, -0.859375, -0.42578125, 0.0078125, 0.44140625, 0.875, 1.30859375, 1.7421875, 2.17578125, 2.609375, 3.04296875, 3.4765625, 3.91015625, 4.34375, 4.77734375, 5.2109375, 5.64453125, 6.078125, 6.51171875, 6.9453125, 7.37890625, 7.8125, 8.24609375, 8.6796875, 9.11328125, 9.546875, 9.98046875, 10.4140625, 10.84765625, 11.28125, 11.71484375, 12.1484375, 12.58203125, 13.015625, 13.44921875, 13.8828125, 14.31640625, 14.75, 15.18359375, 15.6171875, 16.05078125, 16.484375]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 19.0, 31.0, 63.0, 87.0, 123.0, 168.0, 169.0, 155.0, 102.0, 43.0, 27.0, 17.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.459632873535156, -26.364343643188477, -25.269054412841797, -24.173765182495117, -23.078475952148438, -21.983186721801758, -20.887897491455078, -19.7926082611084, -18.69731903076172, -17.60202980041504, -16.50674057006836, -15.41145133972168, -14.316162109375, -13.22087287902832, -12.12558364868164, -11.030294418334961, -9.935005187988281, -8.839715957641602, -7.744426727294922, -6.649137496948242, -5.5538482666015625, -4.458559036254883, -3.363269805908203, -2.2679805755615234, -1.1726913452148438, -0.07740211486816406, 1.0178871154785156, 2.1131763458251953, 3.208465576171875, 4.303754806518555, 5.399044036865234, 6.494333267211914, 7.589618682861328, 8.684907913208008, 9.780197143554688, 10.875486373901367, 11.970775604248047, 13.066064834594727, 14.161354064941406, 15.256643295288086, 16.351932525634766, 17.447221755981445, 18.542510986328125, 19.637800216674805, 20.733089447021484, 21.828378677368164, 22.923667907714844, 24.018957138061523, 25.114246368408203, 26.209535598754883, 27.304824829101562, 28.400114059448242, 29.495403289794922, 30.5906925201416, 31.68598175048828, 32.781272888183594, 33.87656021118164, 34.97184753417969, 36.067138671875, 37.16242980957031, 38.25771713256836, 39.353004455566406, 40.44829559326172, 41.54358673095703, 42.63887405395508]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 4.0, 7.0, 10.0, 12.0, 9.0, 14.0, 18.0, 25.0, 26.0, 35.0, 36.0, 26.0, 34.0, 36.0, 39.0, 33.0, 36.0, 44.0, 43.0, 46.0, 32.0, 45.0, 40.0, 41.0, 42.0, 36.0, 33.0, 35.0, 32.0, 26.0, 16.0, 21.0, 13.0, 12.0, 11.0, 10.0, 5.0, 5.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.082216262817383, -17.480741500854492, -16.879268646240234, -16.277793884277344, -15.676319122314453, -15.074845314025879, -14.473371505737305, -13.871896743774414, -13.27042293548584, -12.668949127197266, -12.067474365234375, -11.4660005569458, -10.864526748657227, -10.263051986694336, -9.661578178405762, -9.060104370117188, -8.458629608154297, -7.8571553230285645, -7.255681037902832, -6.654207229614258, -6.052732944488525, -5.451258659362793, -4.849784851074219, -4.248310565948486, -3.646836280822754, -3.0453619956970215, -2.443887948989868, -1.8424137830734253, -1.2409396171569824, -0.63946533203125, -0.03799128532409668, 0.5634827613830566, 1.1649551391601562, 1.7664293050765991, 2.367903470993042, 2.9693775177001953, 3.5708518028259277, 4.17232608795166, 4.773799896240234, 5.375274181365967, 5.976748466491699, 6.578222751617432, 7.179697036743164, 7.781170845031738, 8.382644653320312, 8.984119415283203, 9.585593223571777, 10.187067031860352, 10.788541793823242, 11.390015602111816, 11.991490364074707, 12.592964172363281, 13.194438934326172, 13.795912742614746, 14.39738655090332, 14.998861312866211, 15.600335121154785, 16.20180892944336, 16.80328369140625, 17.40475845336914, 18.0062313079834, 18.60770606994629, 19.20918083190918, 19.810653686523438, 20.412128448486328]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 7.0, 3.0, 9.0, 5.0, 15.0, 13.0, 15.0, 14.0, 20.0, 16.0, 18.0, 20.0, 21.0, 29.0, 23.0, 30.0, 30.0, 36.0, 41.0, 44.0, 52.0, 41.0, 44.0, 40.0, 39.0, 36.0, 35.0, 33.0, 32.0, 38.0, 23.0, 20.0, 24.0, 25.0, 12.0, 10.0, 13.0, 13.0, 7.0, 12.0, 11.0, 9.0, 9.0, 5.0, 4.0, 3.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.42578125, -2.35235595703125, -2.2789306640625, -2.20550537109375, -2.132080078125, -2.05865478515625, -1.9852294921875, -1.91180419921875, -1.83837890625, -1.76495361328125, -1.6915283203125, -1.61810302734375, -1.544677734375, -1.47125244140625, -1.3978271484375, -1.32440185546875, -1.2509765625, -1.17755126953125, -1.1041259765625, -1.03070068359375, -0.957275390625, -0.88385009765625, -0.8104248046875, -0.73699951171875, -0.66357421875, -0.59014892578125, -0.5167236328125, -0.44329833984375, -0.369873046875, -0.29644775390625, -0.2230224609375, -0.14959716796875, -0.076171875, -0.00274658203125, 0.0706787109375, 0.14410400390625, 0.217529296875, 0.29095458984375, 0.3643798828125, 0.43780517578125, 0.51123046875, 0.58465576171875, 0.6580810546875, 0.73150634765625, 0.804931640625, 0.87835693359375, 0.9517822265625, 1.02520751953125, 1.0986328125, 1.17205810546875, 1.2454833984375, 1.31890869140625, 1.392333984375, 1.46575927734375, 1.5391845703125, 1.61260986328125, 1.68603515625, 1.75946044921875, 1.8328857421875, 1.90631103515625, 1.979736328125, 2.05316162109375, 2.1265869140625, 2.20001220703125, 2.2734375]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 3.0, 10.0, 10.0, 17.0, 24.0, 37.0, 45.0, 83.0, 105.0, 149.0, 232.0, 384.0, 533.0, 819.0, 1184.0, 1723.0, 2551.0, 3651.0, 5387.0, 7826.0, 11184.0, 16615.0, 25372.0, 40039.0, 66139.0, 122234.0, 264629.0, 215312.0, 100836.0, 56405.0, 34962.0, 22674.0, 15127.0, 10316.0, 6886.0, 4774.0, 3258.0, 2317.0, 1443.0, 1045.0, 753.0, 491.0, 325.0, 229.0, 131.0, 99.0, 64.0, 47.0, 41.0, 16.0, 11.0, 8.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.4189453125, -0.4053688049316406, -0.39179229736328125, -0.3782157897949219, -0.3646392822265625, -0.3510627746582031, -0.33748626708984375, -0.3239097595214844, -0.310333251953125, -0.2967567443847656, -0.28318023681640625, -0.2696037292480469, -0.2560272216796875, -0.24245071411132812, -0.22887420654296875, -0.21529769897460938, -0.20172119140625, -0.18814468383789062, -0.17456817626953125, -0.16099166870117188, -0.1474151611328125, -0.13383865356445312, -0.12026214599609375, -0.10668563842773438, -0.093109130859375, -0.07953262329101562, -0.06595611572265625, -0.052379608154296875, -0.0388031005859375, -0.025226593017578125, -0.01165008544921875, 0.001926422119140625, 0.0155029296875, 0.029079437255859375, 0.04265594482421875, 0.056232452392578125, 0.0698089599609375, 0.08338546752929688, 0.09696197509765625, 0.11053848266601562, 0.124114990234375, 0.13769149780273438, 0.15126800537109375, 0.16484451293945312, 0.1784210205078125, 0.19199752807617188, 0.20557403564453125, 0.21915054321289062, 0.23272705078125, 0.24630355834960938, 0.25988006591796875, 0.2734565734863281, 0.2870330810546875, 0.3006095886230469, 0.31418609619140625, 0.3277626037597656, 0.341339111328125, 0.3549156188964844, 0.36849212646484375, 0.3820686340332031, 0.3956451416015625, 0.4092216491699219, 0.42279815673828125, 0.4363746643066406, 0.449951171875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 6.0, 9.0, 7.0, 7.0, 14.0, 13.0, 11.0, 9.0, 24.0, 25.0, 23.0, 20.0, 23.0, 22.0, 30.0, 24.0, 38.0, 38.0, 50.0, 37.0, 43.0, 1063.0, 42.0, 40.0, 47.0, 39.0, 36.0, 28.0, 31.0, 36.0, 18.0, 30.0, 27.0, 18.0, 21.0, 11.0, 12.0, 15.0, 7.0, 10.0, 8.0, 10.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.53125, -1.4826507568359375, -1.434051513671875, -1.3854522705078125, -1.33685302734375, -1.2882537841796875, -1.239654541015625, -1.1910552978515625, -1.1424560546875, -1.0938568115234375, -1.045257568359375, -0.9966583251953125, -0.94805908203125, -0.8994598388671875, -0.850860595703125, -0.8022613525390625, -0.753662109375, -0.7050628662109375, -0.656463623046875, -0.6078643798828125, -0.55926513671875, -0.5106658935546875, -0.462066650390625, -0.4134674072265625, -0.3648681640625, -0.3162689208984375, -0.267669677734375, -0.2190704345703125, -0.17047119140625, -0.1218719482421875, -0.073272705078125, -0.0246734619140625, 0.02392578125, 0.0725250244140625, 0.121124267578125, 0.1697235107421875, 0.21832275390625, 0.2669219970703125, 0.315521240234375, 0.3641204833984375, 0.4127197265625, 0.4613189697265625, 0.509918212890625, 0.5585174560546875, 0.60711669921875, 0.6557159423828125, 0.704315185546875, 0.7529144287109375, 0.801513671875, 0.8501129150390625, 0.898712158203125, 0.9473114013671875, 0.99591064453125, 1.0445098876953125, 1.093109130859375, 1.1417083740234375, 1.1903076171875, 1.2389068603515625, 1.287506103515625, 1.3361053466796875, 1.38470458984375, 1.4333038330078125, 1.481903076171875, 1.5305023193359375, 1.5791015625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 7.0, 18.0, 19.0, 28.0, 53.0, 61.0, 78.0, 130.0, 195.0, 261.0, 422.0, 662.0, 947.0, 1447.0, 2107.0, 3272.0, 4734.0, 7312.0, 11066.0, 17337.0, 27105.0, 44512.0, 75686.0, 145470.0, 1343819.0, 181949.0, 89946.0, 50980.0, 30767.0, 19588.0, 12439.0, 8352.0, 5361.0, 3657.0, 2461.0, 1603.0, 1100.0, 734.0, 500.0, 332.0, 206.0, 142.0, 85.0, 66.0, 32.0, 31.0, 25.0, 8.0, 5.0, 5.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.43017578125, -0.4165802001953125, -0.402984619140625, -0.3893890380859375, -0.37579345703125, -0.3621978759765625, -0.348602294921875, -0.3350067138671875, -0.3214111328125, -0.3078155517578125, -0.294219970703125, -0.2806243896484375, -0.26702880859375, -0.2534332275390625, -0.239837646484375, -0.2262420654296875, -0.212646484375, -0.1990509033203125, -0.185455322265625, -0.1718597412109375, -0.15826416015625, -0.1446685791015625, -0.131072998046875, -0.1174774169921875, -0.1038818359375, -0.0902862548828125, -0.076690673828125, -0.0630950927734375, -0.04949951171875, -0.0359039306640625, -0.022308349609375, -0.0087127685546875, 0.0048828125, 0.0184783935546875, 0.032073974609375, 0.0456695556640625, 0.05926513671875, 0.0728607177734375, 0.086456298828125, 0.1000518798828125, 0.1136474609375, 0.1272430419921875, 0.140838623046875, 0.1544342041015625, 0.16802978515625, 0.1816253662109375, 0.195220947265625, 0.2088165283203125, 0.222412109375, 0.2360076904296875, 0.249603271484375, 0.2631988525390625, 0.27679443359375, 0.2903900146484375, 0.303985595703125, 0.3175811767578125, 0.3311767578125, 0.3447723388671875, 0.358367919921875, 0.3719635009765625, 0.38555908203125, 0.3991546630859375, 0.412750244140625, 0.4263458251953125, 0.43994140625]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 2.0, 4.0, 1.0, 4.0, 8.0, 6.0, 12.0, 9.0, 17.0, 15.0, 12.0, 16.0, 28.0, 25.0, 34.0, 29.0, 51.0, 49.0, 41.0, 46.0, 50.0, 59.0, 50.0, 67.0, 54.0, 54.0, 42.0, 33.0, 37.0, 26.0, 25.0, 13.0, 16.0, 13.0, 14.0, 9.0, 4.0, 8.0, 5.0, 5.0, 1.0, 5.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0002791881561279297, -0.0002708137035369873, -0.0002624392509460449, -0.00025406479835510254, -0.00024569034576416016, -0.00023731589317321777, -0.0002289414405822754, -0.000220566987991333, -0.00021219253540039062, -0.00020381808280944824, -0.00019544363021850586, -0.00018706917762756348, -0.0001786947250366211, -0.0001703202724456787, -0.00016194581985473633, -0.00015357136726379395, -0.00014519691467285156, -0.00013682246208190918, -0.0001284480094909668, -0.00012007355690002441, -0.00011169910430908203, -0.00010332465171813965, -9.495019912719727e-05, -8.657574653625488e-05, -7.82012939453125e-05, -6.982684135437012e-05, -6.145238876342773e-05, -5.307793617248535e-05, -4.470348358154297e-05, -3.6329030990600586e-05, -2.7954578399658203e-05, -1.958012580871582e-05, -1.1205673217773438e-05, -2.8312206268310547e-06, 5.543231964111328e-06, 1.3917684555053711e-05, 2.2292137145996094e-05, 3.0666589736938477e-05, 3.904104232788086e-05, 4.741549491882324e-05, 5.5789947509765625e-05, 6.416440010070801e-05, 7.253885269165039e-05, 8.091330528259277e-05, 8.928775787353516e-05, 9.766221046447754e-05, 0.00010603666305541992, 0.0001144111156463623, 0.0001227855682373047, 0.00013116002082824707, 0.00013953447341918945, 0.00014790892601013184, 0.00015628337860107422, 0.0001646578311920166, 0.00017303228378295898, 0.00018140673637390137, 0.00018978118896484375, 0.00019815564155578613, 0.00020653009414672852, 0.0002149045467376709, 0.00022327899932861328, 0.00023165345191955566, 0.00024002790451049805, 0.00024840235710144043, 0.0002567768096923828]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 1.0, 0.0, 3.0, 5.0, 1.0, 5.0, 7.0, 5.0, 7.0, 5.0, 11.0, 18.0, 13.0, 26.0, 30.0, 42.0, 41.0, 62.0, 73.0, 145.0, 236.0, 400.0, 806.0, 5103.0, 996327.0, 42811.0, 1104.0, 461.0, 233.0, 162.0, 103.0, 79.0, 54.0, 41.0, 26.0, 16.0, 26.0, 12.0, 9.0, 9.0, 10.0, 13.0, 9.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00519561767578125, -0.0050261616706848145, -0.004856705665588379, -0.004687249660491943, -0.004517793655395508, -0.004348337650299072, -0.004178881645202637, -0.004009425640106201, -0.0038399696350097656, -0.00367051362991333, -0.0035010576248168945, -0.003331601619720459, -0.0031621456146240234, -0.002992689609527588, -0.0028232336044311523, -0.002653777599334717, -0.0024843215942382812, -0.0023148655891418457, -0.00214540958404541, -0.0019759535789489746, -0.001806497573852539, -0.0016370415687561035, -0.001467585563659668, -0.0012981295585632324, -0.0011286735534667969, -0.0009592175483703613, -0.0007897615432739258, -0.0006203055381774902, -0.0004508495330810547, -0.00028139352798461914, -0.0001119375228881836, 5.751848220825195e-05, 0.0002269744873046875, 0.00039643049240112305, 0.0005658864974975586, 0.0007353425025939941, 0.0009047985076904297, 0.0010742545127868652, 0.0012437105178833008, 0.0014131665229797363, 0.0015826225280761719, 0.0017520785331726074, 0.001921534538269043, 0.0020909905433654785, 0.002260446548461914, 0.0024299025535583496, 0.002599358558654785, 0.0027688145637512207, 0.0029382705688476562, 0.003107726573944092, 0.0032771825790405273, 0.003446638584136963, 0.0036160945892333984, 0.003785550594329834, 0.0039550065994262695, 0.004124462604522705, 0.004293918609619141, 0.004463374614715576, 0.004632830619812012, 0.004802286624908447, 0.004971742630004883, 0.005141198635101318, 0.005310654640197754, 0.0054801106452941895, 0.005649566650390625]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 11.0, 62.0, 204.0, 405.0, 253.0, 63.0, 16.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009686995763331652, -0.0009487346396781504, -0.0009287697612307966, -0.0009088048245757818, -0.0008888398879207671, -0.0008688750094734132, -0.0008489100728183985, -0.0008289451943710446, -0.0008089802577160299, -0.0007890153210610151, -0.0007690504426136613, -0.0007490855059586465, -0.0007291205693036318, -0.0007091556908562779, -0.0006891907542012632, -0.0006692258175462484, -0.0006492609390988946, -0.0006292960024438798, -0.000609331123996526, -0.0005893661873415112, -0.0005694012506864965, -0.0005494363722391427, -0.0005294714355841279, -0.0005095065571367741, -0.0004895415622740984, -0.0004695766547229141, -0.00044961171806789935, -0.00042964681051671505, -0.00040968190296553075, -0.00038971699541434646, -0.0003697520587593317, -0.0003497871512081474, -0.0003298222436569631, -0.0003098573361057788, -0.00028989239945076406, -0.00026992749189957976, -0.00024996258434839547, -0.00022999766224529594, -0.00021003274014219642, -0.00019006783259101212, -0.0001701029104879126, -0.00015013798838481307, -0.00013017308083362877, -0.00011020815873052925, -9.024324390338734e-05, -7.027832907624543e-05, -5.03134069731459e-05, -3.0348499421961606e-05, -1.038357731886208e-05, 9.581339327269234e-06, 2.9546255973400548e-05, 4.9511174438521266e-05, 6.947608926566318e-05, 8.944100409280509e-05, 0.00010940592619590461, 0.0001293708337470889, 0.00014933575585018843, 0.00016930067795328796, 0.00018926558550447226, 0.00020923050760757178, 0.0002291954297106713, 0.0002491603372618556, 0.00026912527391687036, 0.0002890901523642242, 0.00030905508901923895]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 1.0, 2.0, 3.0, 4.0, 0.0, 8.0, 9.0, 12.0, 10.0, 7.0, 13.0, 12.0, 24.0, 22.0, 21.0, 29.0, 40.0, 27.0, 37.0, 35.0, 49.0, 37.0, 38.0, 57.0, 39.0, 47.0, 43.0, 51.0, 38.0, 35.0, 30.0, 23.0, 27.0, 31.0, 25.0, 22.0, 17.0, 17.0, 12.0, 15.0, 6.0, 10.0, 5.0, 8.0, 1.0, 2.0, 3.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015354156494140625, -0.00014870613813400269, -0.00014387071132659912, -0.00013903528451919556, -0.000134199857711792, -0.00012936443090438843, -0.00012452900409698486, -0.0001196935772895813, -0.00011485815048217773, -0.00011002272367477417, -0.0001051872968673706, -0.00010035187005996704, -9.551644325256348e-05, -9.068101644515991e-05, -8.584558963775635e-05, -8.101016283035278e-05, -7.617473602294922e-05, -7.133930921554565e-05, -6.650388240814209e-05, -6.166845560073853e-05, -5.683302879333496e-05, -5.1997601985931396e-05, -4.716217517852783e-05, -4.232674837112427e-05, -3.74913215637207e-05, -3.265589475631714e-05, -2.7820467948913574e-05, -2.298504114151001e-05, -1.8149614334106445e-05, -1.3314187526702881e-05, -8.478760719299316e-06, -3.643333911895752e-06, 1.1920928955078125e-06, 6.027519702911377e-06, 1.0862946510314941e-05, 1.5698373317718506e-05, 2.053380012512207e-05, 2.5369226932525635e-05, 3.02046537399292e-05, 3.5040080547332764e-05, 3.987550735473633e-05, 4.471093416213989e-05, 4.954636096954346e-05, 5.438178777694702e-05, 5.9217214584350586e-05, 6.405264139175415e-05, 6.888806819915771e-05, 7.372349500656128e-05, 7.855892181396484e-05, 8.339434862136841e-05, 8.822977542877197e-05, 9.306520223617554e-05, 9.79006290435791e-05, 0.00010273605585098267, 0.00010757148265838623, 0.0001124069094657898, 0.00011724233627319336, 0.00012207776308059692, 0.0001269131898880005, 0.00013174861669540405, 0.00013658404350280762, 0.00014141947031021118, 0.00014625489711761475, 0.0001510903239250183, 0.00015592575073242188]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 7.0, 3.0, 9.0, 5.0, 15.0, 13.0, 15.0, 14.0, 20.0, 16.0, 18.0, 20.0, 21.0, 29.0, 23.0, 30.0, 30.0, 36.0, 41.0, 44.0, 52.0, 41.0, 44.0, 40.0, 39.0, 36.0, 35.0, 33.0, 32.0, 38.0, 23.0, 20.0, 24.0, 25.0, 12.0, 10.0, 13.0, 13.0, 7.0, 12.0, 11.0, 9.0, 9.0, 5.0, 4.0, 3.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.42578125, -2.35235595703125, -2.2789306640625, -2.20550537109375, -2.132080078125, -2.05865478515625, -1.9852294921875, -1.91180419921875, -1.83837890625, -1.76495361328125, -1.6915283203125, -1.61810302734375, -1.544677734375, -1.47125244140625, -1.3978271484375, -1.32440185546875, -1.2509765625, -1.17755126953125, -1.1041259765625, -1.03070068359375, -0.957275390625, -0.88385009765625, -0.8104248046875, -0.73699951171875, -0.66357421875, -0.59014892578125, -0.5167236328125, -0.44329833984375, -0.369873046875, -0.29644775390625, -0.2230224609375, -0.14959716796875, -0.076171875, -0.00274658203125, 0.0706787109375, 0.14410400390625, 0.217529296875, 0.29095458984375, 0.3643798828125, 0.43780517578125, 0.51123046875, 0.58465576171875, 0.6580810546875, 0.73150634765625, 0.804931640625, 0.87835693359375, 0.9517822265625, 1.02520751953125, 1.0986328125, 1.17205810546875, 1.2454833984375, 1.31890869140625, 1.392333984375, 1.46575927734375, 1.5391845703125, 1.61260986328125, 1.68603515625, 1.75946044921875, 1.8328857421875, 1.90631103515625, 1.979736328125, 2.05316162109375, 2.1265869140625, 2.20001220703125, 2.2734375]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 6.0, 7.0, 11.0, 19.0, 30.0, 35.0, 49.0, 71.0, 114.0, 140.0, 237.0, 321.0, 538.0, 1039.0, 2322.0, 6001.0, 16627.0, 44756.0, 114712.0, 287360.0, 343159.0, 140792.0, 55805.0, 21025.0, 7433.0, 2930.0, 1191.0, 658.0, 403.0, 247.0, 155.0, 112.0, 71.0, 57.0, 36.0, 34.0, 13.0, 12.0, 12.0, 9.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.326171875, -3.228668212890625, -3.13116455078125, -3.033660888671875, -2.9361572265625, -2.838653564453125, -2.74114990234375, -2.643646240234375, -2.546142578125, -2.448638916015625, -2.35113525390625, -2.253631591796875, -2.1561279296875, -2.058624267578125, -1.96112060546875, -1.863616943359375, -1.76611328125, -1.668609619140625, -1.57110595703125, -1.473602294921875, -1.3760986328125, -1.278594970703125, -1.18109130859375, -1.083587646484375, -0.986083984375, -0.888580322265625, -0.79107666015625, -0.693572998046875, -0.5960693359375, -0.498565673828125, -0.40106201171875, -0.303558349609375, -0.2060546875, -0.108551025390625, -0.01104736328125, 0.086456298828125, 0.1839599609375, 0.281463623046875, 0.37896728515625, 0.476470947265625, 0.573974609375, 0.671478271484375, 0.76898193359375, 0.866485595703125, 0.9639892578125, 1.061492919921875, 1.15899658203125, 1.256500244140625, 1.35400390625, 1.451507568359375, 1.54901123046875, 1.646514892578125, 1.7440185546875, 1.841522216796875, 1.93902587890625, 2.036529541015625, 2.134033203125, 2.231536865234375, 2.32904052734375, 2.426544189453125, 2.5240478515625, 2.621551513671875, 2.71905517578125, 2.816558837890625, 2.9140625]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 4.0, 1.0, 7.0, 10.0, 10.0, 15.0, 15.0, 14.0, 26.0, 22.0, 33.0, 24.0, 44.0, 33.0, 43.0, 49.0, 85.0, 125.0, 335.0, 1451.0, 185.0, 93.0, 72.0, 45.0, 33.0, 43.0, 31.0, 36.0, 20.0, 33.0, 23.0, 20.0, 13.0, 11.0, 19.0, 5.0, 8.0, 6.0, 2.0, 5.0, 1.0, 2.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8515625, -7.5513916015625, -7.251220703125, -6.9510498046875, -6.65087890625, -6.3507080078125, -6.050537109375, -5.7503662109375, -5.4501953125, -5.1500244140625, -4.849853515625, -4.5496826171875, -4.24951171875, -3.9493408203125, -3.649169921875, -3.3489990234375, -3.048828125, -2.7486572265625, -2.448486328125, -2.1483154296875, -1.84814453125, -1.5479736328125, -1.247802734375, -0.9476318359375, -0.6474609375, -0.3472900390625, -0.047119140625, 0.2530517578125, 0.55322265625, 0.8533935546875, 1.153564453125, 1.4537353515625, 1.75390625, 2.0540771484375, 2.354248046875, 2.6544189453125, 2.95458984375, 3.2547607421875, 3.554931640625, 3.8551025390625, 4.1552734375, 4.4554443359375, 4.755615234375, 5.0557861328125, 5.35595703125, 5.6561279296875, 5.956298828125, 6.2564697265625, 6.556640625, 6.8568115234375, 7.156982421875, 7.4571533203125, 7.75732421875, 8.0574951171875, 8.357666015625, 8.6578369140625, 8.9580078125, 9.2581787109375, 9.558349609375, 9.8585205078125, 10.15869140625, 10.4588623046875, 10.759033203125, 11.0592041015625, 11.359375]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 5.0, 6.0, 10.0, 6.0, 13.0, 10.0, 17.0, 22.0, 33.0, 31.0, 40.0, 59.0, 76.0, 115.0, 168.0, 232.0, 413.0, 1152.0, 49961.0, 3085490.0, 6176.0, 680.0, 318.0, 188.0, 115.0, 88.0, 65.0, 59.0, 46.0, 25.0, 16.0, 11.0, 12.0, 8.0, 7.0, 9.0, 6.0, 6.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.046875, -26.057373046875, -25.06787109375, -24.078369140625, -23.0888671875, -22.099365234375, -21.10986328125, -20.120361328125, -19.130859375, -18.141357421875, -17.15185546875, -16.162353515625, -15.1728515625, -14.183349609375, -13.19384765625, -12.204345703125, -11.21484375, -10.225341796875, -9.23583984375, -8.246337890625, -7.2568359375, -6.267333984375, -5.27783203125, -4.288330078125, -3.298828125, -2.309326171875, -1.31982421875, -0.330322265625, 0.6591796875, 1.648681640625, 2.63818359375, 3.627685546875, 4.6171875, 5.606689453125, 6.59619140625, 7.585693359375, 8.5751953125, 9.564697265625, 10.55419921875, 11.543701171875, 12.533203125, 13.522705078125, 14.51220703125, 15.501708984375, 16.4912109375, 17.480712890625, 18.47021484375, 19.459716796875, 20.44921875, 21.438720703125, 22.42822265625, 23.417724609375, 24.4072265625, 25.396728515625, 26.38623046875, 27.375732421875, 28.365234375, 29.354736328125, 30.34423828125, 31.333740234375, 32.3232421875, 33.312744140625, 34.30224609375, 35.291748046875, 36.28125]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 7.0, 260.0, 724.0, 27.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.614267349243164, -20.674463272094727, -16.73465919494629, -12.794856071472168, -8.85505199432373, -4.915248870849609, -0.9754447937011719, 2.9643592834472656, 6.904163360595703, 10.84396743774414, 14.783771514892578, 18.723575592041016, 22.663379669189453, 26.603181838989258, 30.542985916137695, 34.4827880859375, 38.42259216308594, 42.362396240234375, 46.30220031738281, 50.24200439453125, 54.18180847167969, 58.121612548828125, 62.06141662597656, 66.001220703125, 69.94102478027344, 73.88082885742188, 77.82063293457031, 81.76043701171875, 85.70024108886719, 89.64004516601562, 93.57984924316406, 97.5196533203125, 101.4594497680664, 105.39925384521484, 109.33905792236328, 113.27886199951172, 117.21866607666016, 121.1584701538086, 125.09827423095703, 129.03807067871094, 132.97787475585938, 136.9176788330078, 140.85748291015625, 144.7972869873047, 148.73709106445312, 152.67689514160156, 156.61669921875, 160.55650329589844, 164.49630737304688, 168.4361114501953, 172.37591552734375, 176.3157196044922, 180.25552368164062, 184.19532775878906, 188.1351318359375, 192.07493591308594, 196.01473999023438, 199.9545440673828, 203.89434814453125, 207.8341522216797, 211.77395629882812, 215.71376037597656, 219.653564453125, 223.59336853027344, 227.53317260742188]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 3.0, 7.0, 9.0, 12.0, 6.0, 7.0, 7.0, 15.0, 10.0, 18.0, 18.0, 22.0, 25.0, 35.0, 33.0, 24.0, 30.0, 40.0, 36.0, 38.0, 40.0, 44.0, 46.0, 35.0, 45.0, 43.0, 32.0, 29.0, 31.0, 34.0, 24.0, 31.0, 33.0, 25.0, 20.0, 21.0, 19.0, 13.0, 8.0, 8.0, 7.0, 5.0, 7.0, 4.0, 3.0, 2.0, 4.0, 0.0, 2.0, 1.0], "bins": [-29.23430061340332, -28.441085815429688, -27.647872924804688, -26.854658126831055, -26.061443328857422, -25.268230438232422, -24.47501564025879, -23.681800842285156, -22.888587951660156, -22.095373153686523, -21.302160263061523, -20.50894546508789, -19.715730667114258, -18.922515869140625, -18.129302978515625, -17.336088180541992, -16.54287338256836, -15.749659538269043, -14.95644474029541, -14.163230895996094, -13.370016098022461, -12.576802253723145, -11.783588409423828, -10.990373611450195, -10.197159767150879, -9.403945922851562, -8.61073112487793, -7.817517280578613, -7.024302959442139, -6.231088638305664, -5.437874794006348, -4.644660472869873, -3.8514480590820312, -3.0582337379455566, -2.265019655227661, -1.4718055725097656, -0.678591251373291, 0.1146230697631836, 0.9078369140625, 1.7010512351989746, 2.494265556335449, 3.287479877471924, 4.080694198608398, 4.873908042907715, 5.6671223640441895, 6.460336685180664, 7.2535505294799805, 8.046764373779297, 8.83997917175293, 9.633193016052246, 10.426407814025879, 11.219621658325195, 12.012836456298828, 12.806050300598145, 13.599264144897461, 14.392478942871094, 15.18569278717041, 15.978906631469727, 16.77212142944336, 17.56533432006836, 18.358549118041992, 19.151763916015625, 19.944976806640625, 20.738191604614258, 21.53140640258789]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 2.0, 6.0, 7.0, 5.0, 5.0, 11.0, 18.0, 12.0, 13.0, 15.0, 19.0, 22.0, 24.0, 26.0, 41.0, 28.0, 31.0, 46.0, 38.0, 41.0, 46.0, 48.0, 50.0, 37.0, 35.0, 46.0, 38.0, 44.0, 29.0, 24.0, 29.0, 32.0, 18.0, 14.0, 22.0, 8.0, 10.0, 14.0, 11.0, 5.0, 9.0, 7.0, 5.0, 7.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.904296875, -2.813507080078125, -2.72271728515625, -2.631927490234375, -2.5411376953125, -2.450347900390625, -2.35955810546875, -2.268768310546875, -2.177978515625, -2.087188720703125, -1.99639892578125, -1.905609130859375, -1.8148193359375, -1.724029541015625, -1.63323974609375, -1.542449951171875, -1.45166015625, -1.360870361328125, -1.27008056640625, -1.179290771484375, -1.0885009765625, -0.997711181640625, -0.90692138671875, -0.816131591796875, -0.725341796875, -0.634552001953125, -0.54376220703125, -0.452972412109375, -0.3621826171875, -0.271392822265625, -0.18060302734375, -0.089813232421875, 0.0009765625, 0.091766357421875, 0.18255615234375, 0.273345947265625, 0.3641357421875, 0.454925537109375, 0.54571533203125, 0.636505126953125, 0.727294921875, 0.818084716796875, 0.90887451171875, 0.999664306640625, 1.0904541015625, 1.181243896484375, 1.27203369140625, 1.362823486328125, 1.45361328125, 1.544403076171875, 1.63519287109375, 1.725982666015625, 1.8167724609375, 1.907562255859375, 1.99835205078125, 2.089141845703125, 2.179931640625, 2.270721435546875, 2.36151123046875, 2.452301025390625, 2.5430908203125, 2.633880615234375, 2.72467041015625, 2.815460205078125, 2.90625]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 4.0, 8.0, 6.0, 10.0, 9.0, 15.0, 11.0, 18.0, 14.0, 14.0, 20.0, 19.0, 39.0, 45.0, 43.0, 65.0, 139.0, 293.0, 850.0, 4361.0, 120869.0, 2561323.0, 1463866.0, 38001.0, 2667.0, 786.0, 279.0, 162.0, 80.0, 51.0, 38.0, 22.0, 19.0, 27.0, 19.0, 10.0, 14.0, 5.0, 10.0, 9.0, 10.0, 8.0, 12.0, 0.0, 5.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.609375, -9.31689453125, -9.0244140625, -8.73193359375, -8.439453125, -8.14697265625, -7.8544921875, -7.56201171875, -7.26953125, -6.97705078125, -6.6845703125, -6.39208984375, -6.099609375, -5.80712890625, -5.5146484375, -5.22216796875, -4.9296875, -4.63720703125, -4.3447265625, -4.05224609375, -3.759765625, -3.46728515625, -3.1748046875, -2.88232421875, -2.58984375, -2.29736328125, -2.0048828125, -1.71240234375, -1.419921875, -1.12744140625, -0.8349609375, -0.54248046875, -0.25, 0.04248046875, 0.3349609375, 0.62744140625, 0.919921875, 1.21240234375, 1.5048828125, 1.79736328125, 2.08984375, 2.38232421875, 2.6748046875, 2.96728515625, 3.259765625, 3.55224609375, 3.8447265625, 4.13720703125, 4.4296875, 4.72216796875, 5.0146484375, 5.30712890625, 5.599609375, 5.89208984375, 6.1845703125, 6.47705078125, 6.76953125, 7.06201171875, 7.3544921875, 7.64697265625, 7.939453125, 8.23193359375, 8.5244140625, 8.81689453125, 9.109375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 10.0, 14.0, 17.0, 16.0, 22.0, 38.0, 51.0, 60.0, 91.0, 110.0, 174.0, 222.0, 274.0, 322.0, 370.0, 399.0, 384.0, 356.0, 275.0, 202.0, 159.0, 123.0, 109.0, 67.0, 48.0, 50.0, 30.0, 23.0, 14.0, 11.0, 5.0, 8.0, 5.0, 4.0, 0.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.71875, -5.5430908203125, -5.367431640625, -5.1917724609375, -5.01611328125, -4.8404541015625, -4.664794921875, -4.4891357421875, -4.3134765625, -4.1378173828125, -3.962158203125, -3.7864990234375, -3.61083984375, -3.4351806640625, -3.259521484375, -3.0838623046875, -2.908203125, -2.7325439453125, -2.556884765625, -2.3812255859375, -2.20556640625, -2.0299072265625, -1.854248046875, -1.6785888671875, -1.5029296875, -1.3272705078125, -1.151611328125, -0.9759521484375, -0.80029296875, -0.6246337890625, -0.448974609375, -0.2733154296875, -0.09765625, 0.0780029296875, 0.253662109375, 0.4293212890625, 0.60498046875, 0.7806396484375, 0.956298828125, 1.1319580078125, 1.3076171875, 1.4832763671875, 1.658935546875, 1.8345947265625, 2.01025390625, 2.1859130859375, 2.361572265625, 2.5372314453125, 2.712890625, 2.8885498046875, 3.064208984375, 3.2398681640625, 3.41552734375, 3.5911865234375, 3.766845703125, 3.9425048828125, 4.1181640625, 4.2938232421875, 4.469482421875, 4.6451416015625, 4.82080078125, 4.9964599609375, 5.172119140625, 5.3477783203125, 5.5234375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 3.0, 8.0, 9.0, 9.0, 17.0, 16.0, 31.0, 49.0, 62.0, 91.0, 106.0, 182.0, 214.0, 285.0, 504.0, 1217.0, 25683.0, 3447004.0, 712177.0, 4573.0, 729.0, 388.0, 264.0, 190.0, 125.0, 99.0, 70.0, 49.0, 35.0, 25.0, 22.0, 13.0, 14.0, 9.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.03125, -17.405029296875, -16.77880859375, -16.152587890625, -15.5263671875, -14.900146484375, -14.27392578125, -13.647705078125, -13.021484375, -12.395263671875, -11.76904296875, -11.142822265625, -10.5166015625, -9.890380859375, -9.26416015625, -8.637939453125, -8.01171875, -7.385498046875, -6.75927734375, -6.133056640625, -5.5068359375, -4.880615234375, -4.25439453125, -3.628173828125, -3.001953125, -2.375732421875, -1.74951171875, -1.123291015625, -0.4970703125, 0.129150390625, 0.75537109375, 1.381591796875, 2.0078125, 2.634033203125, 3.26025390625, 3.886474609375, 4.5126953125, 5.138916015625, 5.76513671875, 6.391357421875, 7.017578125, 7.643798828125, 8.27001953125, 8.896240234375, 9.5224609375, 10.148681640625, 10.77490234375, 11.401123046875, 12.02734375, 12.653564453125, 13.27978515625, 13.906005859375, 14.5322265625, 15.158447265625, 15.78466796875, 16.410888671875, 17.037109375, 17.663330078125, 18.28955078125, 18.915771484375, 19.5419921875, 20.168212890625, 20.79443359375, 21.420654296875, 22.046875]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 10.0, 56.0, 244.0, 411.0, 238.0, 54.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.37199401855469, -96.48629760742188, -93.60060119628906, -90.71491241455078, -87.82921600341797, -84.94351959228516, -82.05783081054688, -79.17213439941406, -76.28643798828125, -73.40074157714844, -70.51504516601562, -67.62935638427734, -64.74365997314453, -61.85796356201172, -58.97227096557617, -56.086578369140625, -53.20088195800781, -50.315185546875, -47.42949295043945, -44.543800354003906, -41.658103942871094, -38.77240753173828, -35.886714935302734, -33.00102233886719, -30.115325927734375, -27.229631423950195, -24.343936920166016, -21.458242416381836, -18.572547912597656, -15.686853408813477, -12.801158905029297, -9.915464401245117, -7.0297698974609375, -4.144075393676758, -1.2583808898925781, 1.6273136138916016, 4.513008117675781, 7.398702621459961, 10.28439712524414, 13.17009162902832, 16.0557861328125, 18.94148063659668, 21.82717514038086, 24.71286964416504, 27.59856414794922, 30.4842586517334, 33.36995315551758, 36.255645751953125, 39.14134216308594, 42.02703857421875, 44.9127311706543, 47.798423767089844, 50.684120178222656, 53.56981658935547, 56.455509185791016, 59.34120178222656, 62.226898193359375, 65.11259460449219, 67.998291015625, 70.88397979736328, 73.7696762084961, 76.6553726196289, 79.54106140136719, 82.4267578125, 85.31245422363281]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 8.0, 7.0, 10.0, 13.0, 14.0, 17.0, 21.0, 16.0, 22.0, 24.0, 31.0, 39.0, 41.0, 40.0, 38.0, 35.0, 43.0, 49.0, 41.0, 44.0, 52.0, 49.0, 35.0, 46.0, 31.0, 34.0, 35.0, 30.0, 24.0, 18.0, 15.0, 12.0, 7.0, 11.0, 11.0, 5.0, 12.0, 10.0, 6.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.26325225830078, -18.639440536499023, -18.015626907348633, -17.391815185546875, -16.768003463745117, -16.14419174194336, -15.520378112792969, -14.896566390991211, -14.272753715515137, -13.648941040039062, -13.025129318237305, -12.40131664276123, -11.777503967285156, -11.153692245483398, -10.529879570007324, -9.90606689453125, -9.282255172729492, -8.658442497253418, -8.03463077545166, -7.410818099975586, -6.78700590133667, -6.163193702697754, -5.53938102722168, -4.915568828582764, -4.291756629943848, -3.6679444313049316, -3.0441319942474365, -2.4203195571899414, -1.7965073585510254, -1.1726951599121094, -0.5488827228546143, 0.07492971420288086, 0.6987419128417969, 1.3225542306900024, 1.946366548538208, 2.570178985595703, 3.193991184234619, 3.817803382873535, 4.441616058349609, 5.065428256988525, 5.689240455627441, 6.313052654266357, 6.936864852905273, 7.560677528381348, 8.184490203857422, 8.80830192565918, 9.432114601135254, 10.055927276611328, 10.679738998413086, 11.30355167388916, 11.927363395690918, 12.551176071166992, 13.17498779296875, 13.798800468444824, 14.422613143920898, 15.046424865722656, 15.67023754119873, 16.294050216674805, 16.917861938476562, 17.54167366027832, 18.16548728942871, 18.78929901123047, 19.413110733032227, 20.036924362182617, 20.660736083984375]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 6.0, 10.0, 9.0, 10.0, 15.0, 22.0, 15.0, 25.0, 22.0, 34.0, 35.0, 29.0, 35.0, 37.0, 41.0, 43.0, 49.0, 42.0, 51.0, 39.0, 52.0, 37.0, 43.0, 42.0, 36.0, 29.0, 33.0, 24.0, 18.0, 32.0, 21.0, 14.0, 10.0, 6.0, 10.0, 5.0, 5.0, 4.0, 6.0, 2.0, 0.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.11328125, -3.019744873046875, -2.92620849609375, -2.832672119140625, -2.7391357421875, -2.645599365234375, -2.55206298828125, -2.458526611328125, -2.364990234375, -2.271453857421875, -2.17791748046875, -2.084381103515625, -1.9908447265625, -1.897308349609375, -1.80377197265625, -1.710235595703125, -1.61669921875, -1.523162841796875, -1.42962646484375, -1.336090087890625, -1.2425537109375, -1.149017333984375, -1.05548095703125, -0.961944580078125, -0.868408203125, -0.774871826171875, -0.68133544921875, -0.587799072265625, -0.4942626953125, -0.400726318359375, -0.30718994140625, -0.213653564453125, -0.1201171875, -0.026580810546875, 0.06695556640625, 0.160491943359375, 0.2540283203125, 0.347564697265625, 0.44110107421875, 0.534637451171875, 0.628173828125, 0.721710205078125, 0.81524658203125, 0.908782958984375, 1.0023193359375, 1.095855712890625, 1.18939208984375, 1.282928466796875, 1.37646484375, 1.470001220703125, 1.56353759765625, 1.657073974609375, 1.7506103515625, 1.844146728515625, 1.93768310546875, 2.031219482421875, 2.124755859375, 2.218292236328125, 2.31182861328125, 2.405364990234375, 2.4989013671875, 2.592437744140625, 2.68597412109375, 2.779510498046875, 2.873046875]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 10.0, 10.0, 14.0, 13.0, 22.0, 36.0, 37.0, 63.0, 102.0, 127.0, 211.0, 299.0, 462.0, 780.0, 1129.0, 1866.0, 2919.0, 4876.0, 7488.0, 12303.0, 19930.0, 32437.0, 54822.0, 103209.0, 232474.0, 289340.0, 123512.0, 63711.0, 36927.0, 22611.0, 13801.0, 8593.0, 5287.0, 3303.0, 2123.0, 1243.0, 850.0, 561.0, 340.0, 247.0, 163.0, 104.0, 68.0, 51.0, 28.0, 25.0, 10.0, 10.0, 8.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.52197265625, -0.5046463012695312, -0.4873199462890625, -0.46999359130859375, -0.452667236328125, -0.43534088134765625, -0.4180145263671875, -0.40068817138671875, -0.38336181640625, -0.36603546142578125, -0.3487091064453125, -0.33138275146484375, -0.314056396484375, -0.29673004150390625, -0.2794036865234375, -0.26207733154296875, -0.2447509765625, -0.22742462158203125, -0.2100982666015625, -0.19277191162109375, -0.175445556640625, -0.15811920166015625, -0.1407928466796875, -0.12346649169921875, -0.10614013671875, -0.08881378173828125, -0.0714874267578125, -0.05416107177734375, -0.036834716796875, -0.01950836181640625, -0.0021820068359375, 0.01514434814453125, 0.032470703125, 0.04979705810546875, 0.0671234130859375, 0.08444976806640625, 0.101776123046875, 0.11910247802734375, 0.1364288330078125, 0.15375518798828125, 0.17108154296875, 0.18840789794921875, 0.2057342529296875, 0.22306060791015625, 0.240386962890625, 0.25771331787109375, 0.2750396728515625, 0.29236602783203125, 0.3096923828125, 0.32701873779296875, 0.3443450927734375, 0.36167144775390625, 0.378997802734375, 0.39632415771484375, 0.4136505126953125, 0.43097686767578125, 0.44830322265625, 0.46562957763671875, 0.4829559326171875, 0.5002822875976562, 0.517608642578125, 0.5349349975585938, 0.5522613525390625, 0.5695877075195312, 0.5869140625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 4.0, 0.0, 5.0, 2.0, 6.0, 5.0, 7.0, 12.0, 6.0, 15.0, 14.0, 10.0, 17.0, 18.0, 30.0, 23.0, 27.0, 34.0, 28.0, 27.0, 32.0, 31.0, 35.0, 48.0, 47.0, 1057.0, 38.0, 38.0, 37.0, 42.0, 33.0, 37.0, 31.0, 31.0, 30.0, 29.0, 25.0, 24.0, 20.0, 14.0, 21.0, 10.0, 8.0, 5.0, 6.0, 4.0, 4.0, 0.0, 2.0, 7.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.640625, -1.5855865478515625, -1.530548095703125, -1.4755096435546875, -1.42047119140625, -1.3654327392578125, -1.310394287109375, -1.2553558349609375, -1.2003173828125, -1.1452789306640625, -1.090240478515625, -1.0352020263671875, -0.98016357421875, -0.9251251220703125, -0.870086669921875, -0.8150482177734375, -0.760009765625, -0.7049713134765625, -0.649932861328125, -0.5948944091796875, -0.53985595703125, -0.4848175048828125, -0.429779052734375, -0.3747406005859375, -0.3197021484375, -0.2646636962890625, -0.209625244140625, -0.1545867919921875, -0.09954833984375, -0.0445098876953125, 0.010528564453125, 0.0655670166015625, 0.12060546875, 0.1756439208984375, 0.230682373046875, 0.2857208251953125, 0.34075927734375, 0.3957977294921875, 0.450836181640625, 0.5058746337890625, 0.5609130859375, 0.6159515380859375, 0.670989990234375, 0.7260284423828125, 0.78106689453125, 0.8361053466796875, 0.891143798828125, 0.9461822509765625, 1.001220703125, 1.0562591552734375, 1.111297607421875, 1.1663360595703125, 1.22137451171875, 1.2764129638671875, 1.331451416015625, 1.3864898681640625, 1.4415283203125, 1.4965667724609375, 1.551605224609375, 1.6066436767578125, 1.66168212890625, 1.7167205810546875, 1.771759033203125, 1.8267974853515625, 1.8818359375]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 6.0, 5.0, 12.0, 8.0, 25.0, 27.0, 44.0, 81.0, 99.0, 163.0, 196.0, 357.0, 468.0, 726.0, 1051.0, 1483.0, 2226.0, 3194.0, 4941.0, 7389.0, 11353.0, 17699.0, 28251.0, 45215.0, 78062.0, 146501.0, 1337546.0, 178003.0, 90189.0, 52024.0, 31605.0, 19887.0, 12868.0, 8464.0, 5580.0, 3675.0, 2521.0, 1687.0, 1135.0, 776.0, 538.0, 326.0, 259.0, 162.0, 105.0, 83.0, 36.0, 33.0, 14.0, 15.0, 18.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44873046875, -0.43358612060546875, -0.4184417724609375, -0.40329742431640625, -0.388153076171875, -0.37300872802734375, -0.3578643798828125, -0.34272003173828125, -0.32757568359375, -0.31243133544921875, -0.2972869873046875, -0.28214263916015625, -0.266998291015625, -0.25185394287109375, -0.2367095947265625, -0.22156524658203125, -0.2064208984375, -0.19127655029296875, -0.1761322021484375, -0.16098785400390625, -0.145843505859375, -0.13069915771484375, -0.1155548095703125, -0.10041046142578125, -0.08526611328125, -0.07012176513671875, -0.0549774169921875, -0.03983306884765625, -0.024688720703125, -0.00954437255859375, 0.0055999755859375, 0.02074432373046875, 0.035888671875, 0.05103302001953125, 0.0661773681640625, 0.08132171630859375, 0.096466064453125, 0.11161041259765625, 0.1267547607421875, 0.14189910888671875, 0.15704345703125, 0.17218780517578125, 0.1873321533203125, 0.20247650146484375, 0.217620849609375, 0.23276519775390625, 0.2479095458984375, 0.26305389404296875, 0.2781982421875, 0.29334259033203125, 0.3084869384765625, 0.32363128662109375, 0.338775634765625, 0.35391998291015625, 0.3690643310546875, 0.38420867919921875, 0.39935302734375, 0.41449737548828125, 0.4296417236328125, 0.44478607177734375, 0.459930419921875, 0.47507476806640625, 0.4902191162109375, 0.5053634643554688, 0.5205078125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 4.0, 9.0, 8.0, 11.0, 15.0, 17.0, 19.0, 25.0, 24.0, 48.0, 51.0, 40.0, 53.0, 59.0, 61.0, 69.0, 66.0, 65.0, 62.0, 48.0, 56.0, 38.0, 29.0, 24.0, 19.0, 14.0, 13.0, 15.0, 11.0, 9.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003540515899658203, -0.0003424994647502899, -0.0003309473395347595, -0.0003193952143192291, -0.00030784308910369873, -0.00029629096388816833, -0.00028473883867263794, -0.00027318671345710754, -0.00026163458824157715, -0.00025008246302604675, -0.00023853033781051636, -0.00022697821259498596, -0.00021542608737945557, -0.00020387396216392517, -0.00019232183694839478, -0.00018076971173286438, -0.00016921758651733398, -0.0001576654613018036, -0.0001461133360862732, -0.0001345612108707428, -0.0001230090856552124, -0.00011145696043968201, -9.990483522415161e-05, -8.835271000862122e-05, -7.680058479309082e-05, -6.524845957756042e-05, -5.369633436203003e-05, -4.2144209146499634e-05, -3.059208393096924e-05, -1.9039958715438843e-05, -7.487833499908447e-06, 4.064291715621948e-06, 1.5616416931152344e-05, 2.716854214668274e-05, 3.8720667362213135e-05, 5.027279257774353e-05, 6.182491779327393e-05, 7.337704300880432e-05, 8.492916822433472e-05, 9.648129343986511e-05, 0.00010803341865539551, 0.0001195855438709259, 0.0001311376690864563, 0.0001426897943019867, 0.0001542419195175171, 0.00016579404473304749, 0.00017734616994857788, 0.00018889829516410828, 0.00020045042037963867, 0.00021200254559516907, 0.00022355467081069946, 0.00023510679602622986, 0.00024665892124176025, 0.00025821104645729065, 0.00026976317167282104, 0.00028131529688835144, 0.00029286742210388184, 0.00030441954731941223, 0.0003159716725349426, 0.000327523797750473, 0.0003390759229660034, 0.0003506280481815338, 0.0003621801733970642, 0.0003737322986125946, 0.000385284423828125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 1.0, 10.0, 7.0, 9.0, 16.0, 18.0, 21.0, 30.0, 29.0, 58.0, 67.0, 107.0, 155.0, 370.0, 863.0, 28850.0, 1014845.0, 1845.0, 527.0, 251.0, 123.0, 107.0, 61.0, 49.0, 30.0, 27.0, 26.0, 13.0, 8.0, 9.0, 6.0, 7.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00848388671875, -0.008228898048400879, -0.007973909378051758, -0.007718920707702637, -0.007463932037353516, -0.0072089433670043945, -0.0069539546966552734, -0.006698966026306152, -0.006443977355957031, -0.00618898868560791, -0.005934000015258789, -0.005679011344909668, -0.005424022674560547, -0.005169034004211426, -0.004914045333862305, -0.004659056663513184, -0.0044040679931640625, -0.004149079322814941, -0.0038940906524658203, -0.0036391019821166992, -0.003384113311767578, -0.003129124641418457, -0.002874135971069336, -0.002619147300720215, -0.0023641586303710938, -0.0021091699600219727, -0.0018541812896728516, -0.0015991926193237305, -0.0013442039489746094, -0.0010892152786254883, -0.0008342266082763672, -0.0005792379379272461, -0.000324249267578125, -6.92605972290039e-05, 0.0001857280731201172, 0.0004407167434692383, 0.0006957054138183594, 0.0009506940841674805, 0.0012056827545166016, 0.0014606714248657227, 0.0017156600952148438, 0.001970648765563965, 0.002225637435913086, 0.002480626106262207, 0.002735614776611328, 0.0029906034469604492, 0.0032455921173095703, 0.0035005807876586914, 0.0037555694580078125, 0.004010558128356934, 0.004265546798706055, 0.004520535469055176, 0.004775524139404297, 0.005030512809753418, 0.005285501480102539, 0.00554049015045166, 0.005795478820800781, 0.006050467491149902, 0.0063054561614990234, 0.0065604448318481445, 0.006815433502197266, 0.007070422172546387, 0.007325410842895508, 0.007580399513244629, 0.00783538818359375]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 11.0, 59.0, 313.0, 479.0, 140.0, 13.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006493672262877226, -0.0006214406457729638, -0.0005935140652582049, -0.0005655874847434461, -0.0005376609042286873, -0.0005097342655062675, -0.0004818077140953392, -0.0004538811044767499, -0.00042595452396199107, -0.00039802794344723225, -0.0003701013629324734, -0.0003421747824177146, -0.0003142481727991253, -0.0002863215922843665, -0.00025839501176960766, -0.0002304684167029336, -0.00020254185074009, -0.0001746152702253312, -0.00014668867515865713, -0.00011876209464389831, -9.083550685318187e-05, -6.290891906246543e-05, -3.4982338547706604e-05, -7.05574348103255e-06, 2.0870837033726275e-05, 4.8797424824442714e-05, 7.672401261515915e-05, 0.00010465059312991798, 0.0001325771736446768, 0.00016050376871135086, 0.00018843034922610968, 0.00021635694429278374, 0.00024428352480754256, 0.0002722101053223014, 0.0003001366858370602, 0.00032806326635181904, 0.0003559898759704083, 0.00038391645648516715, 0.00041184303699992597, 0.00043976964661851525, 0.0004676962271332741, 0.0004956228076480329, 0.0005235493881627917, 0.0005514759686775506, 0.0005794025491923094, 0.0006073291879147291, 0.000635255710221827, 0.0006631823489442468, 0.0006911088712513447, 0.0007190354517661035, 0.0007469620322808623, 0.0007748886127956212, 0.00080281519331038, 0.0008307418320327997, 0.0008586683543398976, 0.0008865949930623174, 0.0009145215735770762, 0.000942448154091835, 0.0009703747346065938, 0.0009983013151213527, 0.0010262279538437724, 0.0010541544761508703, 0.00108208111487329, 0.001110007637180388, 0.0011379342759028077]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 10.0, 1.0, 11.0, 8.0, 17.0, 11.0, 10.0, 16.0, 19.0, 18.0, 34.0, 27.0, 37.0, 46.0, 33.0, 28.0, 33.0, 32.0, 46.0, 49.0, 39.0, 43.0, 41.0, 57.0, 43.0, 40.0, 34.0, 26.0, 33.0, 25.0, 25.0, 27.0, 17.0, 9.0, 15.0, 19.0, 6.0, 2.0, 6.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016677379608154297, -0.00016130134463310242, -0.00015582889318466187, -0.0001503564417362213, -0.00014488399028778076, -0.0001394115388393402, -0.00013393908739089966, -0.0001284666359424591, -0.00012299418449401855, -0.000117521733045578, -0.00011204928159713745, -0.0001065768301486969, -0.00010110437870025635, -9.56319272518158e-05, -9.015947580337524e-05, -8.468702435493469e-05, -7.921457290649414e-05, -7.374212145805359e-05, -6.826967000961304e-05, -6.279721856117249e-05, -5.7324767112731934e-05, -5.185231566429138e-05, -4.637986421585083e-05, -4.090741276741028e-05, -3.5434961318969727e-05, -2.9962509870529175e-05, -2.4490058422088623e-05, -1.901760697364807e-05, -1.354515552520752e-05, -8.072704076766968e-06, -2.600252628326416e-06, 2.8721988201141357e-06, 8.344650268554688e-06, 1.381710171699524e-05, 1.928955316543579e-05, 2.4762004613876343e-05, 3.0234456062316895e-05, 3.5706907510757446e-05, 4.1179358959198e-05, 4.665181040763855e-05, 5.21242618560791e-05, 5.759671330451965e-05, 6.30691647529602e-05, 6.854161620140076e-05, 7.401406764984131e-05, 7.948651909828186e-05, 8.495897054672241e-05, 9.043142199516296e-05, 9.590387344360352e-05, 0.00010137632489204407, 0.00010684877634048462, 0.00011232122778892517, 0.00011779367923736572, 0.00012326613068580627, 0.00012873858213424683, 0.00013421103358268738, 0.00013968348503112793, 0.00014515593647956848, 0.00015062838792800903, 0.00015610083937644958, 0.00016157329082489014, 0.0001670457422733307, 0.00017251819372177124, 0.0001779906451702118, 0.00018346309661865234]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 6.0, 10.0, 9.0, 10.0, 15.0, 22.0, 15.0, 25.0, 22.0, 34.0, 35.0, 29.0, 35.0, 37.0, 41.0, 43.0, 49.0, 42.0, 51.0, 39.0, 52.0, 37.0, 43.0, 42.0, 36.0, 29.0, 33.0, 24.0, 18.0, 32.0, 21.0, 14.0, 10.0, 6.0, 10.0, 5.0, 5.0, 4.0, 6.0, 2.0, 0.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.11328125, -3.019744873046875, -2.92620849609375, -2.832672119140625, -2.7391357421875, -2.645599365234375, -2.55206298828125, -2.458526611328125, -2.364990234375, -2.271453857421875, -2.17791748046875, -2.084381103515625, -1.9908447265625, -1.897308349609375, -1.80377197265625, -1.710235595703125, -1.61669921875, -1.523162841796875, -1.42962646484375, -1.336090087890625, -1.2425537109375, -1.149017333984375, -1.05548095703125, -0.961944580078125, -0.868408203125, -0.774871826171875, -0.68133544921875, -0.587799072265625, -0.4942626953125, -0.400726318359375, -0.30718994140625, -0.213653564453125, -0.1201171875, -0.026580810546875, 0.06695556640625, 0.160491943359375, 0.2540283203125, 0.347564697265625, 0.44110107421875, 0.534637451171875, 0.628173828125, 0.721710205078125, 0.81524658203125, 0.908782958984375, 1.0023193359375, 1.095855712890625, 1.18939208984375, 1.282928466796875, 1.37646484375, 1.470001220703125, 1.56353759765625, 1.657073974609375, 1.7506103515625, 1.844146728515625, 1.93768310546875, 2.031219482421875, 2.124755859375, 2.218292236328125, 2.31182861328125, 2.405364990234375, 2.4989013671875, 2.592437744140625, 2.68597412109375, 2.779510498046875, 2.873046875]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 1.0, 5.0, 9.0, 9.0, 19.0, 30.0, 36.0, 37.0, 83.0, 102.0, 153.0, 229.0, 356.0, 606.0, 1353.0, 3057.0, 7094.0, 18274.0, 50284.0, 139139.0, 355003.0, 293246.0, 112702.0, 40715.0, 14908.0, 5818.0, 2512.0, 1188.0, 601.0, 361.0, 184.0, 163.0, 76.0, 64.0, 27.0, 34.0, 16.0, 22.0, 7.0, 8.0, 6.0, 6.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.41015625, -3.306488037109375, -3.20281982421875, -3.099151611328125, -2.9954833984375, -2.891815185546875, -2.78814697265625, -2.684478759765625, -2.580810546875, -2.477142333984375, -2.37347412109375, -2.269805908203125, -2.1661376953125, -2.062469482421875, -1.95880126953125, -1.855133056640625, -1.75146484375, -1.647796630859375, -1.54412841796875, -1.440460205078125, -1.3367919921875, -1.233123779296875, -1.12945556640625, -1.025787353515625, -0.922119140625, -0.818450927734375, -0.71478271484375, -0.611114501953125, -0.5074462890625, -0.403778076171875, -0.30010986328125, -0.196441650390625, -0.0927734375, 0.010894775390625, 0.11456298828125, 0.218231201171875, 0.3218994140625, 0.425567626953125, 0.52923583984375, 0.632904052734375, 0.736572265625, 0.840240478515625, 0.94390869140625, 1.047576904296875, 1.1512451171875, 1.254913330078125, 1.35858154296875, 1.462249755859375, 1.56591796875, 1.669586181640625, 1.77325439453125, 1.876922607421875, 1.9805908203125, 2.084259033203125, 2.18792724609375, 2.291595458984375, 2.395263671875, 2.498931884765625, 2.60260009765625, 2.706268310546875, 2.8099365234375, 2.913604736328125, 3.01727294921875, 3.120941162109375, 3.224609375]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 7.0, 8.0, 6.0, 13.0, 15.0, 17.0, 25.0, 26.0, 23.0, 31.0, 23.0, 46.0, 52.0, 64.0, 70.0, 137.0, 263.0, 1521.0, 229.0, 93.0, 62.0, 53.0, 46.0, 32.0, 27.0, 31.0, 16.0, 27.0, 19.0, 17.0, 8.0, 6.0, 11.0, 8.0, 8.0, 5.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.40625, -10.0521240234375, -9.697998046875, -9.3438720703125, -8.98974609375, -8.6356201171875, -8.281494140625, -7.9273681640625, -7.5732421875, -7.2191162109375, -6.864990234375, -6.5108642578125, -6.15673828125, -5.8026123046875, -5.448486328125, -5.0943603515625, -4.740234375, -4.3861083984375, -4.031982421875, -3.6778564453125, -3.32373046875, -2.9696044921875, -2.615478515625, -2.2613525390625, -1.9072265625, -1.5531005859375, -1.198974609375, -0.8448486328125, -0.49072265625, -0.1365966796875, 0.217529296875, 0.5716552734375, 0.92578125, 1.2799072265625, 1.634033203125, 1.9881591796875, 2.34228515625, 2.6964111328125, 3.050537109375, 3.4046630859375, 3.7587890625, 4.1129150390625, 4.467041015625, 4.8211669921875, 5.17529296875, 5.5294189453125, 5.883544921875, 6.2376708984375, 6.591796875, 6.9459228515625, 7.300048828125, 7.6541748046875, 8.00830078125, 8.3624267578125, 8.716552734375, 9.0706787109375, 9.4248046875, 9.7789306640625, 10.133056640625, 10.4871826171875, 10.84130859375, 11.1954345703125, 11.549560546875, 11.9036865234375, 12.2578125]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 3.0, 4.0, 10.0, 3.0, 3.0, 12.0, 14.0, 15.0, 17.0, 21.0, 28.0, 36.0, 56.0, 59.0, 91.0, 151.0, 241.0, 417.0, 1152.0, 19126.0, 3115308.0, 6910.0, 903.0, 371.0, 220.0, 159.0, 104.0, 69.0, 41.0, 33.0, 21.0, 20.0, 15.0, 12.0, 11.0, 8.0, 7.0, 9.0, 6.0, 3.0, 8.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-42.0, -40.70361328125, -39.4072265625, -38.11083984375, -36.814453125, -35.51806640625, -34.2216796875, -32.92529296875, -31.62890625, -30.33251953125, -29.0361328125, -27.73974609375, -26.443359375, -25.14697265625, -23.8505859375, -22.55419921875, -21.2578125, -19.96142578125, -18.6650390625, -17.36865234375, -16.072265625, -14.77587890625, -13.4794921875, -12.18310546875, -10.88671875, -9.59033203125, -8.2939453125, -6.99755859375, -5.701171875, -4.40478515625, -3.1083984375, -1.81201171875, -0.515625, 0.78076171875, 2.0771484375, 3.37353515625, 4.669921875, 5.96630859375, 7.2626953125, 8.55908203125, 9.85546875, 11.15185546875, 12.4482421875, 13.74462890625, 15.041015625, 16.33740234375, 17.6337890625, 18.93017578125, 20.2265625, 21.52294921875, 22.8193359375, 24.11572265625, 25.412109375, 26.70849609375, 28.0048828125, 29.30126953125, 30.59765625, 31.89404296875, 33.1904296875, 34.48681640625, 35.783203125, 37.07958984375, 38.3759765625, 39.67236328125, 40.96875]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 6.0, 13.0, 41.0, 118.0, 208.0, 242.0, 190.0, 123.0, 48.0, 17.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.137881755828857, -6.310557842254639, -5.48323392868042, -4.655909538269043, -3.8285858631134033, -3.0012617111206055, -2.1739377975463867, -1.346613883972168, -0.5192899703979492, 0.3080340027809143, 1.1353579759597778, 1.9626820087432861, 2.790005922317505, 3.6173300743103027, 4.4446539878845215, 5.27197790145874, 6.099301815032959, 6.926625728607178, 7.7539496421813965, 8.581274032592773, 9.408597946166992, 10.235921859741211, 11.06324577331543, 11.890569686889648, 12.717893600463867, 13.545217514038086, 14.372541427612305, 15.199865341186523, 16.027189254760742, 16.85451316833496, 17.68183708190918, 18.5091609954834, 19.336484909057617, 20.163808822631836, 20.991132736206055, 21.818456649780273, 22.645780563354492, 23.47310447692871, 24.30042839050293, 25.12775230407715, 25.955076217651367, 26.782400131225586, 27.609724044799805, 28.437047958374023, 29.264371871948242, 30.09169578552246, 30.91901969909668, 31.7463436126709, 32.57366943359375, 33.40099334716797, 34.22831726074219, 35.055641174316406, 35.882965087890625, 36.710289001464844, 37.53761291503906, 38.36493682861328, 39.1922607421875, 40.01958465576172, 40.84690856933594, 41.674232482910156, 42.501556396484375, 43.328880310058594, 44.15620422363281, 44.98352813720703, 45.81085205078125]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 7.0, 6.0, 5.0, 7.0, 8.0, 13.0, 13.0, 22.0, 15.0, 13.0, 19.0, 29.0, 21.0, 33.0, 43.0, 41.0, 36.0, 23.0, 45.0, 46.0, 34.0, 46.0, 44.0, 41.0, 46.0, 23.0, 39.0, 42.0, 32.0, 28.0, 20.0, 37.0, 17.0, 13.0, 28.0, 13.0, 8.0, 6.0, 10.0, 5.0, 8.0, 7.0, 3.0, 0.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-27.100921630859375, -26.310359954833984, -25.51979637145996, -24.72923469543457, -23.93867301940918, -23.148109436035156, -22.357547760009766, -21.566986083984375, -20.776424407958984, -19.985862731933594, -19.19529914855957, -18.40473747253418, -17.61417579650879, -16.823612213134766, -16.033050537109375, -15.242488861083984, -14.451925277709961, -13.661362648010254, -12.870800971984863, -12.080238342285156, -11.289676666259766, -10.499114036560059, -9.708551406860352, -8.917989730834961, -8.127427101135254, -7.336864948272705, -6.546302795410156, -5.755740165710449, -4.9651780128479, -4.174615859985352, -3.3840532302856445, -2.5934910774230957, -1.8029308319091797, -1.0123685598373413, -0.22180628776550293, 0.568756103515625, 1.3593182563781738, 2.1498804092407227, 2.9404430389404297, 3.7310051918029785, 4.521567344665527, 5.312129497528076, 6.102691650390625, 6.893254280090332, 7.683816432952881, 8.47437858581543, 9.264941215515137, 10.055503845214844, 10.846065521240234, 11.636628150939941, 12.427189826965332, 13.217752456665039, 14.00831413269043, 14.798876762390137, 15.589439392089844, 16.380001068115234, 17.170562744140625, 17.961124420166016, 18.75168800354004, 19.54224967956543, 20.33281135559082, 21.123374938964844, 21.913936614990234, 22.704498291015625, 23.49506187438965]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 6.0, 3.0, 6.0, 7.0, 5.0, 6.0, 3.0, 12.0, 13.0, 13.0, 11.0, 28.0, 12.0, 22.0, 25.0, 22.0, 31.0, 37.0, 41.0, 40.0, 35.0, 35.0, 43.0, 39.0, 41.0, 31.0, 28.0, 37.0, 28.0, 46.0, 44.0, 39.0, 27.0, 23.0, 24.0, 16.0, 21.0, 23.0, 12.0, 16.0, 12.0, 12.0, 6.0, 8.0, 4.0, 6.0, 2.0, 2.0, 6.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0], "bins": [-3.123046875, -3.029815673828125, -2.93658447265625, -2.843353271484375, -2.7501220703125, -2.656890869140625, -2.56365966796875, -2.470428466796875, -2.377197265625, -2.283966064453125, -2.19073486328125, -2.097503662109375, -2.0042724609375, -1.911041259765625, -1.81781005859375, -1.724578857421875, -1.63134765625, -1.538116455078125, -1.44488525390625, -1.351654052734375, -1.2584228515625, -1.165191650390625, -1.07196044921875, -0.978729248046875, -0.885498046875, -0.792266845703125, -0.69903564453125, -0.605804443359375, -0.5125732421875, -0.419342041015625, -0.32611083984375, -0.232879638671875, -0.1396484375, -0.046417236328125, 0.04681396484375, 0.140045166015625, 0.2332763671875, 0.326507568359375, 0.41973876953125, 0.512969970703125, 0.606201171875, 0.699432373046875, 0.79266357421875, 0.885894775390625, 0.9791259765625, 1.072357177734375, 1.16558837890625, 1.258819580078125, 1.35205078125, 1.445281982421875, 1.53851318359375, 1.631744384765625, 1.7249755859375, 1.818206787109375, 1.91143798828125, 2.004669189453125, 2.097900390625, 2.191131591796875, 2.28436279296875, 2.377593994140625, 2.4708251953125, 2.564056396484375, 2.65728759765625, 2.750518798828125, 2.84375]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 7.0, 5.0, 8.0, 8.0, 7.0, 4.0, 7.0, 18.0, 23.0, 21.0, 29.0, 21.0, 36.0, 51.0, 58.0, 106.0, 170.0, 255.0, 532.0, 1443.0, 8758.0, 139346.0, 1511165.0, 2182001.0, 326525.0, 19234.0, 2549.0, 783.0, 380.0, 214.0, 149.0, 88.0, 65.0, 52.0, 40.0, 23.0, 12.0, 15.0, 12.0, 14.0, 13.0, 8.0, 11.0, 3.0, 3.0, 6.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 3.0], "bins": [-7.28515625, -7.07183837890625, -6.8585205078125, -6.64520263671875, -6.431884765625, -6.21856689453125, -6.0052490234375, -5.79193115234375, -5.57861328125, -5.36529541015625, -5.1519775390625, -4.93865966796875, -4.725341796875, -4.51202392578125, -4.2987060546875, -4.08538818359375, -3.8720703125, -3.65875244140625, -3.4454345703125, -3.23211669921875, -3.018798828125, -2.80548095703125, -2.5921630859375, -2.37884521484375, -2.16552734375, -1.95220947265625, -1.7388916015625, -1.52557373046875, -1.312255859375, -1.09893798828125, -0.8856201171875, -0.67230224609375, -0.458984375, -0.24566650390625, -0.0323486328125, 0.18096923828125, 0.394287109375, 0.60760498046875, 0.8209228515625, 1.03424072265625, 1.24755859375, 1.46087646484375, 1.6741943359375, 1.88751220703125, 2.100830078125, 2.31414794921875, 2.5274658203125, 2.74078369140625, 2.9541015625, 3.16741943359375, 3.3807373046875, 3.59405517578125, 3.807373046875, 4.02069091796875, 4.2340087890625, 4.44732666015625, 4.66064453125, 4.87396240234375, 5.0872802734375, 5.30059814453125, 5.513916015625, 5.72723388671875, 5.9405517578125, 6.15386962890625, 6.3671875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 5.0, 9.0, 8.0, 24.0, 30.0, 39.0, 36.0, 57.0, 85.0, 115.0, 142.0, 226.0, 269.0, 348.0, 421.0, 443.0, 383.0, 369.0, 262.0, 207.0, 177.0, 114.0, 86.0, 57.0, 43.0, 39.0, 18.0, 16.0, 14.0, 8.0, 13.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3671875, -6.17108154296875, -5.9749755859375, -5.77886962890625, -5.582763671875, -5.38665771484375, -5.1905517578125, -4.99444580078125, -4.79833984375, -4.60223388671875, -4.4061279296875, -4.21002197265625, -4.013916015625, -3.81781005859375, -3.6217041015625, -3.42559814453125, -3.2294921875, -3.03338623046875, -2.8372802734375, -2.64117431640625, -2.445068359375, -2.24896240234375, -2.0528564453125, -1.85675048828125, -1.66064453125, -1.46453857421875, -1.2684326171875, -1.07232666015625, -0.876220703125, -0.68011474609375, -0.4840087890625, -0.28790283203125, -0.091796875, 0.10430908203125, 0.3004150390625, 0.49652099609375, 0.692626953125, 0.88873291015625, 1.0848388671875, 1.28094482421875, 1.47705078125, 1.67315673828125, 1.8692626953125, 2.06536865234375, 2.261474609375, 2.45758056640625, 2.6536865234375, 2.84979248046875, 3.0458984375, 3.24200439453125, 3.4381103515625, 3.63421630859375, 3.830322265625, 4.02642822265625, 4.2225341796875, 4.41864013671875, 4.61474609375, 4.81085205078125, 5.0069580078125, 5.20306396484375, 5.399169921875, 5.59527587890625, 5.7913818359375, 5.98748779296875, 6.18359375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 7.0, 7.0, 11.0, 12.0, 16.0, 21.0, 20.0, 44.0, 69.0, 74.0, 124.0, 127.0, 238.0, 297.0, 413.0, 866.0, 21210.0, 3509198.0, 656434.0, 3275.0, 536.0, 372.0, 268.0, 164.0, 140.0, 95.0, 54.0, 58.0, 47.0, 29.0, 25.0, 10.0, 10.0, 3.0, 1.0, 3.0, 5.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.015625, -21.34423828125, -20.6728515625, -20.00146484375, -19.330078125, -18.65869140625, -17.9873046875, -17.31591796875, -16.64453125, -15.97314453125, -15.3017578125, -14.63037109375, -13.958984375, -13.28759765625, -12.6162109375, -11.94482421875, -11.2734375, -10.60205078125, -9.9306640625, -9.25927734375, -8.587890625, -7.91650390625, -7.2451171875, -6.57373046875, -5.90234375, -5.23095703125, -4.5595703125, -3.88818359375, -3.216796875, -2.54541015625, -1.8740234375, -1.20263671875, -0.53125, 0.14013671875, 0.8115234375, 1.48291015625, 2.154296875, 2.82568359375, 3.4970703125, 4.16845703125, 4.83984375, 5.51123046875, 6.1826171875, 6.85400390625, 7.525390625, 8.19677734375, 8.8681640625, 9.53955078125, 10.2109375, 10.88232421875, 11.5537109375, 12.22509765625, 12.896484375, 13.56787109375, 14.2392578125, 14.91064453125, 15.58203125, 16.25341796875, 16.9248046875, 17.59619140625, 18.267578125, 18.93896484375, 19.6103515625, 20.28173828125, 20.953125]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 7.0, 7.0, 20.0, 31.0, 55.0, 58.0, 81.0, 90.0, 117.0, 104.0, 96.0, 96.0, 68.0, 52.0, 44.0, 32.0, 21.0, 15.0, 9.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.229339599609375, -29.47683334350586, -28.724327087402344, -27.971820831298828, -27.219314575195312, -26.466808319091797, -25.71430206298828, -24.961795806884766, -24.20928955078125, -23.456783294677734, -22.70427703857422, -21.951770782470703, -21.199264526367188, -20.446758270263672, -19.694252014160156, -18.94174575805664, -18.189241409301758, -17.436735153198242, -16.684228897094727, -15.931722640991211, -15.179216384887695, -14.42671012878418, -13.67420482635498, -12.921698570251465, -12.16919231414795, -11.416686058044434, -10.664179801940918, -9.911674499511719, -9.159168243408203, -8.406661987304688, -7.654155731201172, -6.901649475097656, -6.149145126342773, -5.396638870239258, -4.644132614135742, -3.8916268348693848, -3.139120578765869, -2.3866143226623535, -1.634108543395996, -0.8816022872924805, -0.12909603118896484, 0.6234101057052612, 1.3759162425994873, 2.128422260284424, 2.8809285163879395, 3.633434772491455, 4.3859405517578125, 5.138446807861328, 5.890953063964844, 6.643459320068359, 7.395965576171875, 8.14847183227539, 8.900978088378906, 9.653484344482422, 10.405989646911621, 11.158495903015137, 11.911002159118652, 12.663508415222168, 13.416014671325684, 14.168519973754883, 14.921026229858398, 15.673532485961914, 16.42603874206543, 17.178544998168945, 17.93105125427246]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 1.0, 6.0, 9.0, 8.0, 9.0, 14.0, 8.0, 32.0, 15.0, 21.0, 32.0, 17.0, 44.0, 29.0, 34.0, 43.0, 42.0, 49.0, 47.0, 39.0, 46.0, 50.0, 47.0, 55.0, 44.0, 36.0, 45.0, 30.0, 32.0, 19.0, 22.0, 18.0, 11.0, 12.0, 12.0, 11.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.076969146728516, -20.358362197875977, -19.639753341674805, -18.921146392822266, -18.202539443969727, -17.483930587768555, -16.765323638916016, -16.046714782714844, -15.328107833862305, -14.60949993133545, -13.89089298248291, -13.172285079956055, -12.4536771774292, -11.735069274902344, -11.016462326049805, -10.29785442352295, -9.57924747467041, -8.860639572143555, -8.142032623291016, -7.42342472076416, -6.704816818237305, -5.986209392547607, -5.26760196685791, -4.548994064331055, -3.8303866386413574, -3.111778974533081, -2.3931713104248047, -1.6745638847351074, -0.955956220626831, -0.2373485565185547, 0.4812588691711426, 1.199866771697998, 1.9184741973876953, 2.6370818614959717, 3.355689525604248, 4.074296951293945, 4.792904853820801, 5.511512279510498, 6.230119705200195, 6.948727607727051, 7.667335033416748, 8.385942459106445, 9.1045503616333, 9.823158264160156, 10.541765213012695, 11.26037311553955, 11.978981018066406, 12.697587966918945, 13.4161958694458, 14.134803771972656, 14.853410720825195, 15.57201862335205, 16.290626525878906, 17.009233474731445, 17.727840423583984, 18.446449279785156, 19.165056228637695, 19.883663177490234, 20.602272033691406, 21.320878982543945, 22.039485931396484, 22.758094787597656, 23.476701736450195, 24.195308685302734, 24.913917541503906]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 6.0, 6.0, 10.0, 11.0, 14.0, 14.0, 15.0, 27.0, 16.0, 16.0, 19.0, 34.0, 36.0, 24.0, 28.0, 44.0, 37.0, 45.0, 34.0, 37.0, 33.0, 43.0, 38.0, 39.0, 37.0, 38.0, 36.0, 29.0, 36.0, 29.0, 20.0, 16.0, 19.0, 18.0, 24.0, 17.0, 11.0, 7.0, 7.0, 14.0, 6.0, 3.0, 4.0, 1.0, 7.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.8515625, -2.76177978515625, -2.6719970703125, -2.58221435546875, -2.492431640625, -2.40264892578125, -2.3128662109375, -2.22308349609375, -2.13330078125, -2.04351806640625, -1.9537353515625, -1.86395263671875, -1.774169921875, -1.68438720703125, -1.5946044921875, -1.50482177734375, -1.4150390625, -1.32525634765625, -1.2354736328125, -1.14569091796875, -1.055908203125, -0.96612548828125, -0.8763427734375, -0.78656005859375, -0.69677734375, -0.60699462890625, -0.5172119140625, -0.42742919921875, -0.337646484375, -0.24786376953125, -0.1580810546875, -0.06829833984375, 0.021484375, 0.11126708984375, 0.2010498046875, 0.29083251953125, 0.380615234375, 0.47039794921875, 0.5601806640625, 0.64996337890625, 0.73974609375, 0.82952880859375, 0.9193115234375, 1.00909423828125, 1.098876953125, 1.18865966796875, 1.2784423828125, 1.36822509765625, 1.4580078125, 1.54779052734375, 1.6375732421875, 1.72735595703125, 1.817138671875, 1.90692138671875, 1.9967041015625, 2.08648681640625, 2.17626953125, 2.26605224609375, 2.3558349609375, 2.44561767578125, 2.535400390625, 2.62518310546875, 2.7149658203125, 2.80474853515625, 2.89453125]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 6.0, 2.0, 3.0, 7.0, 14.0, 16.0, 30.0, 44.0, 53.0, 98.0, 99.0, 148.0, 247.0, 402.0, 548.0, 801.0, 1231.0, 1728.0, 2577.0, 3838.0, 5766.0, 8419.0, 12789.0, 18863.0, 29283.0, 45331.0, 74132.0, 137112.0, 275459.0, 180946.0, 92373.0, 54390.0, 34463.0, 22068.0, 14924.0, 9909.0, 6700.0, 4504.0, 2926.0, 2073.0, 1419.0, 908.0, 581.0, 429.0, 307.0, 188.0, 119.0, 93.0, 72.0, 46.0, 29.0, 16.0, 18.0, 4.0, 10.0, 4.0, 6.0, 1.0, 1.0, 1.0], "bins": [-0.5205078125, -0.5045852661132812, -0.4886627197265625, -0.47274017333984375, -0.456817626953125, -0.44089508056640625, -0.4249725341796875, -0.40904998779296875, -0.39312744140625, -0.37720489501953125, -0.3612823486328125, -0.34535980224609375, -0.329437255859375, -0.31351470947265625, -0.2975921630859375, -0.28166961669921875, -0.2657470703125, -0.24982452392578125, -0.2339019775390625, -0.21797943115234375, -0.202056884765625, -0.18613433837890625, -0.1702117919921875, -0.15428924560546875, -0.13836669921875, -0.12244415283203125, -0.1065216064453125, -0.09059906005859375, -0.074676513671875, -0.05875396728515625, -0.0428314208984375, -0.02690887451171875, -0.010986328125, 0.00493621826171875, 0.0208587646484375, 0.03678131103515625, 0.052703857421875, 0.06862640380859375, 0.0845489501953125, 0.10047149658203125, 0.11639404296875, 0.13231658935546875, 0.1482391357421875, 0.16416168212890625, 0.180084228515625, 0.19600677490234375, 0.2119293212890625, 0.22785186767578125, 0.2437744140625, 0.25969696044921875, 0.2756195068359375, 0.29154205322265625, 0.307464599609375, 0.32338714599609375, 0.3393096923828125, 0.35523223876953125, 0.37115478515625, 0.38707733154296875, 0.4029998779296875, 0.41892242431640625, 0.434844970703125, 0.45076751708984375, 0.4666900634765625, 0.48261260986328125, 0.49853515625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 1.0, 5.0, 3.0, 3.0, 4.0, 8.0, 7.0, 10.0, 11.0, 7.0, 8.0, 13.0, 14.0, 17.0, 13.0, 14.0, 29.0, 27.0, 24.0, 29.0, 32.0, 41.0, 33.0, 47.0, 37.0, 37.0, 1062.0, 38.0, 37.0, 26.0, 37.0, 33.0, 26.0, 22.0, 27.0, 26.0, 33.0, 29.0, 31.0, 23.0, 16.0, 14.0, 12.0, 12.0, 14.0, 12.0, 5.0, 10.0, 3.0, 5.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0], "bins": [-1.935546875, -1.88006591796875, -1.8245849609375, -1.76910400390625, -1.713623046875, -1.65814208984375, -1.6026611328125, -1.54718017578125, -1.49169921875, -1.43621826171875, -1.3807373046875, -1.32525634765625, -1.269775390625, -1.21429443359375, -1.1588134765625, -1.10333251953125, -1.0478515625, -0.99237060546875, -0.9368896484375, -0.88140869140625, -0.825927734375, -0.77044677734375, -0.7149658203125, -0.65948486328125, -0.60400390625, -0.54852294921875, -0.4930419921875, -0.43756103515625, -0.382080078125, -0.32659912109375, -0.2711181640625, -0.21563720703125, -0.16015625, -0.10467529296875, -0.0491943359375, 0.00628662109375, 0.061767578125, 0.11724853515625, 0.1727294921875, 0.22821044921875, 0.28369140625, 0.33917236328125, 0.3946533203125, 0.45013427734375, 0.505615234375, 0.56109619140625, 0.6165771484375, 0.67205810546875, 0.7275390625, 0.78302001953125, 0.8385009765625, 0.89398193359375, 0.949462890625, 1.00494384765625, 1.0604248046875, 1.11590576171875, 1.17138671875, 1.22686767578125, 1.2823486328125, 1.33782958984375, 1.393310546875, 1.44879150390625, 1.5042724609375, 1.55975341796875, 1.615234375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 6.0, 4.0, 10.0, 24.0, 24.0, 44.0, 40.0, 85.0, 143.0, 154.0, 252.0, 356.0, 612.0, 849.0, 1191.0, 1718.0, 2544.0, 3881.0, 5571.0, 8686.0, 13032.0, 20271.0, 31704.0, 51076.0, 87654.0, 173704.0, 1342331.0, 146130.0, 77403.0, 45662.0, 27971.0, 18045.0, 11778.0, 7834.0, 5150.0, 3529.0, 2454.0, 1694.0, 1125.0, 784.0, 521.0, 382.0, 211.0, 183.0, 117.0, 75.0, 44.0, 25.0, 21.0, 15.0, 7.0, 10.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.54052734375, -0.5243377685546875, -0.508148193359375, -0.4919586181640625, -0.47576904296875, -0.4595794677734375, -0.443389892578125, -0.4272003173828125, -0.4110107421875, -0.3948211669921875, -0.378631591796875, -0.3624420166015625, -0.34625244140625, -0.3300628662109375, -0.313873291015625, -0.2976837158203125, -0.281494140625, -0.2653045654296875, -0.249114990234375, -0.2329254150390625, -0.21673583984375, -0.2005462646484375, -0.184356689453125, -0.1681671142578125, -0.1519775390625, -0.1357879638671875, -0.119598388671875, -0.1034088134765625, -0.08721923828125, -0.0710296630859375, -0.054840087890625, -0.0386505126953125, -0.0224609375, -0.0062713623046875, 0.009918212890625, 0.0261077880859375, 0.04229736328125, 0.0584869384765625, 0.074676513671875, 0.0908660888671875, 0.1070556640625, 0.1232452392578125, 0.139434814453125, 0.1556243896484375, 0.17181396484375, 0.1880035400390625, 0.204193115234375, 0.2203826904296875, 0.236572265625, 0.2527618408203125, 0.268951416015625, 0.2851409912109375, 0.30133056640625, 0.3175201416015625, 0.333709716796875, 0.3498992919921875, 0.3660888671875, 0.3822784423828125, 0.398468017578125, 0.4146575927734375, 0.43084716796875, 0.4470367431640625, 0.463226318359375, 0.4794158935546875, 0.49560546875]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 5.0, 5.0, 3.0, 10.0, 12.0, 10.0, 20.0, 14.0, 23.0, 22.0, 33.0, 26.0, 30.0, 58.0, 60.0, 67.0, 66.0, 75.0, 69.0, 65.0, 51.0, 41.0, 49.0, 30.0, 23.0, 21.0, 19.0, 18.0, 13.0, 7.0, 12.0, 6.0, 4.0, 4.0, 4.0, 7.0, 3.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00037384033203125, -0.00036083534359931946, -0.0003478303551673889, -0.0003348253667354584, -0.00032182037830352783, -0.0003088153898715973, -0.00029581040143966675, -0.0002828054130077362, -0.00026980042457580566, -0.0002567954361438751, -0.00024379044771194458, -0.00023078545928001404, -0.0002177804708480835, -0.00020477548241615295, -0.0001917704939842224, -0.00017876550555229187, -0.00016576051712036133, -0.00015275552868843079, -0.00013975054025650024, -0.0001267455518245697, -0.00011374056339263916, -0.00010073557496070862, -8.773058652877808e-05, -7.472559809684753e-05, -6.172060966491699e-05, -4.871562123298645e-05, -3.571063280105591e-05, -2.2705644369125366e-05, -9.700655937194824e-06, 3.3043324947357178e-06, 1.630932092666626e-05, 2.9314309358596802e-05, 4.2319297790527344e-05, 5.5324286222457886e-05, 6.832927465438843e-05, 8.133426308631897e-05, 9.433925151824951e-05, 0.00010734423995018005, 0.0001203492283821106, 0.00013335421681404114, 0.00014635920524597168, 0.00015936419367790222, 0.00017236918210983276, 0.0001853741705417633, 0.00019837915897369385, 0.0002113841474056244, 0.00022438913583755493, 0.00023739412426948547, 0.000250399112701416, 0.00026340410113334656, 0.0002764090895652771, 0.00028941407799720764, 0.0003024190664291382, 0.0003154240548610687, 0.00032842904329299927, 0.0003414340317249298, 0.00035443902015686035, 0.0003674440085887909, 0.00038044899702072144, 0.000393453985452652, 0.0004064589738845825, 0.00041946396231651306, 0.0004324689507484436, 0.00044547393918037415, 0.0004584789276123047]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 4.0, 4.0, 4.0, 6.0, 4.0, 8.0, 8.0, 9.0, 13.0, 18.0, 15.0, 21.0, 26.0, 29.0, 37.0, 62.0, 83.0, 135.0, 216.0, 405.0, 950.0, 131347.0, 912327.0, 1452.0, 549.0, 251.0, 159.0, 80.0, 73.0, 56.0, 55.0, 27.0, 24.0, 23.0, 16.0, 16.0, 12.0, 10.0, 4.0, 6.0, 5.0, 4.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00946807861328125, -0.009198606014251709, -0.008929133415222168, -0.008659660816192627, -0.008390188217163086, -0.008120715618133545, -0.007851243019104004, -0.007581770420074463, -0.007312297821044922, -0.007042825222015381, -0.00677335262298584, -0.006503880023956299, -0.006234407424926758, -0.005964934825897217, -0.005695462226867676, -0.005425989627838135, -0.005156517028808594, -0.004887044429779053, -0.004617571830749512, -0.004348099231719971, -0.00407862663269043, -0.0038091540336608887, -0.0035396814346313477, -0.0032702088356018066, -0.0030007362365722656, -0.0027312636375427246, -0.0024617910385131836, -0.0021923184394836426, -0.0019228458404541016, -0.0016533732414245605, -0.0013839006423950195, -0.0011144280433654785, -0.0008449554443359375, -0.0005754828453063965, -0.00030601024627685547, -3.653764724731445e-05, 0.00023293495178222656, 0.0005024075508117676, 0.0007718801498413086, 0.0010413527488708496, 0.0013108253479003906, 0.0015802979469299316, 0.0018497705459594727, 0.0021192431449890137, 0.0023887157440185547, 0.0026581883430480957, 0.0029276609420776367, 0.0031971335411071777, 0.0034666061401367188, 0.0037360787391662598, 0.004005551338195801, 0.004275023937225342, 0.004544496536254883, 0.004813969135284424, 0.005083441734313965, 0.005352914333343506, 0.005622386932373047, 0.005891859531402588, 0.006161332130432129, 0.00643080472946167, 0.006700277328491211, 0.006969749927520752, 0.007239222526550293, 0.007508695125579834, 0.007778167724609375]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 54.0, 660.0, 297.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010406688088551164, -0.0009949058294296265, -0.0009491429664194584, -0.0009033800452016294, -0.0008576171239838004, -0.0008118542027659714, -0.0007660912815481424, -0.0007203283603303134, -0.0006745654391124845, -0.0006288025178946555, -0.0005830395966768265, -0.0005372766754589975, -0.0004915137542411685, -0.0004457508330233395, -0.0003999879118055105, -0.00035422499058768153, -0.00030846206936985254, -0.00026269914815202355, -0.00021693622693419456, -0.00017117330571636558, -0.0001254103844985366, -7.96474632807076e-05, -3.388454206287861e-05, 1.187837915495038e-05, 5.764130037277937e-05, 0.00010340422159060836, 0.00014916714280843735, 0.00019493006402626634, 0.00024069298524409533, 0.0002864559064619243, 0.0003322188276797533, 0.0003779817488975823, 0.0004237447865307331, 0.0004695077077485621, 0.0005152706289663911, 0.0005610335501842201, 0.0006067964714020491, 0.000652559392619878, 0.000698322313837707, 0.000744085235055536, 0.000789848156273365, 0.000835611077491194, 0.000881373998709023, 0.000927136919926852, 0.000972899841144681, 0.001018662704154849, 0.001064425683580339, 0.0011101886630058289, 0.001155951526015997, 0.001201714389026165, 0.001247477368451655, 0.0012932403478771448, 0.0013390032108873129, 0.001384766073897481, 0.0014305290533229709, 0.0014762920327484608, 0.0015220548957586288, 0.001567817758768797, 0.0016135807381942868, 0.0016593437176197767, 0.0017051065806299448, 0.0017508694436401129, 0.0017966324230656028, 0.0018423954024910927, 0.0018881582655012608]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 3.0, 1.0, 9.0, 4.0, 5.0, 12.0, 14.0, 15.0, 21.0, 17.0, 20.0, 22.0, 24.0, 20.0, 36.0, 39.0, 36.0, 27.0, 29.0, 31.0, 31.0, 36.0, 33.0, 45.0, 41.0, 41.0, 30.0, 26.0, 32.0, 33.0, 32.0, 28.0, 19.0, 23.0, 24.0, 14.0, 21.0, 15.0, 12.0, 15.0, 15.0, 4.0, 10.0, 5.0, 5.0, 3.0, 4.0, 6.0, 1.0, 3.0, 2.0, 5.0, 3.0], "bins": [-0.0001995563507080078, -0.00019373930990695953, -0.00018792226910591125, -0.00018210522830486298, -0.0001762881875038147, -0.00017047114670276642, -0.00016465410590171814, -0.00015883706510066986, -0.00015302002429962158, -0.0001472029834985733, -0.00014138594269752502, -0.00013556890189647675, -0.00012975186109542847, -0.0001239348202943802, -0.00011811777949333191, -0.00011230073869228363, -0.00010648369789123535, -0.00010066665709018707, -9.48496162891388e-05, -8.903257548809052e-05, -8.321553468704224e-05, -7.739849388599396e-05, -7.158145308494568e-05, -6.57644122838974e-05, -5.994737148284912e-05, -5.413033068180084e-05, -4.8313289880752563e-05, -4.2496249079704285e-05, -3.6679208278656006e-05, -3.086216747760773e-05, -2.5045126676559448e-05, -1.922808587551117e-05, -1.341104507446289e-05, -7.594004273414612e-06, -1.776963472366333e-06, 4.040077328681946e-06, 9.857118129730225e-06, 1.5674158930778503e-05, 2.1491199731826782e-05, 2.730824053287506e-05, 3.312528133392334e-05, 3.894232213497162e-05, 4.47593629360199e-05, 5.0576403737068176e-05, 5.6393444538116455e-05, 6.221048533916473e-05, 6.802752614021301e-05, 7.384456694126129e-05, 7.966160774230957e-05, 8.547864854335785e-05, 9.129568934440613e-05, 9.71127301454544e-05, 0.00010292977094650269, 0.00010874681174755096, 0.00011456385254859924, 0.00012038089334964752, 0.0001261979341506958, 0.00013201497495174408, 0.00013783201575279236, 0.00014364905655384064, 0.00014946609735488892, 0.0001552831381559372, 0.00016110017895698547, 0.00016691721975803375, 0.00017273426055908203]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 6.0, 6.0, 10.0, 11.0, 14.0, 14.0, 15.0, 27.0, 16.0, 16.0, 19.0, 34.0, 36.0, 24.0, 28.0, 44.0, 38.0, 44.0, 34.0, 37.0, 33.0, 42.0, 39.0, 39.0, 37.0, 38.0, 36.0, 29.0, 36.0, 29.0, 20.0, 16.0, 19.0, 18.0, 24.0, 17.0, 11.0, 7.0, 7.0, 14.0, 6.0, 3.0, 4.0, 1.0, 7.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.8515625, -2.76177978515625, -2.6719970703125, -2.58221435546875, -2.492431640625, -2.40264892578125, -2.3128662109375, -2.22308349609375, -2.13330078125, -2.04351806640625, -1.9537353515625, -1.86395263671875, -1.774169921875, -1.68438720703125, -1.5946044921875, -1.50482177734375, -1.4150390625, -1.32525634765625, -1.2354736328125, -1.14569091796875, -1.055908203125, -0.96612548828125, -0.8763427734375, -0.78656005859375, -0.69677734375, -0.60699462890625, -0.5172119140625, -0.42742919921875, -0.337646484375, -0.24786376953125, -0.1580810546875, -0.06829833984375, 0.021484375, 0.11126708984375, 0.2010498046875, 0.29083251953125, 0.380615234375, 0.47039794921875, 0.5601806640625, 0.64996337890625, 0.73974609375, 0.82952880859375, 0.9193115234375, 1.00909423828125, 1.098876953125, 1.18865966796875, 1.2784423828125, 1.36822509765625, 1.4580078125, 1.54779052734375, 1.6375732421875, 1.72735595703125, 1.817138671875, 1.90692138671875, 1.9967041015625, 2.08648681640625, 2.17626953125, 2.26605224609375, 2.3558349609375, 2.44561767578125, 2.535400390625, 2.62518310546875, 2.7149658203125, 2.80474853515625, 2.89453125]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 7.0, 1.0, 9.0, 14.0, 13.0, 24.0, 24.0, 47.0, 51.0, 67.0, 103.0, 102.0, 177.0, 245.0, 401.0, 705.0, 1328.0, 2677.0, 5535.0, 13060.0, 30777.0, 74208.0, 171382.0, 373984.0, 212173.0, 92397.0, 38601.0, 16359.0, 7071.0, 3228.0, 1583.0, 815.0, 423.0, 269.0, 170.0, 119.0, 115.0, 82.0, 58.0, 37.0, 31.0, 21.0, 22.0, 11.0, 7.0, 9.0, 6.0, 8.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.751953125, -2.664947509765625, -2.57794189453125, -2.490936279296875, -2.4039306640625, -2.316925048828125, -2.22991943359375, -2.142913818359375, -2.055908203125, -1.968902587890625, -1.88189697265625, -1.794891357421875, -1.7078857421875, -1.620880126953125, -1.53387451171875, -1.446868896484375, -1.35986328125, -1.272857666015625, -1.18585205078125, -1.098846435546875, -1.0118408203125, -0.924835205078125, -0.83782958984375, -0.750823974609375, -0.663818359375, -0.576812744140625, -0.48980712890625, -0.402801513671875, -0.3157958984375, -0.228790283203125, -0.14178466796875, -0.054779052734375, 0.0322265625, 0.119232177734375, 0.20623779296875, 0.293243408203125, 0.3802490234375, 0.467254638671875, 0.55426025390625, 0.641265869140625, 0.728271484375, 0.815277099609375, 0.90228271484375, 0.989288330078125, 1.0762939453125, 1.163299560546875, 1.25030517578125, 1.337310791015625, 1.42431640625, 1.511322021484375, 1.59832763671875, 1.685333251953125, 1.7723388671875, 1.859344482421875, 1.94635009765625, 2.033355712890625, 2.120361328125, 2.207366943359375, 2.29437255859375, 2.381378173828125, 2.4683837890625, 2.555389404296875, 2.64239501953125, 2.729400634765625, 2.81640625]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 5.0, 5.0, 4.0, 7.0, 3.0, 10.0, 7.0, 8.0, 13.0, 12.0, 16.0, 15.0, 21.0, 29.0, 18.0, 32.0, 35.0, 38.0, 44.0, 43.0, 56.0, 99.0, 234.0, 1512.0, 283.0, 76.0, 60.0, 53.0, 40.0, 27.0, 25.0, 37.0, 27.0, 22.0, 25.0, 23.0, 14.0, 11.0, 9.0, 15.0, 7.0, 10.0, 3.0, 5.0, 4.0, 5.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-10.3671875, -10.028076171875, -9.68896484375, -9.349853515625, -9.0107421875, -8.671630859375, -8.33251953125, -7.993408203125, -7.654296875, -7.315185546875, -6.97607421875, -6.636962890625, -6.2978515625, -5.958740234375, -5.61962890625, -5.280517578125, -4.94140625, -4.602294921875, -4.26318359375, -3.924072265625, -3.5849609375, -3.245849609375, -2.90673828125, -2.567626953125, -2.228515625, -1.889404296875, -1.55029296875, -1.211181640625, -0.8720703125, -0.532958984375, -0.19384765625, 0.145263671875, 0.484375, 0.823486328125, 1.16259765625, 1.501708984375, 1.8408203125, 2.179931640625, 2.51904296875, 2.858154296875, 3.197265625, 3.536376953125, 3.87548828125, 4.214599609375, 4.5537109375, 4.892822265625, 5.23193359375, 5.571044921875, 5.91015625, 6.249267578125, 6.58837890625, 6.927490234375, 7.2666015625, 7.605712890625, 7.94482421875, 8.283935546875, 8.623046875, 8.962158203125, 9.30126953125, 9.640380859375, 9.9794921875, 10.318603515625, 10.65771484375, 10.996826171875, 11.3359375]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 5.0, 3.0, 4.0, 15.0, 12.0, 16.0, 25.0, 33.0, 49.0, 74.0, 124.0, 179.0, 381.0, 1402.0, 1727101.0, 1413984.0, 1332.0, 403.0, 204.0, 104.0, 80.0, 48.0, 41.0, 33.0, 19.0, 11.0, 8.0, 8.0, 4.0, 1.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-71.5, -69.5673828125, -67.634765625, -65.7021484375, -63.76953125, -61.8369140625, -59.904296875, -57.9716796875, -56.0390625, -54.1064453125, -52.173828125, -50.2412109375, -48.30859375, -46.3759765625, -44.443359375, -42.5107421875, -40.578125, -38.6455078125, -36.712890625, -34.7802734375, -32.84765625, -30.9150390625, -28.982421875, -27.0498046875, -25.1171875, -23.1845703125, -21.251953125, -19.3193359375, -17.38671875, -15.4541015625, -13.521484375, -11.5888671875, -9.65625, -7.7236328125, -5.791015625, -3.8583984375, -1.92578125, 0.0068359375, 1.939453125, 3.8720703125, 5.8046875, 7.7373046875, 9.669921875, 11.6025390625, 13.53515625, 15.4677734375, 17.400390625, 19.3330078125, 21.265625, 23.1982421875, 25.130859375, 27.0634765625, 28.99609375, 30.9287109375, 32.861328125, 34.7939453125, 36.7265625, 38.6591796875, 40.591796875, 42.5244140625, 44.45703125, 46.3896484375, 48.322265625, 50.2548828125, 52.1875]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 8.0, 38.0, 165.0, 292.0, 318.0, 149.0, 37.0, 9.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.66176700592041, -5.574765682220459, -4.487764358520508, -3.4007625579833984, -2.3137612342834473, -1.226759910583496, -0.13975811004638672, 0.9472432136535645, 2.0342445373535156, 3.121245861053467, 4.208247184753418, 5.295248985290527, 6.3822503089904785, 7.46925163269043, 8.556253433227539, 9.643255233764648, 10.730256080627441, 11.81725788116455, 12.904258728027344, 13.991260528564453, 15.078262329101562, 16.165264129638672, 17.25226593017578, 18.339265823364258, 19.426267623901367, 20.513269424438477, 21.600271224975586, 22.687271118164062, 23.774272918701172, 24.86127471923828, 25.94827651977539, 27.0352783203125, 28.12228012084961, 29.20928192138672, 30.296283721923828, 31.383285522460938, 32.47028732299805, 33.557289123535156, 34.644287109375, 35.73128890991211, 36.81829071044922, 37.90529251098633, 38.99229431152344, 40.07929611206055, 41.166297912597656, 42.2532958984375, 43.340301513671875, 44.42729949951172, 45.514305114746094, 46.6013069152832, 47.68830871582031, 48.77531051635742, 49.86231231689453, 50.949310302734375, 52.03631591796875, 53.123313903808594, 54.2103157043457, 55.29731750488281, 56.38431930541992, 57.47132110595703, 58.55832290649414, 59.64532470703125, 60.732322692871094, 61.8193244934082, 62.90632629394531]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [4.0, 3.0, 6.0, 3.0, 4.0, 5.0, 7.0, 8.0, 6.0, 7.0, 12.0, 15.0, 10.0, 28.0, 22.0, 20.0, 20.0, 26.0, 31.0, 33.0, 37.0, 34.0, 36.0, 41.0, 41.0, 47.0, 34.0, 43.0, 43.0, 39.0, 30.0, 24.0, 42.0, 38.0, 33.0, 31.0, 27.0, 23.0, 16.0, 15.0, 16.0, 14.0, 13.0, 10.0, 4.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.7840576171875, -20.971065521240234, -20.1580753326416, -19.345083236694336, -18.532093048095703, -17.719100952148438, -16.906108856201172, -16.093116760253906, -15.280126571655273, -14.467135429382324, -13.654144287109375, -12.84115219116211, -12.02816104888916, -11.215169906616211, -10.402177810668945, -9.589186668395996, -8.776195526123047, -7.963204383850098, -7.15021276473999, -6.337221145629883, -5.524230003356934, -4.711238861083984, -3.898247241973877, -3.0852556228637695, -2.2722644805908203, -1.459273099899292, -0.6462817192077637, 0.16670966148376465, 0.979701042175293, 1.7926921844482422, 2.6056838035583496, 3.418675422668457, 4.231666564941406, 5.0446577072143555, 5.857649326324463, 6.67064094543457, 7.4836320877075195, 8.296623229980469, 9.109615325927734, 9.922606468200684, 10.735597610473633, 11.548588752746582, 12.361579895019531, 13.174571990966797, 13.987563133239746, 14.800554275512695, 15.613546371459961, 16.426536560058594, 17.23952865600586, 18.052520751953125, 18.865510940551758, 19.678503036499023, 20.491493225097656, 21.304485321044922, 22.117477416992188, 22.930469512939453, 23.743459701538086, 24.55645179748535, 25.369441986083984, 26.18243408203125, 26.995426177978516, 27.80841636657715, 28.621408462524414, 29.434398651123047, 30.247390747070312]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 2.0, 1.0, 11.0, 8.0, 11.0, 19.0, 7.0, 19.0, 22.0, 26.0, 16.0, 27.0, 28.0, 31.0, 27.0, 40.0, 32.0, 37.0, 32.0, 36.0, 39.0, 37.0, 42.0, 40.0, 36.0, 40.0, 35.0, 38.0, 38.0, 32.0, 23.0, 24.0, 22.0, 12.0, 14.0, 19.0, 13.0, 12.0, 8.0, 15.0, 11.0, 7.0, 2.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.21484375, -3.116058349609375, -3.01727294921875, -2.918487548828125, -2.8197021484375, -2.720916748046875, -2.62213134765625, -2.523345947265625, -2.424560546875, -2.325775146484375, -2.22698974609375, -2.128204345703125, -2.0294189453125, -1.930633544921875, -1.83184814453125, -1.733062744140625, -1.63427734375, -1.535491943359375, -1.43670654296875, -1.337921142578125, -1.2391357421875, -1.140350341796875, -1.04156494140625, -0.942779541015625, -0.843994140625, -0.745208740234375, -0.64642333984375, -0.547637939453125, -0.4488525390625, -0.350067138671875, -0.25128173828125, -0.152496337890625, -0.0537109375, 0.045074462890625, 0.14385986328125, 0.242645263671875, 0.3414306640625, 0.440216064453125, 0.53900146484375, 0.637786865234375, 0.736572265625, 0.835357666015625, 0.93414306640625, 1.032928466796875, 1.1317138671875, 1.230499267578125, 1.32928466796875, 1.428070068359375, 1.52685546875, 1.625640869140625, 1.72442626953125, 1.823211669921875, 1.9219970703125, 2.020782470703125, 2.11956787109375, 2.218353271484375, 2.317138671875, 2.415924072265625, 2.51470947265625, 2.613494873046875, 2.7122802734375, 2.811065673828125, 2.90985107421875, 3.008636474609375, 3.107421875]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 7.0, 5.0, 11.0, 14.0, 14.0, 24.0, 23.0, 39.0, 44.0, 44.0, 54.0, 63.0, 74.0, 94.0, 124.0, 167.0, 342.0, 699.0, 3017.0, 32336.0, 598964.0, 2567670.0, 927391.0, 56354.0, 4565.0, 926.0, 391.0, 199.0, 134.0, 100.0, 78.0, 35.0, 47.0, 38.0, 33.0, 27.0, 26.0, 26.0, 19.0, 19.0, 13.0, 8.0, 4.0, 11.0, 6.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.515625, -7.2850341796875, -7.054443359375, -6.8238525390625, -6.59326171875, -6.3626708984375, -6.132080078125, -5.9014892578125, -5.6708984375, -5.4403076171875, -5.209716796875, -4.9791259765625, -4.74853515625, -4.5179443359375, -4.287353515625, -4.0567626953125, -3.826171875, -3.5955810546875, -3.364990234375, -3.1343994140625, -2.90380859375, -2.6732177734375, -2.442626953125, -2.2120361328125, -1.9814453125, -1.7508544921875, -1.520263671875, -1.2896728515625, -1.05908203125, -0.8284912109375, -0.597900390625, -0.3673095703125, -0.13671875, 0.0938720703125, 0.324462890625, 0.5550537109375, 0.78564453125, 1.0162353515625, 1.246826171875, 1.4774169921875, 1.7080078125, 1.9385986328125, 2.169189453125, 2.3997802734375, 2.63037109375, 2.8609619140625, 3.091552734375, 3.3221435546875, 3.552734375, 3.7833251953125, 4.013916015625, 4.2445068359375, 4.47509765625, 4.7056884765625, 4.936279296875, 5.1668701171875, 5.3974609375, 5.6280517578125, 5.858642578125, 6.0892333984375, 6.31982421875, 6.5504150390625, 6.781005859375, 7.0115966796875, 7.2421875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 2.0, 5.0, 2.0, 2.0, 0.0, 5.0, 8.0, 12.0, 10.0, 18.0, 24.0, 29.0, 27.0, 58.0, 70.0, 71.0, 98.0, 157.0, 151.0, 193.0, 277.0, 299.0, 364.0, 384.0, 347.0, 311.0, 258.0, 183.0, 154.0, 127.0, 92.0, 73.0, 54.0, 41.0, 40.0, 26.0, 29.0, 16.0, 13.0, 8.0, 7.0, 9.0, 7.0, 4.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0], "bins": [-5.875, -5.70941162109375, -5.5438232421875, -5.37823486328125, -5.212646484375, -5.04705810546875, -4.8814697265625, -4.71588134765625, -4.55029296875, -4.38470458984375, -4.2191162109375, -4.05352783203125, -3.887939453125, -3.72235107421875, -3.5567626953125, -3.39117431640625, -3.2255859375, -3.05999755859375, -2.8944091796875, -2.72882080078125, -2.563232421875, -2.39764404296875, -2.2320556640625, -2.06646728515625, -1.90087890625, -1.73529052734375, -1.5697021484375, -1.40411376953125, -1.238525390625, -1.07293701171875, -0.9073486328125, -0.74176025390625, -0.576171875, -0.41058349609375, -0.2449951171875, -0.07940673828125, 0.086181640625, 0.25177001953125, 0.4173583984375, 0.58294677734375, 0.74853515625, 0.91412353515625, 1.0797119140625, 1.24530029296875, 1.410888671875, 1.57647705078125, 1.7420654296875, 1.90765380859375, 2.0732421875, 2.23883056640625, 2.4044189453125, 2.57000732421875, 2.735595703125, 2.90118408203125, 3.0667724609375, 3.23236083984375, 3.39794921875, 3.56353759765625, 3.7291259765625, 3.89471435546875, 4.060302734375, 4.22589111328125, 4.3914794921875, 4.55706787109375, 4.72265625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 3.0, 2.0, 7.0, 2.0, 7.0, 6.0, 9.0, 12.0, 13.0, 17.0, 24.0, 36.0, 42.0, 38.0, 63.0, 85.0, 111.0, 162.0, 239.0, 317.0, 459.0, 1483.0, 179444.0, 3979257.0, 30054.0, 878.0, 407.0, 255.0, 218.0, 150.0, 108.0, 97.0, 76.0, 59.0, 36.0, 22.0, 23.0, 20.0, 11.0, 8.0, 8.0, 5.0, 3.0, 1.0, 3.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.890625, -22.111083984375, -21.33154296875, -20.552001953125, -19.7724609375, -18.992919921875, -18.21337890625, -17.433837890625, -16.654296875, -15.874755859375, -15.09521484375, -14.315673828125, -13.5361328125, -12.756591796875, -11.97705078125, -11.197509765625, -10.41796875, -9.638427734375, -8.85888671875, -8.079345703125, -7.2998046875, -6.520263671875, -5.74072265625, -4.961181640625, -4.181640625, -3.402099609375, -2.62255859375, -1.843017578125, -1.0634765625, -0.283935546875, 0.49560546875, 1.275146484375, 2.0546875, 2.834228515625, 3.61376953125, 4.393310546875, 5.1728515625, 5.952392578125, 6.73193359375, 7.511474609375, 8.291015625, 9.070556640625, 9.85009765625, 10.629638671875, 11.4091796875, 12.188720703125, 12.96826171875, 13.747802734375, 14.52734375, 15.306884765625, 16.08642578125, 16.865966796875, 17.6455078125, 18.425048828125, 19.20458984375, 19.984130859375, 20.763671875, 21.543212890625, 22.32275390625, 23.102294921875, 23.8818359375, 24.661376953125, 25.44091796875, 26.220458984375, 27.0]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 48.0, 340.0, 448.0, 160.0, 13.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.03895950317383, -29.493732452392578, -25.948505401611328, -22.403278350830078, -18.858051300048828, -15.312822341918945, -11.767595291137695, -8.222368240356445, -4.677141189575195, -1.1319139003753662, 2.413313388824463, 5.958540916442871, 9.503767967224121, 13.048995971679688, 16.594223022460938, 20.139450073242188, 23.684677124023438, 27.229904174804688, 30.775131225585938, 34.32035827636719, 37.86558532714844, 41.41081237792969, 44.95603942871094, 48.50126647949219, 52.04649353027344, 55.59172058105469, 59.13694763183594, 62.68217468261719, 66.22740173339844, 69.77262878417969, 73.31785583496094, 76.86308288574219, 80.40831756591797, 83.95354461669922, 87.49877166748047, 91.04399871826172, 94.58922576904297, 98.13445281982422, 101.67967987060547, 105.22490692138672, 108.77013397216797, 112.31536102294922, 115.86058807373047, 119.40581512451172, 122.95104217529297, 126.49626922607422, 130.04150390625, 133.58673095703125, 137.1319580078125, 140.67718505859375, 144.222412109375, 147.76763916015625, 151.3128662109375, 154.85809326171875, 158.4033203125, 161.94854736328125, 165.4937744140625, 169.03900146484375, 172.584228515625, 176.12945556640625, 179.6746826171875, 183.21990966796875, 186.76513671875, 190.31036376953125, 193.8555908203125]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 9.0, 4.0, 10.0, 14.0, 12.0, 21.0, 21.0, 18.0, 29.0, 16.0, 18.0, 37.0, 27.0, 27.0, 29.0, 45.0, 43.0, 43.0, 42.0, 38.0, 49.0, 40.0, 47.0, 39.0, 32.0, 38.0, 37.0, 23.0, 28.0, 25.0, 20.0, 18.0, 16.0, 14.0, 15.0, 12.0, 10.0, 7.0, 4.0, 8.0, 5.0, 2.0, 3.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.97812271118164, -20.312986373901367, -19.647851943969727, -18.982715606689453, -18.31757926940918, -17.65244483947754, -16.987308502197266, -16.322174072265625, -15.657037734985352, -14.991902351379395, -14.326766014099121, -13.661630630493164, -12.996495246887207, -12.33135986328125, -11.666223526000977, -11.00108814239502, -10.335951805114746, -9.670816421508789, -9.005680084228516, -8.340544700622559, -7.675409317016602, -7.010273456573486, -6.345137596130371, -5.680002212524414, -5.014866352081299, -4.349730491638184, -3.6845951080322266, -3.0194592475891113, -2.354323625564575, -1.689188003540039, -1.0240521430969238, -0.3589167594909668, 0.30621910095214844, 0.9713547825813293, 1.6364904642105103, 2.301626205444336, 2.966761827468872, 3.631897449493408, 4.297033309936523, 4.9621686935424805, 5.627304553985596, 6.292440414428711, 6.957575798034668, 7.622711658477783, 8.287847518920898, 8.952982902526855, 9.618118286132812, 10.283254623413086, 10.948390007019043, 11.613525390625, 12.278661727905273, 12.94379711151123, 13.608932495117188, 14.274068832397461, 14.939204216003418, 15.604339599609375, 16.26947593688965, 16.934612274169922, 17.599746704101562, 18.264883041381836, 18.93001937866211, 19.59515380859375, 20.260290145874023, 20.925426483154297, 21.590560913085938]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 4.0, 2.0, 9.0, 9.0, 10.0, 11.0, 11.0, 16.0, 20.0, 26.0, 21.0, 22.0, 26.0, 22.0, 35.0, 29.0, 31.0, 33.0, 43.0, 32.0, 47.0, 44.0, 41.0, 43.0, 38.0, 41.0, 37.0, 37.0, 31.0, 26.0, 25.0, 25.0, 24.0, 14.0, 23.0, 23.0, 22.0, 7.0, 7.0, 5.0, 7.0, 7.0, 7.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.986328125, -2.892425537109375, -2.79852294921875, -2.704620361328125, -2.6107177734375, -2.516815185546875, -2.42291259765625, -2.329010009765625, -2.235107421875, -2.141204833984375, -2.04730224609375, -1.953399658203125, -1.8594970703125, -1.765594482421875, -1.67169189453125, -1.577789306640625, -1.48388671875, -1.389984130859375, -1.29608154296875, -1.202178955078125, -1.1082763671875, -1.014373779296875, -0.92047119140625, -0.826568603515625, -0.732666015625, -0.638763427734375, -0.54486083984375, -0.450958251953125, -0.3570556640625, -0.263153076171875, -0.16925048828125, -0.075347900390625, 0.0185546875, 0.112457275390625, 0.20635986328125, 0.300262451171875, 0.3941650390625, 0.488067626953125, 0.58197021484375, 0.675872802734375, 0.769775390625, 0.863677978515625, 0.95758056640625, 1.051483154296875, 1.1453857421875, 1.239288330078125, 1.33319091796875, 1.427093505859375, 1.52099609375, 1.614898681640625, 1.70880126953125, 1.802703857421875, 1.8966064453125, 1.990509033203125, 2.08441162109375, 2.178314208984375, 2.272216796875, 2.366119384765625, 2.46002197265625, 2.553924560546875, 2.6478271484375, 2.741729736328125, 2.83563232421875, 2.929534912109375, 3.0234375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 8.0, 10.0, 10.0, 28.0, 31.0, 45.0, 49.0, 88.0, 128.0, 161.0, 226.0, 340.0, 486.0, 693.0, 983.0, 1409.0, 2027.0, 3035.0, 4470.0, 6369.0, 9326.0, 13735.0, 20403.0, 30290.0, 47389.0, 77297.0, 140666.0, 259590.0, 175258.0, 92252.0, 54743.0, 34735.0, 23021.0, 15595.0, 10592.0, 7172.0, 4969.0, 3331.0, 2298.0, 1608.0, 1151.0, 757.0, 549.0, 385.0, 247.0, 166.0, 141.0, 94.0, 56.0, 52.0, 31.0, 26.0, 16.0, 10.0, 8.0, 8.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.485595703125, -0.4702568054199219, -0.45491790771484375, -0.4395790100097656, -0.4242401123046875, -0.4089012145996094, -0.39356231689453125, -0.3782234191894531, -0.362884521484375, -0.3475456237792969, -0.33220672607421875, -0.3168678283691406, -0.3015289306640625, -0.2861900329589844, -0.27085113525390625, -0.2555122375488281, -0.24017333984375, -0.22483444213867188, -0.20949554443359375, -0.19415664672851562, -0.1788177490234375, -0.16347885131835938, -0.14813995361328125, -0.13280105590820312, -0.117462158203125, -0.10212326049804688, -0.08678436279296875, -0.07144546508789062, -0.0561065673828125, -0.040767669677734375, -0.02542877197265625, -0.010089874267578125, 0.0052490234375, 0.020587921142578125, 0.03592681884765625, 0.051265716552734375, 0.0666046142578125, 0.08194351196289062, 0.09728240966796875, 0.11262130737304688, 0.127960205078125, 0.14329910278320312, 0.15863800048828125, 0.17397689819335938, 0.1893157958984375, 0.20465469360351562, 0.21999359130859375, 0.23533248901367188, 0.25067138671875, 0.2660102844238281, 0.28134918212890625, 0.2966880798339844, 0.3120269775390625, 0.3273658752441406, 0.34270477294921875, 0.3580436706542969, 0.373382568359375, 0.3887214660644531, 0.40406036376953125, 0.4193992614746094, 0.4347381591796875, 0.4500770568847656, 0.46541595458984375, 0.4807548522949219, 0.49609375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 1.0, 7.0, 4.0, 4.0, 9.0, 7.0, 12.0, 20.0, 11.0, 19.0, 18.0, 12.0, 20.0, 23.0, 15.0, 26.0, 41.0, 37.0, 36.0, 37.0, 42.0, 33.0, 40.0, 1064.0, 38.0, 51.0, 33.0, 39.0, 38.0, 34.0, 30.0, 28.0, 37.0, 24.0, 33.0, 20.0, 20.0, 9.0, 7.0, 10.0, 9.0, 2.0, 8.0, 12.0, 4.0, 1.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6103515625, -1.5503692626953125, -1.490386962890625, -1.4304046630859375, -1.37042236328125, -1.3104400634765625, -1.250457763671875, -1.1904754638671875, -1.1304931640625, -1.0705108642578125, -1.010528564453125, -0.9505462646484375, -0.89056396484375, -0.8305816650390625, -0.770599365234375, -0.7106170654296875, -0.650634765625, -0.5906524658203125, -0.530670166015625, -0.4706878662109375, -0.41070556640625, -0.3507232666015625, -0.290740966796875, -0.2307586669921875, -0.1707763671875, -0.1107940673828125, -0.050811767578125, 0.0091705322265625, 0.06915283203125, 0.1291351318359375, 0.189117431640625, 0.2490997314453125, 0.30908203125, 0.3690643310546875, 0.429046630859375, 0.4890289306640625, 0.54901123046875, 0.6089935302734375, 0.668975830078125, 0.7289581298828125, 0.7889404296875, 0.8489227294921875, 0.908905029296875, 0.9688873291015625, 1.02886962890625, 1.0888519287109375, 1.148834228515625, 1.2088165283203125, 1.268798828125, 1.3287811279296875, 1.388763427734375, 1.4487457275390625, 1.50872802734375, 1.5687103271484375, 1.628692626953125, 1.6886749267578125, 1.7486572265625, 1.8086395263671875, 1.868621826171875, 1.9286041259765625, 1.98858642578125, 2.0485687255859375, 2.108551025390625, 2.1685333251953125, 2.228515625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 10.0, 9.0, 8.0, 20.0, 21.0, 40.0, 64.0, 115.0, 148.0, 221.0, 394.0, 571.0, 866.0, 1230.0, 1871.0, 2716.0, 4013.0, 6053.0, 9267.0, 14453.0, 23339.0, 37949.0, 65605.0, 124167.0, 1323091.0, 225649.0, 105287.0, 56947.0, 33597.0, 20668.0, 13314.0, 8584.0, 5668.0, 3869.0, 2463.0, 1683.0, 1094.0, 737.0, 458.0, 287.0, 209.0, 122.0, 93.0, 57.0, 41.0, 17.0, 14.0, 17.0, 11.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.49267578125, -0.475616455078125, -0.45855712890625, -0.441497802734375, -0.4244384765625, -0.407379150390625, -0.39031982421875, -0.373260498046875, -0.356201171875, -0.339141845703125, -0.32208251953125, -0.305023193359375, -0.2879638671875, -0.270904541015625, -0.25384521484375, -0.236785888671875, -0.2197265625, -0.202667236328125, -0.18560791015625, -0.168548583984375, -0.1514892578125, -0.134429931640625, -0.11737060546875, -0.100311279296875, -0.083251953125, -0.066192626953125, -0.04913330078125, -0.032073974609375, -0.0150146484375, 0.002044677734375, 0.01910400390625, 0.036163330078125, 0.05322265625, 0.070281982421875, 0.08734130859375, 0.104400634765625, 0.1214599609375, 0.138519287109375, 0.15557861328125, 0.172637939453125, 0.189697265625, 0.206756591796875, 0.22381591796875, 0.240875244140625, 0.2579345703125, 0.274993896484375, 0.29205322265625, 0.309112548828125, 0.326171875, 0.343231201171875, 0.36029052734375, 0.377349853515625, 0.3944091796875, 0.411468505859375, 0.42852783203125, 0.445587158203125, 0.462646484375, 0.479705810546875, 0.49676513671875, 0.513824462890625, 0.5308837890625, 0.547943115234375, 0.56500244140625, 0.582061767578125, 0.59912109375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 5.0, 6.0, 4.0, 6.0, 9.0, 10.0, 8.0, 17.0, 21.0, 22.0, 17.0, 32.0, 37.0, 37.0, 34.0, 45.0, 48.0, 55.0, 50.0, 57.0, 46.0, 57.0, 55.0, 41.0, 38.0, 46.0, 31.0, 31.0, 39.0, 19.0, 13.0, 16.0, 13.0, 10.0, 7.0, 9.0, 4.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000232696533203125, -0.0002246946096420288, -0.00021669268608093262, -0.00020869076251983643, -0.00020068883895874023, -0.00019268691539764404, -0.00018468499183654785, -0.00017668306827545166, -0.00016868114471435547, -0.00016067922115325928, -0.00015267729759216309, -0.0001446753740310669, -0.0001366734504699707, -0.0001286715269088745, -0.00012066960334777832, -0.00011266767978668213, -0.00010466575622558594, -9.666383266448975e-05, -8.866190910339355e-05, -8.065998554229736e-05, -7.265806198120117e-05, -6.465613842010498e-05, -5.665421485900879e-05, -4.86522912979126e-05, -4.0650367736816406e-05, -3.2648444175720215e-05, -2.4646520614624023e-05, -1.6644597053527832e-05, -8.64267349243164e-06, -6.407499313354492e-07, 7.361173629760742e-06, 1.5363097190856934e-05, 2.3365020751953125e-05, 3.1366944313049316e-05, 3.936886787414551e-05, 4.73707914352417e-05, 5.537271499633789e-05, 6.337463855743408e-05, 7.137656211853027e-05, 7.937848567962646e-05, 8.738040924072266e-05, 9.538233280181885e-05, 0.00010338425636291504, 0.00011138617992401123, 0.00011938810348510742, 0.0001273900270462036, 0.0001353919506072998, 0.000143393874168396, 0.0001513957977294922, 0.00015939772129058838, 0.00016739964485168457, 0.00017540156841278076, 0.00018340349197387695, 0.00019140541553497314, 0.00019940733909606934, 0.00020740926265716553, 0.00021541118621826172, 0.0002234131097793579, 0.0002314150333404541, 0.0002394169569015503, 0.0002474188804626465, 0.0002554208040237427, 0.00026342272758483887, 0.00027142465114593506, 0.00027942657470703125]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 1.0, 2.0, 2.0, 5.0, 7.0, 7.0, 7.0, 15.0, 19.0, 23.0, 25.0, 45.0, 51.0, 59.0, 76.0, 92.0, 125.0, 254.0, 513.0, 1477.0, 415731.0, 626699.0, 1806.0, 572.0, 271.0, 173.0, 110.0, 77.0, 61.0, 45.0, 51.0, 30.0, 29.0, 27.0, 14.0, 13.0, 9.0, 6.0, 11.0, 9.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0], "bins": [-0.006122589111328125, -0.005952715873718262, -0.0057828426361083984, -0.005612969398498535, -0.005443096160888672, -0.005273222923278809, -0.005103349685668945, -0.004933476448059082, -0.004763603210449219, -0.0045937299728393555, -0.004423856735229492, -0.004253983497619629, -0.004084110260009766, -0.003914237022399902, -0.003744363784790039, -0.0035744905471801758, -0.0034046173095703125, -0.0032347440719604492, -0.003064870834350586, -0.0028949975967407227, -0.0027251243591308594, -0.002555251121520996, -0.002385377883911133, -0.0022155046463012695, -0.0020456314086914062, -0.001875758171081543, -0.0017058849334716797, -0.0015360116958618164, -0.0013661384582519531, -0.0011962652206420898, -0.0010263919830322266, -0.0008565187454223633, -0.0006866455078125, -0.0005167722702026367, -0.00034689903259277344, -0.00017702579498291016, -7.152557373046875e-06, 0.0001627206802368164, 0.0003325939178466797, 0.000502467155456543, 0.0006723403930664062, 0.0008422136306762695, 0.0010120868682861328, 0.001181960105895996, 0.0013518333435058594, 0.0015217065811157227, 0.001691579818725586, 0.0018614530563354492, 0.0020313262939453125, 0.0022011995315551758, 0.002371072769165039, 0.0025409460067749023, 0.0027108192443847656, 0.002880692481994629, 0.003050565719604492, 0.0032204389572143555, 0.0033903121948242188, 0.003560185432434082, 0.0037300586700439453, 0.0038999319076538086, 0.004069805145263672, 0.004239678382873535, 0.0044095516204833984, 0.004579424858093262, 0.004749298095703125]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 6.0, 19.0, 28.0, 34.0, 76.0, 120.0, 126.0, 130.0, 133.0, 127.0, 81.0, 49.0, 41.0, 14.0, 13.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.00014169173664413393, -0.00013415678404271603, -0.00012662183144129813, -0.00011908687883988023, -0.00011155191896250471, -0.00010401696636108682, -9.648201375966892e-05, -8.89470538822934e-05, -8.14121012808755e-05, -7.38771486794576e-05, -6.63421960780397e-05, -5.8807239838643e-05, -5.127228359924629e-05, -4.3737330997828394e-05, -3.6202378396410495e-05, -2.866742215701379e-05, -2.1132473193574697e-05, -1.3597518773167394e-05, -6.062565262254793e-06, 1.4723882486578077e-06, 9.00734266906511e-06, 1.6542297089472413e-05, 2.4077249690890312e-05, 3.161220593028702e-05, 3.914715853170492e-05, 4.668211113312282e-05, 5.421706737251952e-05, 6.175201997393742e-05, 6.928697257535532e-05, 7.682193245273083e-05, 8.435688505414873e-05, 9.189183765556663e-05, 9.942679025698453e-05, 0.00010696174285840243, 0.00011449669545982033, 0.00012203164806123823, 0.00012956660066265613, 0.00013710156781598926, 0.00014463652041740716, 0.00015217147301882505, 0.00015970642562024295, 0.00016724137822166085, 0.00017477633082307875, 0.00018231128342449665, 0.00018984623602591455, 0.00019738118862733245, 0.00020491614122875035, 0.00021245110838208348, 0.00021998604643158615, 0.00022752099903300405, 0.00023505595163442194, 0.00024259090423583984, 0.00025012585683725774, 0.00025766080943867564, 0.00026519576204009354, 0.00027273071464151144, 0.0002802656963467598, 0.0002878006489481777, 0.0002953356015495956, 0.0003028705541510135, 0.0003104055067524314, 0.0003179404593538493, 0.0003254754119552672, 0.0003330103645566851, 0.000340545317158103]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 1.0, 7.0, 4.0, 2.0, 5.0, 11.0, 15.0, 11.0, 19.0, 10.0, 24.0, 31.0, 47.0, 23.0, 30.0, 33.0, 40.0, 39.0, 39.0, 39.0, 42.0, 38.0, 42.0, 37.0, 39.0, 41.0, 33.0, 35.0, 30.0, 28.0, 33.0, 29.0, 16.0, 19.0, 23.0, 19.0, 13.0, 14.0, 8.0, 5.0, 10.0, 2.0, 7.0, 3.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.00014823675155639648, -0.0001438213512301445, -0.00013940595090389252, -0.00013499055057764053, -0.00013057515025138855, -0.00012615974992513657, -0.00012174434959888458, -0.0001173289492726326, -0.00011291354894638062, -0.00010849814862012863, -0.00010408274829387665, -9.966734796762466e-05, -9.525194764137268e-05, -9.08365473151207e-05, -8.642114698886871e-05, -8.200574666261673e-05, -7.759034633636475e-05, -7.317494601011276e-05, -6.875954568386078e-05, -6.43441453576088e-05, -5.992874503135681e-05, -5.551334470510483e-05, -5.1097944378852844e-05, -4.668254405260086e-05, -4.226714372634888e-05, -3.785174340009689e-05, -3.343634307384491e-05, -2.9020942747592926e-05, -2.4605542421340942e-05, -2.019014209508896e-05, -1.5774741768836975e-05, -1.1359341442584991e-05, -6.943941116333008e-06, -2.528540790081024e-06, 1.8868595361709595e-06, 6.302259862422943e-06, 1.0717660188674927e-05, 1.513306051492691e-05, 1.9548460841178894e-05, 2.3963861167430878e-05, 2.837926149368286e-05, 3.2794661819934845e-05, 3.721006214618683e-05, 4.162546247243881e-05, 4.6040862798690796e-05, 5.045626312494278e-05, 5.487166345119476e-05, 5.928706377744675e-05, 6.370246410369873e-05, 6.811786442995071e-05, 7.25332647562027e-05, 7.694866508245468e-05, 8.136406540870667e-05, 8.577946573495865e-05, 9.019486606121063e-05, 9.461026638746262e-05, 9.90256667137146e-05, 0.00010344106703996658, 0.00010785646736621857, 0.00011227186769247055, 0.00011668726801872253, 0.00012110266834497452, 0.0001255180686712265, 0.00012993346899747849, 0.00013434886932373047]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 4.0, 2.0, 9.0, 9.0, 10.0, 11.0, 11.0, 16.0, 20.0, 26.0, 21.0, 22.0, 26.0, 22.0, 35.0, 29.0, 31.0, 33.0, 43.0, 32.0, 47.0, 44.0, 41.0, 43.0, 38.0, 41.0, 37.0, 37.0, 31.0, 26.0, 25.0, 25.0, 24.0, 14.0, 23.0, 23.0, 22.0, 7.0, 7.0, 5.0, 7.0, 7.0, 7.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.986328125, -2.892425537109375, -2.79852294921875, -2.704620361328125, -2.6107177734375, -2.516815185546875, -2.42291259765625, -2.329010009765625, -2.235107421875, -2.141204833984375, -2.04730224609375, -1.953399658203125, -1.8594970703125, -1.765594482421875, -1.67169189453125, -1.577789306640625, -1.48388671875, -1.389984130859375, -1.29608154296875, -1.202178955078125, -1.1082763671875, -1.014373779296875, -0.92047119140625, -0.826568603515625, -0.732666015625, -0.638763427734375, -0.54486083984375, -0.450958251953125, -0.3570556640625, -0.263153076171875, -0.16925048828125, -0.075347900390625, 0.0185546875, 0.112457275390625, 0.20635986328125, 0.300262451171875, 0.3941650390625, 0.488067626953125, 0.58197021484375, 0.675872802734375, 0.769775390625, 0.863677978515625, 0.95758056640625, 1.051483154296875, 1.1453857421875, 1.239288330078125, 1.33319091796875, 1.427093505859375, 1.52099609375, 1.614898681640625, 1.70880126953125, 1.802703857421875, 1.8966064453125, 1.990509033203125, 2.08441162109375, 2.178314208984375, 2.272216796875, 2.366119384765625, 2.46002197265625, 2.553924560546875, 2.6478271484375, 2.741729736328125, 2.83563232421875, 2.929534912109375, 3.0234375]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 5.0, 6.0, 8.0, 9.0, 9.0, 10.0, 20.0, 23.0, 37.0, 56.0, 69.0, 112.0, 242.0, 452.0, 1027.0, 2129.0, 4464.0, 9401.0, 19415.0, 43619.0, 110736.0, 291262.0, 336562.0, 133614.0, 52083.0, 22587.0, 10619.0, 5173.0, 2425.0, 1115.0, 566.0, 280.0, 137.0, 81.0, 49.0, 38.0, 34.0, 26.0, 14.0, 11.0, 7.0, 6.0, 7.0, 3.0, 7.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.91796875, -2.821014404296875, -2.72406005859375, -2.627105712890625, -2.5301513671875, -2.433197021484375, -2.33624267578125, -2.239288330078125, -2.142333984375, -2.045379638671875, -1.94842529296875, -1.851470947265625, -1.7545166015625, -1.657562255859375, -1.56060791015625, -1.463653564453125, -1.36669921875, -1.269744873046875, -1.17279052734375, -1.075836181640625, -0.9788818359375, -0.881927490234375, -0.78497314453125, -0.688018798828125, -0.591064453125, -0.494110107421875, -0.39715576171875, -0.300201416015625, -0.2032470703125, -0.106292724609375, -0.00933837890625, 0.087615966796875, 0.1845703125, 0.281524658203125, 0.37847900390625, 0.475433349609375, 0.5723876953125, 0.669342041015625, 0.76629638671875, 0.863250732421875, 0.960205078125, 1.057159423828125, 1.15411376953125, 1.251068115234375, 1.3480224609375, 1.444976806640625, 1.54193115234375, 1.638885498046875, 1.73583984375, 1.832794189453125, 1.92974853515625, 2.026702880859375, 2.1236572265625, 2.220611572265625, 2.31756591796875, 2.414520263671875, 2.511474609375, 2.608428955078125, 2.70538330078125, 2.802337646484375, 2.8992919921875, 2.996246337890625, 3.09320068359375, 3.190155029296875, 3.287109375]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 11.0, 9.0, 9.0, 12.0, 13.0, 13.0, 19.0, 33.0, 23.0, 35.0, 27.0, 34.0, 49.0, 51.0, 71.0, 150.0, 452.0, 1468.0, 146.0, 73.0, 52.0, 53.0, 42.0, 35.0, 29.0, 23.0, 16.0, 14.0, 23.0, 16.0, 10.0, 9.0, 3.0, 5.0, 7.0, 6.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.46875, -13.02001953125, -12.5712890625, -12.12255859375, -11.673828125, -11.22509765625, -10.7763671875, -10.32763671875, -9.87890625, -9.43017578125, -8.9814453125, -8.53271484375, -8.083984375, -7.63525390625, -7.1865234375, -6.73779296875, -6.2890625, -5.84033203125, -5.3916015625, -4.94287109375, -4.494140625, -4.04541015625, -3.5966796875, -3.14794921875, -2.69921875, -2.25048828125, -1.8017578125, -1.35302734375, -0.904296875, -0.45556640625, -0.0068359375, 0.44189453125, 0.890625, 1.33935546875, 1.7880859375, 2.23681640625, 2.685546875, 3.13427734375, 3.5830078125, 4.03173828125, 4.48046875, 4.92919921875, 5.3779296875, 5.82666015625, 6.275390625, 6.72412109375, 7.1728515625, 7.62158203125, 8.0703125, 8.51904296875, 8.9677734375, 9.41650390625, 9.865234375, 10.31396484375, 10.7626953125, 11.21142578125, 11.66015625, 12.10888671875, 12.5576171875, 13.00634765625, 13.455078125, 13.90380859375, 14.3525390625, 14.80126953125, 15.25]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 6.0, 3.0, 3.0, 10.0, 7.0, 18.0, 16.0, 20.0, 26.0, 24.0, 40.0, 40.0, 40.0, 93.0, 127.0, 187.0, 325.0, 580.0, 2871.0, 3029789.0, 109090.0, 1086.0, 432.0, 261.0, 156.0, 120.0, 89.0, 56.0, 39.0, 34.0, 20.0, 28.0, 24.0, 11.0, 16.0, 9.0, 3.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.90625, -37.6826171875, -36.458984375, -35.2353515625, -34.01171875, -32.7880859375, -31.564453125, -30.3408203125, -29.1171875, -27.8935546875, -26.669921875, -25.4462890625, -24.22265625, -22.9990234375, -21.775390625, -20.5517578125, -19.328125, -18.1044921875, -16.880859375, -15.6572265625, -14.43359375, -13.2099609375, -11.986328125, -10.7626953125, -9.5390625, -8.3154296875, -7.091796875, -5.8681640625, -4.64453125, -3.4208984375, -2.197265625, -0.9736328125, 0.25, 1.4736328125, 2.697265625, 3.9208984375, 5.14453125, 6.3681640625, 7.591796875, 8.8154296875, 10.0390625, 11.2626953125, 12.486328125, 13.7099609375, 14.93359375, 16.1572265625, 17.380859375, 18.6044921875, 19.828125, 21.0517578125, 22.275390625, 23.4990234375, 24.72265625, 25.9462890625, 27.169921875, 28.3935546875, 29.6171875, 30.8408203125, 32.064453125, 33.2880859375, 34.51171875, 35.7353515625, 36.958984375, 38.1826171875, 39.40625]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 9.0, 22.0, 148.0, 372.0, 331.0, 109.0, 20.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.757884979248047, -26.49295425415039, -25.228025436401367, -23.96309471130371, -22.698165893554688, -21.43323516845703, -20.168304443359375, -18.90337371826172, -17.638444900512695, -16.37351417541504, -15.108585357666016, -13.84365463256836, -12.57872486114502, -11.31379508972168, -10.048864364624023, -8.783934593200684, -7.519004821777344, -6.254075050354004, -4.989144802093506, -3.724214792251587, -2.459284782409668, -1.1943550109863281, 0.07057523727416992, 1.335505485534668, 2.600435256958008, 3.8653652667999268, 5.130295276641846, 6.395225524902344, 7.660155296325684, 8.925085067749023, 10.19001579284668, 11.45494556427002, 12.719871520996094, 13.984801292419434, 15.249731063842773, 16.51466178894043, 17.779590606689453, 19.04452133178711, 20.309452056884766, 21.574382781982422, 22.839311599731445, 24.1042423248291, 25.369171142578125, 26.63410186767578, 27.899032592773438, 29.16396141052246, 30.428892135620117, 31.69382095336914, 32.9587516784668, 34.22368240356445, 35.48861312866211, 36.7535400390625, 38.018470764160156, 39.28340148925781, 40.54833221435547, 41.813262939453125, 43.07819366455078, 44.34312438964844, 45.608055114746094, 46.872982025146484, 48.13791275024414, 49.4028434753418, 50.66777420043945, 51.93270492553711, 53.1976318359375]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 4.0, 4.0, 5.0, 6.0, 10.0, 10.0, 8.0, 17.0, 21.0, 17.0, 23.0, 25.0, 18.0, 22.0, 26.0, 40.0, 39.0, 32.0, 33.0, 36.0, 51.0, 24.0, 34.0, 50.0, 43.0, 39.0, 35.0, 42.0, 46.0, 34.0, 24.0, 27.0, 15.0, 26.0, 18.0, 16.0, 17.0, 5.0, 11.0, 16.0, 5.0, 6.0, 4.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-28.774852752685547, -27.903209686279297, -27.031564712524414, -26.159921646118164, -25.28827667236328, -24.41663360595703, -23.54499053955078, -22.67334747314453, -21.80170249938965, -20.9300594329834, -20.058414459228516, -19.186771392822266, -18.315128326416016, -17.443483352661133, -16.571840286254883, -15.700196266174316, -14.82855224609375, -13.956908226013184, -13.085264205932617, -12.213621139526367, -11.3419771194458, -10.470333099365234, -9.598690032958984, -8.727046012878418, -7.855401992797852, -6.983757972717285, -6.112114429473877, -5.240470886230469, -4.368826866149902, -3.497182846069336, -2.6255393028259277, -1.7538957595825195, -0.8822498321533203, -0.010606050491333008, 0.8610377311706543, 1.7326815128326416, 2.604325294494629, 3.4759693145751953, 4.3476128578186035, 5.219256401062012, 6.090900421142578, 6.9625444412231445, 7.834187984466553, 8.705831527709961, 9.577475547790527, 10.449119567871094, 11.320762634277344, 12.19240665435791, 13.064050674438477, 13.935694694519043, 14.80733871459961, 15.67898178100586, 16.55062484741211, 17.422269821166992, 18.293912887573242, 19.165557861328125, 20.037200927734375, 20.908843994140625, 21.780488967895508, 22.652132034301758, 23.52377700805664, 24.39542007446289, 25.26706314086914, 26.13870620727539, 27.010351181030273]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 6.0, 4.0, 4.0, 9.0, 9.0, 11.0, 10.0, 17.0, 20.0, 25.0, 22.0, 25.0, 28.0, 32.0, 27.0, 40.0, 35.0, 42.0, 41.0, 37.0, 34.0, 47.0, 40.0, 38.0, 41.0, 51.0, 34.0, 32.0, 29.0, 42.0, 24.0, 21.0, 17.0, 20.0, 22.0, 13.0, 9.0, 9.0, 14.0, 1.0, 6.0, 6.0, 1.0, 5.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4453125, -3.33453369140625, -3.2237548828125, -3.11297607421875, -3.002197265625, -2.89141845703125, -2.7806396484375, -2.66986083984375, -2.55908203125, -2.44830322265625, -2.3375244140625, -2.22674560546875, -2.115966796875, -2.00518798828125, -1.8944091796875, -1.78363037109375, -1.6728515625, -1.56207275390625, -1.4512939453125, -1.34051513671875, -1.229736328125, -1.11895751953125, -1.0081787109375, -0.89739990234375, -0.78662109375, -0.67584228515625, -0.5650634765625, -0.45428466796875, -0.343505859375, -0.23272705078125, -0.1219482421875, -0.01116943359375, 0.099609375, 0.21038818359375, 0.3211669921875, 0.43194580078125, 0.542724609375, 0.65350341796875, 0.7642822265625, 0.87506103515625, 0.98583984375, 1.09661865234375, 1.2073974609375, 1.31817626953125, 1.428955078125, 1.53973388671875, 1.6505126953125, 1.76129150390625, 1.8720703125, 1.98284912109375, 2.0936279296875, 2.20440673828125, 2.315185546875, 2.42596435546875, 2.5367431640625, 2.64752197265625, 2.75830078125, 2.86907958984375, 2.9798583984375, 3.09063720703125, 3.201416015625, 3.31219482421875, 3.4229736328125, 3.53375244140625, 3.64453125]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 6.0, 7.0, 4.0, 5.0, 5.0, 9.0, 9.0, 18.0, 27.0, 25.0, 32.0, 34.0, 44.0, 64.0, 87.0, 102.0, 173.0, 315.0, 880.0, 4307.0, 141100.0, 2864240.0, 1155364.0, 24208.0, 1920.0, 498.0, 240.0, 142.0, 97.0, 63.0, 50.0, 48.0, 27.0, 36.0, 23.0, 22.0, 14.0, 13.0, 7.0, 6.0, 6.0, 2.0, 2.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.2109375, -9.8680419921875, -9.525146484375, -9.1822509765625, -8.83935546875, -8.4964599609375, -8.153564453125, -7.8106689453125, -7.4677734375, -7.1248779296875, -6.781982421875, -6.4390869140625, -6.09619140625, -5.7532958984375, -5.410400390625, -5.0675048828125, -4.724609375, -4.3817138671875, -4.038818359375, -3.6959228515625, -3.35302734375, -3.0101318359375, -2.667236328125, -2.3243408203125, -1.9814453125, -1.6385498046875, -1.295654296875, -0.9527587890625, -0.60986328125, -0.2669677734375, 0.075927734375, 0.4188232421875, 0.76171875, 1.1046142578125, 1.447509765625, 1.7904052734375, 2.13330078125, 2.4761962890625, 2.819091796875, 3.1619873046875, 3.5048828125, 3.8477783203125, 4.190673828125, 4.5335693359375, 4.87646484375, 5.2193603515625, 5.562255859375, 5.9051513671875, 6.248046875, 6.5909423828125, 6.933837890625, 7.2767333984375, 7.61962890625, 7.9625244140625, 8.305419921875, 8.6483154296875, 8.9912109375, 9.3341064453125, 9.677001953125, 10.0198974609375, 10.36279296875, 10.7056884765625, 11.048583984375, 11.3914794921875, 11.734375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 8.0, 10.0, 19.0, 15.0, 27.0, 34.0, 58.0, 82.0, 98.0, 180.0, 241.0, 323.0, 441.0, 500.0, 468.0, 431.0, 318.0, 225.0, 169.0, 120.0, 99.0, 42.0, 43.0, 32.0, 20.0, 18.0, 18.0, 7.0, 9.0, 6.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.33203125, -6.10601806640625, -5.8800048828125, -5.65399169921875, -5.427978515625, -5.20196533203125, -4.9759521484375, -4.74993896484375, -4.52392578125, -4.29791259765625, -4.0718994140625, -3.84588623046875, -3.619873046875, -3.39385986328125, -3.1678466796875, -2.94183349609375, -2.7158203125, -2.48980712890625, -2.2637939453125, -2.03778076171875, -1.811767578125, -1.58575439453125, -1.3597412109375, -1.13372802734375, -0.90771484375, -0.68170166015625, -0.4556884765625, -0.22967529296875, -0.003662109375, 0.22235107421875, 0.4483642578125, 0.67437744140625, 0.900390625, 1.12640380859375, 1.3524169921875, 1.57843017578125, 1.804443359375, 2.03045654296875, 2.2564697265625, 2.48248291015625, 2.70849609375, 2.93450927734375, 3.1605224609375, 3.38653564453125, 3.612548828125, 3.83856201171875, 4.0645751953125, 4.29058837890625, 4.5166015625, 4.74261474609375, 4.9686279296875, 5.19464111328125, 5.420654296875, 5.64666748046875, 5.8726806640625, 6.09869384765625, 6.32470703125, 6.55072021484375, 6.7767333984375, 7.00274658203125, 7.228759765625, 7.45477294921875, 7.6807861328125, 7.90679931640625, 8.1328125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 8.0, 8.0, 10.0, 15.0, 21.0, 32.0, 45.0, 56.0, 61.0, 144.0, 184.0, 257.0, 390.0, 725.0, 14677.0, 4105486.0, 69929.0, 907.0, 456.0, 271.0, 203.0, 124.0, 84.0, 61.0, 41.0, 15.0, 20.0, 17.0, 13.0, 7.0, 5.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.65625, -37.628173828125, -36.60009765625, -35.572021484375, -34.5439453125, -33.515869140625, -32.48779296875, -31.459716796875, -30.431640625, -29.403564453125, -28.37548828125, -27.347412109375, -26.3193359375, -25.291259765625, -24.26318359375, -23.235107421875, -22.20703125, -21.178955078125, -20.15087890625, -19.122802734375, -18.0947265625, -17.066650390625, -16.03857421875, -15.010498046875, -13.982421875, -12.954345703125, -11.92626953125, -10.898193359375, -9.8701171875, -8.842041015625, -7.81396484375, -6.785888671875, -5.7578125, -4.729736328125, -3.70166015625, -2.673583984375, -1.6455078125, -0.617431640625, 0.41064453125, 1.438720703125, 2.466796875, 3.494873046875, 4.52294921875, 5.551025390625, 6.5791015625, 7.607177734375, 8.63525390625, 9.663330078125, 10.69140625, 11.719482421875, 12.74755859375, 13.775634765625, 14.8037109375, 15.831787109375, 16.85986328125, 17.887939453125, 18.916015625, 19.944091796875, 20.97216796875, 22.000244140625, 23.0283203125, 24.056396484375, 25.08447265625, 26.112548828125, 27.140625]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 10.0, 91.0, 430.0, 411.0, 69.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.77948760986328, -23.382638931274414, -19.985790252685547, -16.58894157409668, -13.192092895507812, -9.795244216918945, -6.398395538330078, -3.001546859741211, 0.39530181884765625, 3.7921504974365234, 7.188999176025391, 10.585847854614258, 13.982696533203125, 17.379545211791992, 20.77639389038086, 24.173242568969727, 27.570091247558594, 30.96693992614746, 34.36378860473633, 37.76063537597656, 41.15748596191406, 44.55433654785156, 47.9511833190918, 51.34803009033203, 54.74488067626953, 58.14173126220703, 61.538578033447266, 64.9354248046875, 68.332275390625, 71.7291259765625, 75.1259765625, 78.52281951904297, 81.919677734375, 85.3165283203125, 88.71337890625, 92.11022186279297, 95.50707244873047, 98.90392303466797, 102.30076599121094, 105.69761657714844, 109.09446716308594, 112.49131774902344, 115.88816833496094, 119.2850112915039, 122.6818618774414, 126.0787124633789, 129.47555541992188, 132.87240600585938, 136.26925659179688, 139.66610717773438, 143.06295776367188, 146.45980834960938, 149.85665893554688, 153.2534942626953, 156.6503448486328, 160.0471954345703, 163.4440460205078, 166.8408966064453, 170.2377471923828, 173.6345977783203, 177.03143310546875, 180.42828369140625, 183.82513427734375, 187.22198486328125, 190.61883544921875]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 6.0, 2.0, 6.0, 5.0, 11.0, 10.0, 7.0, 6.0, 13.0, 16.0, 11.0, 29.0, 19.0, 29.0, 40.0, 41.0, 31.0, 36.0, 43.0, 36.0, 51.0, 47.0, 49.0, 49.0, 36.0, 47.0, 49.0, 43.0, 28.0, 32.0, 41.0, 21.0, 26.0, 13.0, 18.0, 15.0, 10.0, 9.0, 11.0, 6.0, 0.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.824111938476562, -21.110454559326172, -20.39679527282715, -19.683137893676758, -18.969478607177734, -18.255821228027344, -17.542163848876953, -16.82850456237793, -16.114845275878906, -15.4011869430542, -14.687528610229492, -13.973871231079102, -13.260211944580078, -12.546554565429688, -11.83289623260498, -11.119237899780273, -10.405580520629883, -9.691922187805176, -8.978263854980469, -8.264606475830078, -7.550947666168213, -6.837289333343506, -6.123631477355957, -5.40997314453125, -4.696314811706543, -3.982656478881836, -3.268998384475708, -2.55534029006958, -1.841681957244873, -1.128023624420166, -0.4143657684326172, 0.29929256439208984, 1.0129528045654297, 1.7266110181808472, 2.4402692317962646, 3.1539273262023926, 3.8675856590270996, 4.581243991851807, 5.2949018478393555, 6.0085601806640625, 6.7222185134887695, 7.435876846313477, 8.149535179138184, 8.86319351196289, 9.576850891113281, 10.290510177612305, 11.004167556762695, 11.717825889587402, 12.43148422241211, 13.145142555236816, 13.858800888061523, 14.572458267211914, 15.286117553710938, 15.999774932861328, 16.71343231201172, 17.427091598510742, 18.140750885009766, 18.854408264160156, 19.56806755065918, 20.28172492980957, 20.995384216308594, 21.709041595458984, 22.422698974609375, 23.1363582611084, 23.85001564025879]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 7.0, 6.0, 12.0, 7.0, 11.0, 9.0, 13.0, 15.0, 19.0, 20.0, 25.0, 23.0, 32.0, 28.0, 24.0, 39.0, 39.0, 36.0, 32.0, 48.0, 40.0, 30.0, 45.0, 38.0, 29.0, 33.0, 30.0, 35.0, 26.0, 31.0, 32.0, 35.0, 24.0, 23.0, 14.0, 14.0, 11.0, 14.0, 5.0, 9.0, 8.0, 9.0, 8.0, 3.0, 1.0, 4.0, 4.0, 4.0, 0.0, 1.0], "bins": [-3.298828125, -3.205657958984375, -3.11248779296875, -3.019317626953125, -2.9261474609375, -2.832977294921875, -2.73980712890625, -2.646636962890625, -2.553466796875, -2.460296630859375, -2.36712646484375, -2.273956298828125, -2.1807861328125, -2.087615966796875, -1.99444580078125, -1.901275634765625, -1.80810546875, -1.714935302734375, -1.62176513671875, -1.528594970703125, -1.4354248046875, -1.342254638671875, -1.24908447265625, -1.155914306640625, -1.062744140625, -0.969573974609375, -0.87640380859375, -0.783233642578125, -0.6900634765625, -0.596893310546875, -0.50372314453125, -0.410552978515625, -0.3173828125, -0.224212646484375, -0.13104248046875, -0.037872314453125, 0.0552978515625, 0.148468017578125, 0.24163818359375, 0.334808349609375, 0.427978515625, 0.521148681640625, 0.61431884765625, 0.707489013671875, 0.8006591796875, 0.893829345703125, 0.98699951171875, 1.080169677734375, 1.17333984375, 1.266510009765625, 1.35968017578125, 1.452850341796875, 1.5460205078125, 1.639190673828125, 1.73236083984375, 1.825531005859375, 1.918701171875, 2.011871337890625, 2.10504150390625, 2.198211669921875, 2.2913818359375, 2.384552001953125, 2.47772216796875, 2.570892333984375, 2.6640625]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 9.0, 13.0, 19.0, 25.0, 33.0, 36.0, 65.0, 94.0, 157.0, 237.0, 318.0, 490.0, 707.0, 993.0, 1547.0, 2057.0, 2877.0, 4324.0, 6405.0, 9343.0, 13700.0, 20793.0, 32227.0, 50931.0, 84293.0, 154623.0, 264283.0, 160294.0, 87180.0, 51943.0, 33119.0, 21208.0, 13941.0, 9440.0, 6487.0, 4449.0, 3043.0, 2077.0, 1475.0, 991.0, 721.0, 531.0, 339.0, 213.0, 168.0, 122.0, 94.0, 58.0, 26.0, 22.0, 16.0, 7.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.479248046875, -0.4640464782714844, -0.44884490966796875, -0.4336433410644531, -0.4184417724609375, -0.4032402038574219, -0.38803863525390625, -0.3728370666503906, -0.357635498046875, -0.3424339294433594, -0.32723236083984375, -0.3120307922363281, -0.2968292236328125, -0.2816276550292969, -0.26642608642578125, -0.2512245178222656, -0.23602294921875, -0.22082138061523438, -0.20561981201171875, -0.19041824340820312, -0.1752166748046875, -0.16001510620117188, -0.14481353759765625, -0.12961196899414062, -0.114410400390625, -0.09920883178710938, -0.08400726318359375, -0.06880569458007812, -0.0536041259765625, -0.038402557373046875, -0.02320098876953125, -0.007999420166015625, 0.0072021484375, 0.022403717041015625, 0.03760528564453125, 0.052806854248046875, 0.0680084228515625, 0.08320999145507812, 0.09841156005859375, 0.11361312866210938, 0.128814697265625, 0.14401626586914062, 0.15921783447265625, 0.17441940307617188, 0.1896209716796875, 0.20482254028320312, 0.22002410888671875, 0.23522567749023438, 0.25042724609375, 0.2656288146972656, 0.28083038330078125, 0.2960319519042969, 0.3112335205078125, 0.3264350891113281, 0.34163665771484375, 0.3568382263183594, 0.372039794921875, 0.3872413635253906, 0.40244293212890625, 0.4176445007324219, 0.4328460693359375, 0.4480476379394531, 0.46324920654296875, 0.4784507751464844, 0.49365234375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 5.0, 10.0, 9.0, 5.0, 9.0, 18.0, 9.0, 14.0, 13.0, 21.0, 16.0, 18.0, 24.0, 25.0, 35.0, 22.0, 31.0, 35.0, 34.0, 40.0, 31.0, 32.0, 1059.0, 38.0, 40.0, 36.0, 38.0, 40.0, 33.0, 26.0, 27.0, 28.0, 23.0, 17.0, 29.0, 18.0, 21.0, 15.0, 17.0, 11.0, 7.0, 4.0, 7.0, 11.0, 9.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0], "bins": [-1.7978515625, -1.74188232421875, -1.6859130859375, -1.62994384765625, -1.573974609375, -1.51800537109375, -1.4620361328125, -1.40606689453125, -1.35009765625, -1.29412841796875, -1.2381591796875, -1.18218994140625, -1.126220703125, -1.07025146484375, -1.0142822265625, -0.95831298828125, -0.90234375, -0.84637451171875, -0.7904052734375, -0.73443603515625, -0.678466796875, -0.62249755859375, -0.5665283203125, -0.51055908203125, -0.45458984375, -0.39862060546875, -0.3426513671875, -0.28668212890625, -0.230712890625, -0.17474365234375, -0.1187744140625, -0.06280517578125, -0.0068359375, 0.04913330078125, 0.1051025390625, 0.16107177734375, 0.217041015625, 0.27301025390625, 0.3289794921875, 0.38494873046875, 0.44091796875, 0.49688720703125, 0.5528564453125, 0.60882568359375, 0.664794921875, 0.72076416015625, 0.7767333984375, 0.83270263671875, 0.888671875, 0.94464111328125, 1.0006103515625, 1.05657958984375, 1.112548828125, 1.16851806640625, 1.2244873046875, 1.28045654296875, 1.33642578125, 1.39239501953125, 1.4483642578125, 1.50433349609375, 1.560302734375, 1.61627197265625, 1.6722412109375, 1.72821044921875, 1.7841796875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 11.0, 9.0, 14.0, 32.0, 40.0, 69.0, 97.0, 133.0, 195.0, 312.0, 455.0, 614.0, 873.0, 1323.0, 1910.0, 2697.0, 3740.0, 5565.0, 8157.0, 12025.0, 18152.0, 27632.0, 43856.0, 72808.0, 131890.0, 1319190.0, 190860.0, 96179.0, 55855.0, 34280.0, 21985.0, 14690.0, 9678.0, 6725.0, 4602.0, 3167.0, 2222.0, 1574.0, 1082.0, 748.0, 529.0, 387.0, 243.0, 166.0, 117.0, 92.0, 52.0, 38.0, 21.0, 18.0, 11.0, 7.0, 2.0, 3.0, 2.0, 3.0, 1.0], "bins": [-0.5166015625, -0.5008277893066406, -0.48505401611328125, -0.4692802429199219, -0.4535064697265625, -0.4377326965332031, -0.42195892333984375, -0.4061851501464844, -0.390411376953125, -0.3746376037597656, -0.35886383056640625, -0.3430900573730469, -0.3273162841796875, -0.3115425109863281, -0.29576873779296875, -0.2799949645996094, -0.26422119140625, -0.24844741821289062, -0.23267364501953125, -0.21689987182617188, -0.2011260986328125, -0.18535232543945312, -0.16957855224609375, -0.15380477905273438, -0.138031005859375, -0.12225723266601562, -0.10648345947265625, -0.09070968627929688, -0.0749359130859375, -0.059162139892578125, -0.04338836669921875, -0.027614593505859375, -0.0118408203125, 0.003932952880859375, 0.01970672607421875, 0.035480499267578125, 0.0512542724609375, 0.06702804565429688, 0.08280181884765625, 0.09857559204101562, 0.114349365234375, 0.13012313842773438, 0.14589691162109375, 0.16167068481445312, 0.1774444580078125, 0.19321823120117188, 0.20899200439453125, 0.22476577758789062, 0.24053955078125, 0.2563133239746094, 0.27208709716796875, 0.2878608703613281, 0.3036346435546875, 0.3194084167480469, 0.33518218994140625, 0.3509559631347656, 0.366729736328125, 0.3825035095214844, 0.39827728271484375, 0.4140510559082031, 0.4298248291015625, 0.4455986022949219, 0.46137237548828125, 0.4771461486816406, 0.492919921875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 8.0, 7.0, 7.0, 9.0, 9.0, 13.0, 11.0, 15.0, 20.0, 22.0, 22.0, 38.0, 35.0, 43.0, 44.0, 61.0, 57.0, 56.0, 74.0, 61.0, 49.0, 56.0, 38.0, 49.0, 35.0, 23.0, 20.0, 23.0, 14.0, 15.0, 15.0, 5.0, 9.0, 10.0, 6.0, 4.0, 8.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00033974647521972656, -0.0003298148512840271, -0.00031988322734832764, -0.0003099516034126282, -0.0003000199794769287, -0.00029008835554122925, -0.0002801567316055298, -0.0002702251076698303, -0.00026029348373413086, -0.0002503618597984314, -0.00024043023586273193, -0.00023049861192703247, -0.000220566987991333, -0.00021063536405563354, -0.00020070374011993408, -0.00019077211618423462, -0.00018084049224853516, -0.0001709088683128357, -0.00016097724437713623, -0.00015104562044143677, -0.0001411139965057373, -0.00013118237257003784, -0.00012125074863433838, -0.00011131912469863892, -0.00010138750076293945, -9.145587682723999e-05, -8.152425289154053e-05, -7.159262895584106e-05, -6.16610050201416e-05, -5.172938108444214e-05, -4.1797757148742676e-05, -3.186613321304321e-05, -2.193450927734375e-05, -1.2002885341644287e-05, -2.0712614059448242e-06, 7.860362529754639e-06, 1.77919864654541e-05, 2.7723610401153564e-05, 3.765523433685303e-05, 4.758685827255249e-05, 5.751848220825195e-05, 6.745010614395142e-05, 7.738173007965088e-05, 8.731335401535034e-05, 9.72449779510498e-05, 0.00010717660188674927, 0.00011710822582244873, 0.0001270398497581482, 0.00013697147369384766, 0.00014690309762954712, 0.00015683472156524658, 0.00016676634550094604, 0.0001766979694366455, 0.00018662959337234497, 0.00019656121730804443, 0.0002064928412437439, 0.00021642446517944336, 0.00022635608911514282, 0.00023628771305084229, 0.00024621933698654175, 0.0002561509609222412, 0.0002660825848579407, 0.00027601420879364014, 0.0002859458327293396, 0.00029587745666503906]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 8.0, 6.0, 4.0, 8.0, 9.0, 7.0, 9.0, 17.0, 23.0, 23.0, 27.0, 36.0, 58.0, 54.0, 76.0, 105.0, 194.0, 363.0, 779.0, 7791.0, 1031378.0, 5795.0, 742.0, 366.0, 185.0, 118.0, 76.0, 59.0, 44.0, 36.0, 30.0, 30.0, 20.0, 17.0, 12.0, 11.0, 8.0, 11.0, 7.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.005908966064453125, -0.00570148229598999, -0.0054939985275268555, -0.005286514759063721, -0.005079030990600586, -0.004871547222137451, -0.004664063453674316, -0.004456579685211182, -0.004249095916748047, -0.004041612148284912, -0.0038341283798217773, -0.0036266446113586426, -0.003419160842895508, -0.003211677074432373, -0.0030041933059692383, -0.0027967095375061035, -0.0025892257690429688, -0.002381742000579834, -0.0021742582321166992, -0.0019667744636535645, -0.0017592906951904297, -0.001551806926727295, -0.0013443231582641602, -0.0011368393898010254, -0.0009293556213378906, -0.0007218718528747559, -0.0005143880844116211, -0.00030690431594848633, -9.942054748535156e-05, 0.0001080632209777832, 0.00031554698944091797, 0.0005230307579040527, 0.0007305145263671875, 0.0009379982948303223, 0.001145482063293457, 0.0013529658317565918, 0.0015604496002197266, 0.0017679333686828613, 0.001975417137145996, 0.002182900905609131, 0.0023903846740722656, 0.0025978684425354004, 0.002805352210998535, 0.00301283597946167, 0.0032203197479248047, 0.0034278035163879395, 0.0036352872848510742, 0.003842771053314209, 0.004050254821777344, 0.0042577385902404785, 0.004465222358703613, 0.004672706127166748, 0.004880189895629883, 0.005087673664093018, 0.005295157432556152, 0.005502641201019287, 0.005710124969482422, 0.005917608737945557, 0.006125092506408691, 0.006332576274871826, 0.006540060043334961, 0.006747543811798096, 0.0069550275802612305, 0.007162511348724365, 0.0073699951171875]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 7.0, 36.0, 127.0, 273.0, 281.0, 179.0, 78.0, 28.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006201037322171032, -0.000606104324106127, -0.0005921049742028117, -0.0005781055660918355, -0.0005641062161885202, -0.000550106808077544, -0.0005361074581742287, -0.0005221080500632524, -0.0005081087001599371, -0.0004941092920489609, -0.0004801099421456456, -0.00046611056313849986, -0.0004521111841313541, -0.0004381117760203779, -0.00042411242611706257, -0.00041011301800608635, -0.00039611360989511013, -0.00038211423088796437, -0.0003681148518808186, -0.00035411547287367284, -0.0003401160938665271, -0.00032611668575555086, -0.00031211733585223556, -0.00029811792774125934, -0.00028411857783794403, -0.00027011919883079827, -0.0002561198198236525, -0.00024212044081650674, -0.00022812104725744575, -0.0002141216682503, -0.00020012228924315423, -0.00018612289568409324, -0.00017212351667694747, -0.0001581241376698017, -0.00014412475866265595, -0.0001301253796555102, -0.0001161259860964492, -0.00010212660708930343, -8.812722808215767e-05, -7.41278417990543e-05, -6.012846279190853e-05, -4.612908014678396e-05, -3.212969750165939e-05, -1.813031849451363e-05, -4.130935849389061e-06, 9.868446795735508e-06, 2.386782580288127e-05, 3.786721208598465e-05, 5.186659109313041e-05, 6.586597010027617e-05, 7.986535638337955e-05, 9.386473539052531e-05, 0.00010786412167362869, 0.00012186350068077445, 0.0001358628796879202, 0.00014986225869506598, 0.00016386163770221174, 0.0001778610167093575, 0.00019186039571650326, 0.00020585977472364902, 0.00021985916828271002, 0.00023385854728985578, 0.00024785794084891677, 0.00026185731985606253, 0.0002758566988632083]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 1.0, 4.0, 3.0, 9.0, 17.0, 13.0, 14.0, 9.0, 17.0, 18.0, 23.0, 25.0, 20.0, 32.0, 19.0, 30.0, 41.0, 44.0, 37.0, 36.0, 50.0, 44.0, 33.0, 39.0, 35.0, 36.0, 43.0, 36.0, 29.0, 24.0, 29.0, 30.0, 22.0, 29.0, 18.0, 14.0, 16.0, 19.0, 15.0, 10.0, 5.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014156103134155273, -0.0001367218792438507, -0.00013188272714614868, -0.00012704357504844666, -0.00012220442295074463, -0.0001173652708530426, -0.00011252611875534058, -0.00010768696665763855, -0.00010284781455993652, -9.80086624622345e-05, -9.316951036453247e-05, -8.833035826683044e-05, -8.349120616912842e-05, -7.865205407142639e-05, -7.381290197372437e-05, -6.897374987602234e-05, -6.413459777832031e-05, -5.9295445680618286e-05, -5.445629358291626e-05, -4.9617141485214233e-05, -4.477798938751221e-05, -3.993883728981018e-05, -3.5099685192108154e-05, -3.0260533094406128e-05, -2.54213809967041e-05, -2.0582228899002075e-05, -1.574307680130005e-05, -1.0903924703598022e-05, -6.064772605895996e-06, -1.2256205081939697e-06, 3.6135315895080566e-06, 8.452683687210083e-06, 1.329183578491211e-05, 1.8130987882614136e-05, 2.2970139980316162e-05, 2.780929207801819e-05, 3.2648444175720215e-05, 3.748759627342224e-05, 4.232674837112427e-05, 4.7165900468826294e-05, 5.200505256652832e-05, 5.684420466423035e-05, 6.168335676193237e-05, 6.65225088596344e-05, 7.136166095733643e-05, 7.620081305503845e-05, 8.103996515274048e-05, 8.58791172504425e-05, 9.071826934814453e-05, 9.555742144584656e-05, 0.00010039657354354858, 0.00010523572564125061, 0.00011007487773895264, 0.00011491402983665466, 0.00011975318193435669, 0.00012459233403205872, 0.00012943148612976074, 0.00013427063822746277, 0.0001391097903251648, 0.00014394894242286682, 0.00014878809452056885, 0.00015362724661827087, 0.0001584663987159729, 0.00016330555081367493, 0.00016814470291137695]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 7.0, 6.0, 12.0, 7.0, 11.0, 9.0, 13.0, 15.0, 19.0, 20.0, 25.0, 23.0, 32.0, 28.0, 24.0, 39.0, 39.0, 36.0, 32.0, 48.0, 40.0, 30.0, 45.0, 38.0, 29.0, 33.0, 30.0, 35.0, 26.0, 31.0, 32.0, 35.0, 24.0, 23.0, 14.0, 14.0, 11.0, 14.0, 5.0, 9.0, 8.0, 9.0, 8.0, 3.0, 1.0, 4.0, 4.0, 4.0, 0.0, 1.0], "bins": [-3.298828125, -3.205657958984375, -3.11248779296875, -3.019317626953125, -2.9261474609375, -2.832977294921875, -2.73980712890625, -2.646636962890625, -2.553466796875, -2.460296630859375, -2.36712646484375, -2.273956298828125, -2.1807861328125, -2.087615966796875, -1.99444580078125, -1.901275634765625, -1.80810546875, -1.714935302734375, -1.62176513671875, -1.528594970703125, -1.4354248046875, -1.342254638671875, -1.24908447265625, -1.155914306640625, -1.062744140625, -0.969573974609375, -0.87640380859375, -0.783233642578125, -0.6900634765625, -0.596893310546875, -0.50372314453125, -0.410552978515625, -0.3173828125, -0.224212646484375, -0.13104248046875, -0.037872314453125, 0.0552978515625, 0.148468017578125, 0.24163818359375, 0.334808349609375, 0.427978515625, 0.521148681640625, 0.61431884765625, 0.707489013671875, 0.8006591796875, 0.893829345703125, 0.98699951171875, 1.080169677734375, 1.17333984375, 1.266510009765625, 1.35968017578125, 1.452850341796875, 1.5460205078125, 1.639190673828125, 1.73236083984375, 1.825531005859375, 1.918701171875, 2.011871337890625, 2.10504150390625, 2.198211669921875, 2.2913818359375, 2.384552001953125, 2.47772216796875, 2.570892333984375, 2.6640625]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 5.0, 6.0, 9.0, 7.0, 20.0, 14.0, 24.0, 29.0, 30.0, 39.0, 58.0, 80.0, 112.0, 142.0, 273.0, 495.0, 1010.0, 2377.0, 5800.0, 14689.0, 36508.0, 86675.0, 198967.0, 367400.0, 191269.0, 83299.0, 34925.0, 14155.0, 5571.0, 2280.0, 972.0, 476.0, 231.0, 168.0, 92.0, 72.0, 57.0, 57.0, 28.0, 30.0, 26.0, 21.0, 14.0, 15.0, 7.0, 10.0, 5.0, 3.0, 5.0, 0.0, 0.0, 1.0], "bins": [-3.607421875, -3.5057373046875, -3.404052734375, -3.3023681640625, -3.20068359375, -3.0989990234375, -2.997314453125, -2.8956298828125, -2.7939453125, -2.6922607421875, -2.590576171875, -2.4888916015625, -2.38720703125, -2.2855224609375, -2.183837890625, -2.0821533203125, -1.98046875, -1.8787841796875, -1.777099609375, -1.6754150390625, -1.57373046875, -1.4720458984375, -1.370361328125, -1.2686767578125, -1.1669921875, -1.0653076171875, -0.963623046875, -0.8619384765625, -0.76025390625, -0.6585693359375, -0.556884765625, -0.4552001953125, -0.353515625, -0.2518310546875, -0.150146484375, -0.0484619140625, 0.05322265625, 0.1549072265625, 0.256591796875, 0.3582763671875, 0.4599609375, 0.5616455078125, 0.663330078125, 0.7650146484375, 0.86669921875, 0.9683837890625, 1.070068359375, 1.1717529296875, 1.2734375, 1.3751220703125, 1.476806640625, 1.5784912109375, 1.68017578125, 1.7818603515625, 1.883544921875, 1.9852294921875, 2.0869140625, 2.1885986328125, 2.290283203125, 2.3919677734375, 2.49365234375, 2.5953369140625, 2.697021484375, 2.7987060546875, 2.900390625]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 4.0, 4.0, 3.0, 2.0, 3.0, 4.0, 8.0, 6.0, 16.0, 10.0, 14.0, 16.0, 22.0, 31.0, 19.0, 28.0, 40.0, 28.0, 35.0, 43.0, 59.0, 73.0, 148.0, 351.0, 1455.0, 164.0, 83.0, 47.0, 36.0, 34.0, 38.0, 29.0, 30.0, 19.0, 30.0, 23.0, 22.0, 17.0, 10.0, 12.0, 11.0, 6.0, 8.0, 7.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.0625, -9.7275390625, -9.392578125, -9.0576171875, -8.72265625, -8.3876953125, -8.052734375, -7.7177734375, -7.3828125, -7.0478515625, -6.712890625, -6.3779296875, -6.04296875, -5.7080078125, -5.373046875, -5.0380859375, -4.703125, -4.3681640625, -4.033203125, -3.6982421875, -3.36328125, -3.0283203125, -2.693359375, -2.3583984375, -2.0234375, -1.6884765625, -1.353515625, -1.0185546875, -0.68359375, -0.3486328125, -0.013671875, 0.3212890625, 0.65625, 0.9912109375, 1.326171875, 1.6611328125, 1.99609375, 2.3310546875, 2.666015625, 3.0009765625, 3.3359375, 3.6708984375, 4.005859375, 4.3408203125, 4.67578125, 5.0107421875, 5.345703125, 5.6806640625, 6.015625, 6.3505859375, 6.685546875, 7.0205078125, 7.35546875, 7.6904296875, 8.025390625, 8.3603515625, 8.6953125, 9.0302734375, 9.365234375, 9.7001953125, 10.03515625, 10.3701171875, 10.705078125, 11.0400390625, 11.375]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 5.0, 10.0, 7.0, 6.0, 11.0, 11.0, 19.0, 13.0, 17.0, 27.0, 32.0, 54.0, 80.0, 116.0, 180.0, 280.0, 611.0, 1715.0, 528739.0, 2609977.0, 2233.0, 634.0, 319.0, 162.0, 116.0, 79.0, 60.0, 48.0, 32.0, 19.0, 22.0, 12.0, 15.0, 9.0, 8.0, 7.0, 6.0, 3.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.1875, -39.8173828125, -38.447265625, -37.0771484375, -35.70703125, -34.3369140625, -32.966796875, -31.5966796875, -30.2265625, -28.8564453125, -27.486328125, -26.1162109375, -24.74609375, -23.3759765625, -22.005859375, -20.6357421875, -19.265625, -17.8955078125, -16.525390625, -15.1552734375, -13.78515625, -12.4150390625, -11.044921875, -9.6748046875, -8.3046875, -6.9345703125, -5.564453125, -4.1943359375, -2.82421875, -1.4541015625, -0.083984375, 1.2861328125, 2.65625, 4.0263671875, 5.396484375, 6.7666015625, 8.13671875, 9.5068359375, 10.876953125, 12.2470703125, 13.6171875, 14.9873046875, 16.357421875, 17.7275390625, 19.09765625, 20.4677734375, 21.837890625, 23.2080078125, 24.578125, 25.9482421875, 27.318359375, 28.6884765625, 30.05859375, 31.4287109375, 32.798828125, 34.1689453125, 35.5390625, 36.9091796875, 38.279296875, 39.6494140625, 41.01953125, 42.3896484375, 43.759765625, 45.1298828125, 46.5]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 7.0, 27.0, 153.0, 347.0, 315.0, 141.0, 22.0, 2.0, 2.0, 0.0, 1.0], "bins": [-69.21880340576172, -68.00346374511719, -66.78813171386719, -65.57279205322266, -64.35745239257812, -63.14211654663086, -61.926780700683594, -60.71144104003906, -59.4961051940918, -58.28076934814453, -57.0654296875, -55.850093841552734, -54.63475799560547, -53.41941833496094, -52.20408248901367, -50.988746643066406, -49.773406982421875, -48.55807113647461, -47.34273147583008, -46.12739562988281, -44.91205596923828, -43.696720123291016, -42.48138427734375, -41.26604461669922, -40.05070877075195, -38.83537292480469, -37.620033264160156, -36.40469741821289, -35.189361572265625, -33.974021911621094, -32.75868606567383, -31.54334831237793, -30.32801055908203, -29.112672805786133, -27.897335052490234, -26.68199920654297, -25.46666145324707, -24.251323699951172, -23.035987854003906, -21.820650100708008, -20.60531234741211, -19.38997459411621, -18.174636840820312, -16.959300994873047, -15.743963241577148, -14.52862548828125, -13.313288688659668, -12.097951889038086, -10.882614135742188, -9.667276382446289, -8.451939582824707, -7.236602306365967, -6.021265029907227, -4.805927753448486, -3.590590476989746, -2.375253677368164, -1.1599159240722656, 0.05542135238647461, 1.2707586288452148, 2.486095905303955, 3.7014331817626953, 4.9167704582214355, 6.132107734680176, 7.347444534301758, 8.562782287597656]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 4.0, 2.0, 7.0, 6.0, 9.0, 9.0, 8.0, 14.0, 13.0, 17.0, 23.0, 19.0, 25.0, 19.0, 31.0, 24.0, 35.0, 29.0, 37.0, 26.0, 40.0, 41.0, 38.0, 44.0, 35.0, 40.0, 41.0, 25.0, 33.0, 34.0, 31.0, 20.0, 32.0, 20.0, 27.0, 26.0, 21.0, 16.0, 15.0, 21.0, 6.0, 12.0, 7.0, 7.0, 6.0, 9.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.22670555114746, -20.48387336730957, -19.741043090820312, -18.998210906982422, -18.25537872314453, -17.512548446655273, -16.769716262817383, -16.026885986328125, -15.284053802490234, -14.54122257232666, -13.798391342163086, -13.055559158325195, -12.312727928161621, -11.569896697998047, -10.827064514160156, -10.084233283996582, -9.341402053833008, -8.598570823669434, -7.855739116668701, -7.112907409667969, -6.3700761795043945, -5.62724494934082, -4.884413242340088, -4.1415815353393555, -3.3987503051757812, -2.655918836593628, -1.9130873680114746, -1.1702558994293213, -0.42742443084716797, 0.31540703773498535, 1.0582385063171387, 1.801070213317871, 2.543903350830078, 3.2867348194122314, 4.029566287994385, 4.772397994995117, 5.515229225158691, 6.258060455322266, 7.000892162322998, 7.7437238693237305, 8.486555099487305, 9.229386329650879, 9.972217559814453, 10.715049743652344, 11.457880973815918, 12.200712203979492, 12.943544387817383, 13.686375617980957, 14.429206848144531, 15.172038078308105, 15.91486930847168, 16.65770149230957, 17.400531768798828, 18.14336395263672, 18.88619613647461, 19.6290283203125, 20.371858596801758, 21.11469078063965, 21.857521057128906, 22.600353240966797, 23.343185424804688, 24.086015701293945, 24.828847885131836, 25.571678161621094, 26.314510345458984]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 6.0, 8.0, 3.0, 8.0, 8.0, 13.0, 12.0, 11.0, 15.0, 24.0, 16.0, 28.0, 22.0, 24.0, 26.0, 31.0, 31.0, 31.0, 25.0, 40.0, 55.0, 43.0, 41.0, 31.0, 30.0, 35.0, 33.0, 37.0, 23.0, 30.0, 28.0, 26.0, 31.0, 23.0, 22.0, 19.0, 20.0, 21.0, 15.0, 19.0, 9.0, 5.0, 9.0, 3.0, 2.0, 3.0, 4.0, 5.0, 2.0, 0.0, 1.0, 3.0, 1.0], "bins": [-3.47265625, -3.370147705078125, -3.26763916015625, -3.165130615234375, -3.0626220703125, -2.960113525390625, -2.85760498046875, -2.755096435546875, -2.652587890625, -2.550079345703125, -2.44757080078125, -2.345062255859375, -2.2425537109375, -2.140045166015625, -2.03753662109375, -1.935028076171875, -1.83251953125, -1.730010986328125, -1.62750244140625, -1.524993896484375, -1.4224853515625, -1.319976806640625, -1.21746826171875, -1.114959716796875, -1.012451171875, -0.909942626953125, -0.80743408203125, -0.704925537109375, -0.6024169921875, -0.499908447265625, -0.39739990234375, -0.294891357421875, -0.1923828125, -0.089874267578125, 0.01263427734375, 0.115142822265625, 0.2176513671875, 0.320159912109375, 0.42266845703125, 0.525177001953125, 0.627685546875, 0.730194091796875, 0.83270263671875, 0.935211181640625, 1.0377197265625, 1.140228271484375, 1.24273681640625, 1.345245361328125, 1.44775390625, 1.550262451171875, 1.65277099609375, 1.755279541015625, 1.8577880859375, 1.960296630859375, 2.06280517578125, 2.165313720703125, 2.267822265625, 2.370330810546875, 2.47283935546875, 2.575347900390625, 2.6778564453125, 2.780364990234375, 2.88287353515625, 2.985382080078125, 3.087890625]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 5.0, 7.0, 10.0, 4.0, 8.0, 10.0, 18.0, 23.0, 19.0, 27.0, 26.0, 36.0, 45.0, 55.0, 54.0, 93.0, 103.0, 139.0, 204.0, 432.0, 1782.0, 32566.0, 1352374.0, 2666509.0, 133785.0, 4243.0, 699.0, 246.0, 134.0, 122.0, 99.0, 75.0, 56.0, 46.0, 45.0, 31.0, 29.0, 24.0, 26.0, 18.0, 17.0, 7.0, 10.0, 10.0, 0.0, 4.0, 0.0, 4.0, 3.0, 2.0, 3.0, 0.0, 3.0], "bins": [-11.296875, -10.96630859375, -10.6357421875, -10.30517578125, -9.974609375, -9.64404296875, -9.3134765625, -8.98291015625, -8.65234375, -8.32177734375, -7.9912109375, -7.66064453125, -7.330078125, -6.99951171875, -6.6689453125, -6.33837890625, -6.0078125, -5.67724609375, -5.3466796875, -5.01611328125, -4.685546875, -4.35498046875, -4.0244140625, -3.69384765625, -3.36328125, -3.03271484375, -2.7021484375, -2.37158203125, -2.041015625, -1.71044921875, -1.3798828125, -1.04931640625, -0.71875, -0.38818359375, -0.0576171875, 0.27294921875, 0.603515625, 0.93408203125, 1.2646484375, 1.59521484375, 1.92578125, 2.25634765625, 2.5869140625, 2.91748046875, 3.248046875, 3.57861328125, 3.9091796875, 4.23974609375, 4.5703125, 4.90087890625, 5.2314453125, 5.56201171875, 5.892578125, 6.22314453125, 6.5537109375, 6.88427734375, 7.21484375, 7.54541015625, 7.8759765625, 8.20654296875, 8.537109375, 8.86767578125, 9.1982421875, 9.52880859375, 9.859375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 10.0, 13.0, 10.0, 14.0, 17.0, 22.0, 28.0, 28.0, 48.0, 72.0, 78.0, 122.0, 137.0, 198.0, 286.0, 381.0, 447.0, 459.0, 419.0, 341.0, 240.0, 185.0, 140.0, 97.0, 62.0, 53.0, 46.0, 27.0, 21.0, 20.0, 13.0, 12.0, 8.0, 6.0, 5.0, 7.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.7890625, -6.5909423828125, -6.392822265625, -6.1947021484375, -5.99658203125, -5.7984619140625, -5.600341796875, -5.4022216796875, -5.2041015625, -5.0059814453125, -4.807861328125, -4.6097412109375, -4.41162109375, -4.2135009765625, -4.015380859375, -3.8172607421875, -3.619140625, -3.4210205078125, -3.222900390625, -3.0247802734375, -2.82666015625, -2.6285400390625, -2.430419921875, -2.2322998046875, -2.0341796875, -1.8360595703125, -1.637939453125, -1.4398193359375, -1.24169921875, -1.0435791015625, -0.845458984375, -0.6473388671875, -0.44921875, -0.2510986328125, -0.052978515625, 0.1451416015625, 0.34326171875, 0.5413818359375, 0.739501953125, 0.9376220703125, 1.1357421875, 1.3338623046875, 1.531982421875, 1.7301025390625, 1.92822265625, 2.1263427734375, 2.324462890625, 2.5225830078125, 2.720703125, 2.9188232421875, 3.116943359375, 3.3150634765625, 3.51318359375, 3.7113037109375, 3.909423828125, 4.1075439453125, 4.3056640625, 4.5037841796875, 4.701904296875, 4.9000244140625, 5.09814453125, 5.2962646484375, 5.494384765625, 5.6925048828125, 5.890625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 6.0, 7.0, 4.0, 8.0, 15.0, 15.0, 18.0, 28.0, 37.0, 40.0, 71.0, 87.0, 124.0, 191.0, 277.0, 402.0, 667.0, 13883.0, 4068152.0, 107829.0, 956.0, 406.0, 279.0, 209.0, 144.0, 116.0, 81.0, 54.0, 42.0, 31.0, 25.0, 16.0, 18.0, 10.0, 11.0, 8.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-29.875, -28.8671875, -27.859375, -26.8515625, -25.84375, -24.8359375, -23.828125, -22.8203125, -21.8125, -20.8046875, -19.796875, -18.7890625, -17.78125, -16.7734375, -15.765625, -14.7578125, -13.75, -12.7421875, -11.734375, -10.7265625, -9.71875, -8.7109375, -7.703125, -6.6953125, -5.6875, -4.6796875, -3.671875, -2.6640625, -1.65625, -0.6484375, 0.359375, 1.3671875, 2.375, 3.3828125, 4.390625, 5.3984375, 6.40625, 7.4140625, 8.421875, 9.4296875, 10.4375, 11.4453125, 12.453125, 13.4609375, 14.46875, 15.4765625, 16.484375, 17.4921875, 18.5, 19.5078125, 20.515625, 21.5234375, 22.53125, 23.5390625, 24.546875, 25.5546875, 26.5625, 27.5703125, 28.578125, 29.5859375, 30.59375, 31.6015625, 32.609375, 33.6171875, 34.625]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 48.0, 152.0, 313.0, 313.0, 143.0, 34.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.572322845458984, -29.463878631591797, -27.355432510375977, -25.246986389160156, -23.13854217529297, -21.03009796142578, -18.92165184020996, -16.81320571899414, -14.704761505126953, -12.59631633758545, -10.487871170043945, -8.379426002502441, -6.2709808349609375, -4.162535667419434, -2.0540904998779297, 0.05435466766357422, 2.162799835205078, 4.271245002746582, 6.379690170288086, 8.48813533782959, 10.596580505371094, 12.705025672912598, 14.813470840454102, 16.921916961669922, 19.03036117553711, 21.138805389404297, 23.247251510620117, 25.355697631835938, 27.464141845703125, 29.572586059570312, 31.681032180786133, 33.78947830200195, 35.897926330566406, 38.006370544433594, 40.11481475830078, 42.223262786865234, 44.33170700073242, 46.44015121459961, 48.54859924316406, 50.65704345703125, 52.76548767089844, 54.873931884765625, 56.98237609863281, 59.090824127197266, 61.19926834106445, 63.30771255493164, 65.4161605834961, 67.52460479736328, 69.63304901123047, 71.74149322509766, 73.84993743896484, 75.95838165283203, 78.06683349609375, 80.17527770996094, 82.28372192382812, 84.39216613769531, 86.5006103515625, 88.60905456542969, 90.71749877929688, 92.82594299316406, 94.93438720703125, 97.04283905029297, 99.15128326416016, 101.25972747802734, 103.36817169189453]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 10.0, 4.0, 5.0, 8.0, 7.0, 11.0, 12.0, 15.0, 16.0, 25.0, 18.0, 24.0, 32.0, 28.0, 30.0, 31.0, 47.0, 39.0, 36.0, 49.0, 36.0, 40.0, 36.0, 33.0, 46.0, 40.0, 52.0, 39.0, 32.0, 28.0, 30.0, 18.0, 20.0, 19.0, 12.0, 16.0, 18.0, 9.0, 9.0, 6.0, 6.0, 4.0, 6.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.979713439941406, -22.316659927368164, -21.653608322143555, -20.990554809570312, -20.327503204345703, -19.66444969177246, -19.00139808654785, -18.33834457397461, -17.67529296875, -17.012239456176758, -16.34918785095215, -15.686135292053223, -15.023082733154297, -14.360029220581055, -13.696976661682129, -13.033924102783203, -12.370870590209961, -11.707818031311035, -11.04476547241211, -10.381712913513184, -9.718660354614258, -9.055606842041016, -8.39255428314209, -7.729501724243164, -7.066449165344238, -6.4033966064453125, -5.740344047546387, -5.077291011810303, -4.414238452911377, -3.751185894012451, -3.0881330966949463, -2.4250802993774414, -1.7620258331298828, -1.0989731550216675, -0.43592047691345215, 0.22713220119476318, 0.8901848793029785, 1.5532374382019043, 2.216290235519409, 2.879343032836914, 3.54239559173584, 4.205448150634766, 4.868500709533691, 5.531553745269775, 6.194606304168701, 6.857658863067627, 7.520711898803711, 8.183764457702637, 8.846817016601562, 9.509869575500488, 10.172922134399414, 10.83597469329834, 11.499027252197266, 12.162080764770508, 12.825133323669434, 13.48818588256836, 14.151238441467285, 14.814291000366211, 15.477343559265137, 16.140396118164062, 16.803449630737305, 17.466501235961914, 18.129554748535156, 18.792606353759766, 19.455659866333008]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 8.0, 8.0, 2.0, 5.0, 9.0, 12.0, 20.0, 19.0, 20.0, 24.0, 14.0, 34.0, 24.0, 33.0, 26.0, 28.0, 32.0, 32.0, 29.0, 45.0, 54.0, 31.0, 44.0, 39.0, 37.0, 38.0, 39.0, 44.0, 42.0, 33.0, 21.0, 30.0, 24.0, 19.0, 21.0, 15.0, 9.0, 7.0, 11.0, 9.0, 3.0, 5.0, 2.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.580078125, -3.472930908203125, -3.36578369140625, -3.258636474609375, -3.1514892578125, -3.044342041015625, -2.93719482421875, -2.830047607421875, -2.722900390625, -2.615753173828125, -2.50860595703125, -2.401458740234375, -2.2943115234375, -2.187164306640625, -2.08001708984375, -1.972869873046875, -1.86572265625, -1.758575439453125, -1.65142822265625, -1.544281005859375, -1.4371337890625, -1.329986572265625, -1.22283935546875, -1.115692138671875, -1.008544921875, -0.901397705078125, -0.79425048828125, -0.687103271484375, -0.5799560546875, -0.472808837890625, -0.36566162109375, -0.258514404296875, -0.1513671875, -0.044219970703125, 0.06292724609375, 0.170074462890625, 0.2772216796875, 0.384368896484375, 0.49151611328125, 0.598663330078125, 0.705810546875, 0.812957763671875, 0.92010498046875, 1.027252197265625, 1.1343994140625, 1.241546630859375, 1.34869384765625, 1.455841064453125, 1.56298828125, 1.670135498046875, 1.77728271484375, 1.884429931640625, 1.9915771484375, 2.098724365234375, 2.20587158203125, 2.313018798828125, 2.420166015625, 2.527313232421875, 2.63446044921875, 2.741607666015625, 2.8487548828125, 2.955902099609375, 3.06304931640625, 3.170196533203125, 3.27734375]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 4.0, 2.0, 7.0, 7.0, 28.0, 25.0, 24.0, 38.0, 75.0, 111.0, 153.0, 232.0, 304.0, 465.0, 708.0, 994.0, 1375.0, 2013.0, 2846.0, 4301.0, 6010.0, 8886.0, 12490.0, 18304.0, 26968.0, 40852.0, 64013.0, 107949.0, 212449.0, 224806.0, 113778.0, 66679.0, 42513.0, 27692.0, 18796.0, 13148.0, 8884.0, 6214.0, 4451.0, 3141.0, 2034.0, 1442.0, 1045.0, 746.0, 438.0, 347.0, 257.0, 161.0, 121.0, 69.0, 57.0, 38.0, 26.0, 25.0, 6.0, 11.0, 3.0, 6.0, 2.0, 0.0, 3.0], "bins": [-0.52685546875, -0.5104141235351562, -0.4939727783203125, -0.47753143310546875, -0.461090087890625, -0.44464874267578125, -0.4282073974609375, -0.41176605224609375, -0.39532470703125, -0.37888336181640625, -0.3624420166015625, -0.34600067138671875, -0.329559326171875, -0.31311798095703125, -0.2966766357421875, -0.28023529052734375, -0.2637939453125, -0.24735260009765625, -0.2309112548828125, -0.21446990966796875, -0.198028564453125, -0.18158721923828125, -0.1651458740234375, -0.14870452880859375, -0.13226318359375, -0.11582183837890625, -0.0993804931640625, -0.08293914794921875, -0.066497802734375, -0.05005645751953125, -0.0336151123046875, -0.01717376708984375, -0.000732421875, 0.01570892333984375, 0.0321502685546875, 0.04859161376953125, 0.065032958984375, 0.08147430419921875, 0.0979156494140625, 0.11435699462890625, 0.13079833984375, 0.14723968505859375, 0.1636810302734375, 0.18012237548828125, 0.196563720703125, 0.21300506591796875, 0.2294464111328125, 0.24588775634765625, 0.2623291015625, 0.27877044677734375, 0.2952117919921875, 0.31165313720703125, 0.328094482421875, 0.34453582763671875, 0.3609771728515625, 0.37741851806640625, 0.39385986328125, 0.41030120849609375, 0.4267425537109375, 0.44318389892578125, 0.459625244140625, 0.47606658935546875, 0.4925079345703125, 0.5089492797851562, 0.525390625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 2.0, 6.0, 4.0, 8.0, 7.0, 8.0, 9.0, 9.0, 20.0, 14.0, 17.0, 21.0, 23.0, 27.0, 27.0, 21.0, 36.0, 30.0, 23.0, 38.0, 32.0, 41.0, 39.0, 42.0, 1057.0, 42.0, 51.0, 34.0, 35.0, 25.0, 35.0, 32.0, 24.0, 26.0, 28.0, 26.0, 15.0, 11.0, 15.0, 16.0, 7.0, 9.0, 9.0, 9.0, 2.0, 5.0, 1.0, 6.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.9033203125, -1.842681884765625, -1.78204345703125, -1.721405029296875, -1.6607666015625, -1.600128173828125, -1.53948974609375, -1.478851318359375, -1.418212890625, -1.357574462890625, -1.29693603515625, -1.236297607421875, -1.1756591796875, -1.115020751953125, -1.05438232421875, -0.993743896484375, -0.93310546875, -0.872467041015625, -0.81182861328125, -0.751190185546875, -0.6905517578125, -0.629913330078125, -0.56927490234375, -0.508636474609375, -0.447998046875, -0.387359619140625, -0.32672119140625, -0.266082763671875, -0.2054443359375, -0.144805908203125, -0.08416748046875, -0.023529052734375, 0.037109375, 0.097747802734375, 0.15838623046875, 0.219024658203125, 0.2796630859375, 0.340301513671875, 0.40093994140625, 0.461578369140625, 0.522216796875, 0.582855224609375, 0.64349365234375, 0.704132080078125, 0.7647705078125, 0.825408935546875, 0.88604736328125, 0.946685791015625, 1.00732421875, 1.067962646484375, 1.12860107421875, 1.189239501953125, 1.2498779296875, 1.310516357421875, 1.37115478515625, 1.431793212890625, 1.492431640625, 1.553070068359375, 1.61370849609375, 1.674346923828125, 1.7349853515625, 1.795623779296875, 1.85626220703125, 1.916900634765625, 1.9775390625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 5.0, 10.0, 7.0, 18.0, 41.0, 48.0, 64.0, 89.0, 141.0, 190.0, 289.0, 392.0, 534.0, 825.0, 1153.0, 1567.0, 2190.0, 3289.0, 4575.0, 6722.0, 9891.0, 14788.0, 22682.0, 35484.0, 57403.0, 98210.0, 197229.0, 1315729.0, 125963.0, 70962.0, 43171.0, 27499.0, 17915.0, 11998.0, 8029.0, 5571.0, 3780.0, 2637.0, 1781.0, 1302.0, 888.0, 619.0, 456.0, 340.0, 204.0, 141.0, 96.0, 65.0, 59.0, 35.0, 21.0, 15.0, 10.0, 7.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.50830078125, -0.49201202392578125, -0.4757232666015625, -0.45943450927734375, -0.443145751953125, -0.42685699462890625, -0.4105682373046875, -0.39427947998046875, -0.37799072265625, -0.36170196533203125, -0.3454132080078125, -0.32912445068359375, -0.312835693359375, -0.29654693603515625, -0.2802581787109375, -0.26396942138671875, -0.2476806640625, -0.23139190673828125, -0.2151031494140625, -0.19881439208984375, -0.182525634765625, -0.16623687744140625, -0.1499481201171875, -0.13365936279296875, -0.11737060546875, -0.10108184814453125, -0.0847930908203125, -0.06850433349609375, -0.052215576171875, -0.03592681884765625, -0.0196380615234375, -0.00334930419921875, 0.012939453125, 0.02922821044921875, 0.0455169677734375, 0.06180572509765625, 0.078094482421875, 0.09438323974609375, 0.1106719970703125, 0.12696075439453125, 0.14324951171875, 0.15953826904296875, 0.1758270263671875, 0.19211578369140625, 0.208404541015625, 0.22469329833984375, 0.2409820556640625, 0.25727081298828125, 0.2735595703125, 0.28984832763671875, 0.3061370849609375, 0.32242584228515625, 0.338714599609375, 0.35500335693359375, 0.3712921142578125, 0.38758087158203125, 0.40386962890625, 0.42015838623046875, 0.4364471435546875, 0.45273590087890625, 0.469024658203125, 0.48531341552734375, 0.5016021728515625, 0.5178909301757812, 0.5341796875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 0.0, 1.0, 4.0, 9.0, 13.0, 11.0, 18.0, 31.0, 34.0, 56.0, 64.0, 93.0, 73.0, 76.0, 99.0, 81.0, 70.0, 87.0, 43.0, 40.0, 26.0, 17.0, 17.0, 16.0, 8.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000591278076171875, -0.0005702376365661621, -0.0005491971969604492, -0.0005281567573547363, -0.0005071163177490234, -0.00048607587814331055, -0.00046503543853759766, -0.00044399499893188477, -0.0004229545593261719, -0.000401914119720459, -0.0003808736801147461, -0.0003598332405090332, -0.0003387928009033203, -0.0003177523612976074, -0.00029671192169189453, -0.00027567148208618164, -0.00025463104248046875, -0.00023359060287475586, -0.00021255016326904297, -0.00019150972366333008, -0.0001704692840576172, -0.0001494288444519043, -0.0001283884048461914, -0.00010734796524047852, -8.630752563476562e-05, -6.526708602905273e-05, -4.4226646423339844e-05, -2.3186206817626953e-05, -2.1457672119140625e-06, 1.8894672393798828e-05, 3.993511199951172e-05, 6.097555160522461e-05, 8.20159912109375e-05, 0.00010305643081665039, 0.00012409687042236328, 0.00014513731002807617, 0.00016617774963378906, 0.00018721818923950195, 0.00020825862884521484, 0.00022929906845092773, 0.0002503395080566406, 0.0002713799476623535, 0.0002924203872680664, 0.0003134608268737793, 0.0003345012664794922, 0.0003555417060852051, 0.00037658214569091797, 0.00039762258529663086, 0.00041866302490234375, 0.00043970346450805664, 0.00046074390411376953, 0.0004817843437194824, 0.0005028247833251953, 0.0005238652229309082, 0.0005449056625366211, 0.000565946102142334, 0.0005869865417480469, 0.0006080269813537598, 0.0006290674209594727, 0.0006501078605651855, 0.0006711483001708984, 0.0006921887397766113, 0.0007132291793823242, 0.0007342696189880371, 0.00075531005859375]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 2.0, 5.0, 5.0, 9.0, 9.0, 14.0, 29.0, 41.0, 47.0, 49.0, 114.0, 142.0, 291.0, 830.0, 38302.0, 1006473.0, 1250.0, 376.0, 194.0, 120.0, 87.0, 58.0, 27.0, 23.0, 19.0, 13.0, 7.0, 4.0, 3.0, 5.0, 4.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.0155487060546875, -0.015118718147277832, -0.014688730239868164, -0.014258742332458496, -0.013828754425048828, -0.01339876651763916, -0.012968778610229492, -0.012538790702819824, -0.012108802795410156, -0.011678814888000488, -0.01124882698059082, -0.010818839073181152, -0.010388851165771484, -0.009958863258361816, -0.009528875350952148, -0.00909888744354248, -0.008668899536132812, -0.008238911628723145, -0.0078089237213134766, -0.007378935813903809, -0.006948947906494141, -0.006518959999084473, -0.006088972091674805, -0.005658984184265137, -0.005228996276855469, -0.004799008369445801, -0.004369020462036133, -0.003939032554626465, -0.003509044647216797, -0.003079056739807129, -0.002649068832397461, -0.002219080924987793, -0.001789093017578125, -0.001359105110168457, -0.0009291172027587891, -0.0004991292953491211, -6.914138793945312e-05, 0.00036084651947021484, 0.0007908344268798828, 0.0012208223342895508, 0.0016508102416992188, 0.0020807981491088867, 0.0025107860565185547, 0.0029407739639282227, 0.0033707618713378906, 0.0038007497787475586, 0.0042307376861572266, 0.0046607255935668945, 0.0050907135009765625, 0.0055207014083862305, 0.0059506893157958984, 0.006380677223205566, 0.006810665130615234, 0.007240653038024902, 0.00767064094543457, 0.008100628852844238, 0.008530616760253906, 0.008960604667663574, 0.009390592575073242, 0.00982058048248291, 0.010250568389892578, 0.010680556297302246, 0.011110544204711914, 0.011540532112121582, 0.01197052001953125]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 41.0, 352.0, 510.0, 101.0, 5.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.0020160379353910685, -0.001980794593691826, -0.001945551368407905, -0.0019103080267086625, -0.00187506468500942, -0.0018398214597254992, -0.0018045781180262566, -0.001769334776327014, -0.0017340915510430932, -0.0016988482093438506, -0.0016636049840599298, -0.0016283616423606873, -0.0015931183006614447, -0.001557875075377524, -0.0015226317336782813, -0.0014873885083943605, -0.001452145166695118, -0.0014169018249958754, -0.0013816585997119546, -0.001346415258012712, -0.0013111719163134694, -0.0012759286910295486, -0.001240685349330306, -0.0012054420076310635, -0.0011701986659318209, -0.0011349553242325783, -0.0010997120989486575, -0.001064468757249415, -0.0010292254155501723, -0.0009939821902662516, -0.000958738848567009, -0.0009234955650754273, -0.0008882522815838456, -0.0008530089980922639, -0.0008177656563930213, -0.0007825223729014397, -0.000747279089409858, -0.0007120358059182763, -0.0006767924642190337, -0.000641549180727452, -0.0006063058972358704, -0.0005710626137442887, -0.0005358192720450461, -0.0005005759885534644, -0.00046533270506188273, -0.0004300893924664706, -0.00039484607987105846, -0.0003596027963794768, -0.0003243594546802342, -0.00028911614208482206, -0.0002538728585932404, -0.00021862954599782825, -0.00018338624795433134, -0.00014814294991083443, -0.0001128996373154223, -7.765635382384062e-05, -4.241304122842848e-05, -7.169739546952769e-06, 2.8073562134522945e-05, 6.331686745397747e-05, 9.856016549747437e-05, 0.00013380346354097128, 0.00016904677613638341, 0.0002042900596279651, 0.00023953337222337723]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 5.0, 5.0, 7.0, 5.0, 8.0, 12.0, 12.0, 11.0, 17.0, 17.0, 21.0, 25.0, 37.0, 22.0, 23.0, 35.0, 37.0, 29.0, 30.0, 50.0, 38.0, 44.0, 63.0, 40.0, 32.0, 42.0, 31.0, 39.0, 22.0, 37.0, 30.0, 22.0, 35.0, 18.0, 16.0, 17.0, 12.0, 14.0, 8.0, 9.0, 5.0, 5.0, 4.0, 7.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00023794174194335938, -0.00023050233721733093, -0.0002230629324913025, -0.00021562352776527405, -0.0002081841230392456, -0.00020074471831321716, -0.00019330531358718872, -0.00018586590886116028, -0.00017842650413513184, -0.0001709870994091034, -0.00016354769468307495, -0.0001561082899570465, -0.00014866888523101807, -0.00014122948050498962, -0.00013379007577896118, -0.00012635067105293274, -0.0001189112663269043, -0.00011147186160087585, -0.00010403245687484741, -9.659305214881897e-05, -8.915364742279053e-05, -8.171424269676208e-05, -7.427483797073364e-05, -6.68354332447052e-05, -5.939602851867676e-05, -5.1956623792648315e-05, -4.451721906661987e-05, -3.707781434059143e-05, -2.9638409614562988e-05, -2.2199004888534546e-05, -1.4759600162506104e-05, -7.320195436477661e-06, 1.1920928955078125e-07, 7.558614015579224e-06, 1.4998018741607666e-05, 2.243742346763611e-05, 2.987682819366455e-05, 3.731623291969299e-05, 4.4755637645721436e-05, 5.219504237174988e-05, 5.963444709777832e-05, 6.707385182380676e-05, 7.45132565498352e-05, 8.195266127586365e-05, 8.939206600189209e-05, 9.683147072792053e-05, 0.00010427087545394897, 0.00011171028017997742, 0.00011914968490600586, 0.0001265890896320343, 0.00013402849435806274, 0.0001414678990840912, 0.00014890730381011963, 0.00015634670853614807, 0.00016378611326217651, 0.00017122551798820496, 0.0001786649227142334, 0.00018610432744026184, 0.00019354373216629028, 0.00020098313689231873, 0.00020842254161834717, 0.0002158619463443756, 0.00022330135107040405, 0.0002307407557964325, 0.00023818016052246094]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 8.0, 8.0, 2.0, 5.0, 9.0, 12.0, 20.0, 19.0, 20.0, 24.0, 14.0, 34.0, 24.0, 33.0, 26.0, 28.0, 32.0, 32.0, 29.0, 45.0, 54.0, 31.0, 44.0, 39.0, 37.0, 38.0, 39.0, 44.0, 42.0, 33.0, 21.0, 30.0, 24.0, 19.0, 21.0, 15.0, 9.0, 7.0, 11.0, 9.0, 3.0, 5.0, 2.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.580078125, -3.472930908203125, -3.36578369140625, -3.258636474609375, -3.1514892578125, -3.044342041015625, -2.93719482421875, -2.830047607421875, -2.722900390625, -2.615753173828125, -2.50860595703125, -2.401458740234375, -2.2943115234375, -2.187164306640625, -2.08001708984375, -1.972869873046875, -1.86572265625, -1.758575439453125, -1.65142822265625, -1.544281005859375, -1.4371337890625, -1.329986572265625, -1.22283935546875, -1.115692138671875, -1.008544921875, -0.901397705078125, -0.79425048828125, -0.687103271484375, -0.5799560546875, -0.472808837890625, -0.36566162109375, -0.258514404296875, -0.1513671875, -0.044219970703125, 0.06292724609375, 0.170074462890625, 0.2772216796875, 0.384368896484375, 0.49151611328125, 0.598663330078125, 0.705810546875, 0.812957763671875, 0.92010498046875, 1.027252197265625, 1.1343994140625, 1.241546630859375, 1.34869384765625, 1.455841064453125, 1.56298828125, 1.670135498046875, 1.77728271484375, 1.884429931640625, 1.9915771484375, 2.098724365234375, 2.20587158203125, 2.313018798828125, 2.420166015625, 2.527313232421875, 2.63446044921875, 2.741607666015625, 2.8487548828125, 2.955902099609375, 3.06304931640625, 3.170196533203125, 3.27734375]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 4.0, 6.0, 8.0, 10.0, 11.0, 16.0, 24.0, 24.0, 27.0, 37.0, 53.0, 62.0, 98.0, 126.0, 169.0, 264.0, 567.0, 1548.0, 7210.0, 46621.0, 328456.0, 572347.0, 75160.0, 11730.0, 2138.0, 719.0, 369.0, 203.0, 141.0, 108.0, 63.0, 62.0, 44.0, 31.0, 20.0, 19.0, 15.0, 10.0, 15.0, 6.0, 2.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.7265625, -7.50018310546875, -7.2738037109375, -7.04742431640625, -6.821044921875, -6.59466552734375, -6.3682861328125, -6.14190673828125, -5.91552734375, -5.68914794921875, -5.4627685546875, -5.23638916015625, -5.010009765625, -4.78363037109375, -4.5572509765625, -4.33087158203125, -4.1044921875, -3.87811279296875, -3.6517333984375, -3.42535400390625, -3.198974609375, -2.97259521484375, -2.7462158203125, -2.51983642578125, -2.29345703125, -2.06707763671875, -1.8406982421875, -1.61431884765625, -1.387939453125, -1.16156005859375, -0.9351806640625, -0.70880126953125, -0.482421875, -0.25604248046875, -0.0296630859375, 0.19671630859375, 0.423095703125, 0.64947509765625, 0.8758544921875, 1.10223388671875, 1.32861328125, 1.55499267578125, 1.7813720703125, 2.00775146484375, 2.234130859375, 2.46051025390625, 2.6868896484375, 2.91326904296875, 3.1396484375, 3.36602783203125, 3.5924072265625, 3.81878662109375, 4.045166015625, 4.27154541015625, 4.4979248046875, 4.72430419921875, 4.95068359375, 5.17706298828125, 5.4034423828125, 5.62982177734375, 5.856201171875, 6.08258056640625, 6.3089599609375, 6.53533935546875, 6.76171875]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 4.0, 6.0, 9.0, 5.0, 12.0, 9.0, 16.0, 10.0, 15.0, 23.0, 22.0, 34.0, 30.0, 27.0, 38.0, 40.0, 43.0, 59.0, 71.0, 129.0, 352.0, 1465.0, 147.0, 78.0, 56.0, 45.0, 27.0, 30.0, 28.0, 33.0, 20.0, 19.0, 17.0, 18.0, 11.0, 15.0, 14.0, 13.0, 9.0, 7.0, 9.0, 6.0, 6.0, 5.0, 7.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-10.7890625, -10.452880859375, -10.11669921875, -9.780517578125, -9.4443359375, -9.108154296875, -8.77197265625, -8.435791015625, -8.099609375, -7.763427734375, -7.42724609375, -7.091064453125, -6.7548828125, -6.418701171875, -6.08251953125, -5.746337890625, -5.41015625, -5.073974609375, -4.73779296875, -4.401611328125, -4.0654296875, -3.729248046875, -3.39306640625, -3.056884765625, -2.720703125, -2.384521484375, -2.04833984375, -1.712158203125, -1.3759765625, -1.039794921875, -0.70361328125, -0.367431640625, -0.03125, 0.304931640625, 0.64111328125, 0.977294921875, 1.3134765625, 1.649658203125, 1.98583984375, 2.322021484375, 2.658203125, 2.994384765625, 3.33056640625, 3.666748046875, 4.0029296875, 4.339111328125, 4.67529296875, 5.011474609375, 5.34765625, 5.683837890625, 6.02001953125, 6.356201171875, 6.6923828125, 7.028564453125, 7.36474609375, 7.700927734375, 8.037109375, 8.373291015625, 8.70947265625, 9.045654296875, 9.3818359375, 9.718017578125, 10.05419921875, 10.390380859375, 10.7265625]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 1.0, 4.0, 2.0, 9.0, 8.0, 8.0, 11.0, 16.0, 16.0, 24.0, 15.0, 40.0, 30.0, 43.0, 45.0, 55.0, 67.0, 81.0, 124.0, 208.0, 463.0, 1203.0, 21611.0, 3108733.0, 10698.0, 973.0, 406.0, 215.0, 136.0, 112.0, 82.0, 53.0, 46.0, 28.0, 32.0, 24.0, 30.0, 10.0, 12.0, 8.0, 7.0, 8.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.75, -34.61279296875, -33.4755859375, -32.33837890625, -31.201171875, -30.06396484375, -28.9267578125, -27.78955078125, -26.65234375, -25.51513671875, -24.3779296875, -23.24072265625, -22.103515625, -20.96630859375, -19.8291015625, -18.69189453125, -17.5546875, -16.41748046875, -15.2802734375, -14.14306640625, -13.005859375, -11.86865234375, -10.7314453125, -9.59423828125, -8.45703125, -7.31982421875, -6.1826171875, -5.04541015625, -3.908203125, -2.77099609375, -1.6337890625, -0.49658203125, 0.640625, 1.77783203125, 2.9150390625, 4.05224609375, 5.189453125, 6.32666015625, 7.4638671875, 8.60107421875, 9.73828125, 10.87548828125, 12.0126953125, 13.14990234375, 14.287109375, 15.42431640625, 16.5615234375, 17.69873046875, 18.8359375, 19.97314453125, 21.1103515625, 22.24755859375, 23.384765625, 24.52197265625, 25.6591796875, 26.79638671875, 27.93359375, 29.07080078125, 30.2080078125, 31.34521484375, 32.482421875, 33.61962890625, 34.7568359375, 35.89404296875, 37.03125]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 22.0, 89.0, 284.0, 360.0, 210.0, 43.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.74382781982422, -51.605743408203125, -50.46765899658203, -49.32957077026367, -48.19148635864258, -47.053401947021484, -45.91531753540039, -44.77722930908203, -43.63914489746094, -42.501060485839844, -41.36297607421875, -40.22488784790039, -39.0868034362793, -37.9487190246582, -36.81063461303711, -35.67254638671875, -34.534461975097656, -33.39637756347656, -32.25829315185547, -31.120206832885742, -29.982120513916016, -28.844036102294922, -27.705951690673828, -26.5678653717041, -25.42978286743164, -24.291698455810547, -23.15361213684082, -22.015527725219727, -20.87744140625, -19.739356994628906, -18.601272583007812, -17.463186264038086, -16.32509994506836, -15.18701457977295, -14.048929214477539, -12.910844802856445, -11.772758483886719, -10.634674072265625, -9.496588706970215, -8.358503341674805, -7.2204179763793945, -6.082332611083984, -4.944247245788574, -3.8061623573303223, -2.668076992034912, -1.529991626739502, -0.39190673828125, 0.7461786270141602, 1.8842639923095703, 3.0223493576049805, 4.160434722900391, 5.298519611358643, 6.436604976654053, 7.574690341949463, 8.712775230407715, 9.850860595703125, 10.988945960998535, 12.127031326293945, 13.265116691589355, 14.403202056884766, 15.54128646850586, 16.679372787475586, 17.81745719909668, 18.955543518066406, 20.0936279296875]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 10.0, 12.0, 11.0, 16.0, 14.0, 13.0, 36.0, 23.0, 28.0, 37.0, 38.0, 46.0, 41.0, 47.0, 51.0, 50.0, 57.0, 57.0, 48.0, 61.0, 44.0, 42.0, 39.0, 26.0, 33.0, 22.0, 23.0, 13.0, 12.0, 18.0, 7.0, 10.0, 3.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-51.57958221435547, -50.222007751464844, -48.86442947387695, -47.50685501098633, -46.14927673339844, -44.79170227050781, -43.43412780761719, -42.0765495300293, -40.71897506713867, -39.36140060424805, -38.003822326660156, -36.64624786376953, -35.28866958618164, -33.931095123291016, -32.573516845703125, -31.2159423828125, -29.858366012573242, -28.500789642333984, -27.143213272094727, -25.78563690185547, -24.428062438964844, -23.070486068725586, -21.712909698486328, -20.355335235595703, -18.997756958007812, -17.640180587768555, -16.282604217529297, -14.925028800964355, -13.567453384399414, -12.209877014160156, -10.852300643920898, -9.494725227355957, -8.137149810791016, -6.779573917388916, -5.421998023986816, -4.064421653747559, -2.706845760345459, -1.3492698669433594, 0.008306503295898438, 1.3658819198608398, 2.7234582901000977, 4.081034183502197, 5.438610076904297, 6.796186447143555, 8.153762817382812, 9.511338233947754, 10.868914604187012, 12.226490020751953, 13.584066390991211, 14.941642761230469, 16.299219131469727, 17.656795501708984, 19.01436996459961, 20.371946334838867, 21.729522705078125, 23.08709716796875, 24.44467544555664, 25.8022518157959, 27.159828186035156, 28.51740264892578, 29.87497901916504, 31.232555389404297, 32.59013366699219, 33.94770812988281, 35.30528259277344]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 5.0, 5.0, 7.0, 4.0, 9.0, 8.0, 14.0, 13.0, 25.0, 24.0, 27.0, 22.0, 27.0, 31.0, 30.0, 29.0, 35.0, 35.0, 41.0, 40.0, 39.0, 41.0, 54.0, 47.0, 23.0, 47.0, 44.0, 34.0, 43.0, 29.0, 28.0, 20.0, 31.0, 14.0, 22.0, 17.0, 1.0, 10.0, 4.0, 11.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.25, -4.121795654296875, -3.99359130859375, -3.865386962890625, -3.7371826171875, -3.608978271484375, -3.48077392578125, -3.352569580078125, -3.224365234375, -3.096160888671875, -2.96795654296875, -2.839752197265625, -2.7115478515625, -2.583343505859375, -2.45513916015625, -2.326934814453125, -2.19873046875, -2.070526123046875, -1.94232177734375, -1.814117431640625, -1.6859130859375, -1.557708740234375, -1.42950439453125, -1.301300048828125, -1.173095703125, -1.044891357421875, -0.91668701171875, -0.788482666015625, -0.6602783203125, -0.532073974609375, -0.40386962890625, -0.275665283203125, -0.1474609375, -0.019256591796875, 0.10894775390625, 0.237152099609375, 0.3653564453125, 0.493560791015625, 0.62176513671875, 0.749969482421875, 0.878173828125, 1.006378173828125, 1.13458251953125, 1.262786865234375, 1.3909912109375, 1.519195556640625, 1.64739990234375, 1.775604248046875, 1.90380859375, 2.032012939453125, 2.16021728515625, 2.288421630859375, 2.4166259765625, 2.544830322265625, 2.67303466796875, 2.801239013671875, 2.929443359375, 3.057647705078125, 3.18585205078125, 3.314056396484375, 3.4422607421875, 3.570465087890625, 3.69866943359375, 3.826873779296875, 3.955078125]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 1.0, 3.0, 12.0, 6.0, 13.0, 17.0, 23.0, 20.0, 39.0, 32.0, 47.0, 65.0, 90.0, 152.0, 237.0, 397.0, 793.0, 2226.0, 10856.0, 79154.0, 524677.0, 1629817.0, 1448927.0, 421252.0, 63009.0, 8751.0, 1964.0, 712.0, 321.0, 213.0, 126.0, 70.0, 68.0, 41.0, 34.0, 24.0, 25.0, 20.0, 14.0, 7.0, 4.0, 8.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.60546875, -5.43524169921875, -5.2650146484375, -5.09478759765625, -4.924560546875, -4.75433349609375, -4.5841064453125, -4.41387939453125, -4.24365234375, -4.07342529296875, -3.9031982421875, -3.73297119140625, -3.562744140625, -3.39251708984375, -3.2222900390625, -3.05206298828125, -2.8818359375, -2.71160888671875, -2.5413818359375, -2.37115478515625, -2.200927734375, -2.03070068359375, -1.8604736328125, -1.69024658203125, -1.52001953125, -1.34979248046875, -1.1795654296875, -1.00933837890625, -0.839111328125, -0.66888427734375, -0.4986572265625, -0.32843017578125, -0.158203125, 0.01202392578125, 0.1822509765625, 0.35247802734375, 0.522705078125, 0.69293212890625, 0.8631591796875, 1.03338623046875, 1.20361328125, 1.37384033203125, 1.5440673828125, 1.71429443359375, 1.884521484375, 2.05474853515625, 2.2249755859375, 2.39520263671875, 2.5654296875, 2.73565673828125, 2.9058837890625, 3.07611083984375, 3.246337890625, 3.41656494140625, 3.5867919921875, 3.75701904296875, 3.92724609375, 4.09747314453125, 4.2677001953125, 4.43792724609375, 4.608154296875, 4.77838134765625, 4.9486083984375, 5.11883544921875, 5.2890625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 5.0, 3.0, 5.0, 6.0, 11.0, 13.0, 17.0, 16.0, 31.0, 50.0, 48.0, 67.0, 97.0, 134.0, 169.0, 247.0, 305.0, 388.0, 456.0, 423.0, 395.0, 299.0, 235.0, 188.0, 132.0, 81.0, 70.0, 50.0, 33.0, 23.0, 19.0, 15.0, 12.0, 7.0, 9.0, 3.0, 3.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.49609375, -7.2811279296875, -7.066162109375, -6.8511962890625, -6.63623046875, -6.4212646484375, -6.206298828125, -5.9913330078125, -5.7763671875, -5.5614013671875, -5.346435546875, -5.1314697265625, -4.91650390625, -4.7015380859375, -4.486572265625, -4.2716064453125, -4.056640625, -3.8416748046875, -3.626708984375, -3.4117431640625, -3.19677734375, -2.9818115234375, -2.766845703125, -2.5518798828125, -2.3369140625, -2.1219482421875, -1.906982421875, -1.6920166015625, -1.47705078125, -1.2620849609375, -1.047119140625, -0.8321533203125, -0.6171875, -0.4022216796875, -0.187255859375, 0.0277099609375, 0.24267578125, 0.4576416015625, 0.672607421875, 0.8875732421875, 1.1025390625, 1.3175048828125, 1.532470703125, 1.7474365234375, 1.96240234375, 2.1773681640625, 2.392333984375, 2.6072998046875, 2.822265625, 3.0372314453125, 3.252197265625, 3.4671630859375, 3.68212890625, 3.8970947265625, 4.112060546875, 4.3270263671875, 4.5419921875, 4.7569580078125, 4.971923828125, 5.1868896484375, 5.40185546875, 5.6168212890625, 5.831787109375, 6.0467529296875, 6.26171875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 6.0, 11.0, 19.0, 17.0, 26.0, 26.0, 52.0, 68.0, 118.0, 165.0, 261.0, 446.0, 747.0, 1618.0, 10611.0, 3220024.0, 952049.0, 5007.0, 1323.0, 589.0, 358.0, 238.0, 148.0, 107.0, 62.0, 52.0, 42.0, 23.0, 12.0, 9.0, 14.0, 6.0, 7.0, 3.0, 4.0, 8.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.515625, -20.715087890625, -19.91455078125, -19.114013671875, -18.3134765625, -17.512939453125, -16.71240234375, -15.911865234375, -15.111328125, -14.310791015625, -13.51025390625, -12.709716796875, -11.9091796875, -11.108642578125, -10.30810546875, -9.507568359375, -8.70703125, -7.906494140625, -7.10595703125, -6.305419921875, -5.5048828125, -4.704345703125, -3.90380859375, -3.103271484375, -2.302734375, -1.502197265625, -0.70166015625, 0.098876953125, 0.8994140625, 1.699951171875, 2.50048828125, 3.301025390625, 4.1015625, 4.902099609375, 5.70263671875, 6.503173828125, 7.3037109375, 8.104248046875, 8.90478515625, 9.705322265625, 10.505859375, 11.306396484375, 12.10693359375, 12.907470703125, 13.7080078125, 14.508544921875, 15.30908203125, 16.109619140625, 16.91015625, 17.710693359375, 18.51123046875, 19.311767578125, 20.1123046875, 20.912841796875, 21.71337890625, 22.513916015625, 23.314453125, 24.114990234375, 24.91552734375, 25.716064453125, 26.5166015625, 27.317138671875, 28.11767578125, 28.918212890625, 29.71875]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 42.0, 386.0, 498.0, 86.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-136.50393676757812, -132.3837890625, -128.26364135742188, -124.14350891113281, -120.02336120605469, -115.90321350097656, -111.78307342529297, -107.66293334960938, -103.54278564453125, -99.42263793945312, -95.30249786376953, -91.18235778808594, -87.06221008300781, -82.94206237792969, -78.8219223022461, -74.7017822265625, -70.58163452148438, -66.46148681640625, -62.341346740722656, -58.2212028503418, -54.10105895996094, -49.98091506958008, -45.86077117919922, -41.74062728881836, -37.6204833984375, -33.50033950805664, -29.38019561767578, -25.260051727294922, -21.139907836914062, -17.019763946533203, -12.899620056152344, -8.779476165771484, -4.6593170166015625, -0.5391731262207031, 3.5809707641601562, 7.701114654541016, 11.821258544921875, 15.941402435302734, 20.061546325683594, 24.181690216064453, 28.301834106445312, 32.42197799682617, 36.54212188720703, 40.66226577758789, 44.78240966796875, 48.90255355834961, 53.02269744873047, 57.14284133911133, 61.26298522949219, 65.38313293457031, 69.5032730102539, 73.6234130859375, 77.74356079101562, 81.86370849609375, 85.98384857177734, 90.10398864746094, 94.22413635253906, 98.34428405761719, 102.46442413330078, 106.58456420898438, 110.7047119140625, 114.82485961914062, 118.94499969482422, 123.06513977050781, 127.18528747558594]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 4.0, 8.0, 3.0, 6.0, 10.0, 19.0, 14.0, 12.0, 19.0, 30.0, 33.0, 39.0, 36.0, 44.0, 32.0, 52.0, 48.0, 47.0, 43.0, 40.0, 48.0, 47.0, 39.0, 48.0, 39.0, 35.0, 28.0, 31.0, 30.0, 15.0, 16.0, 15.0, 15.0, 10.0, 3.0, 14.0, 8.0, 5.0, 2.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.92617416381836, -22.146080017089844, -21.365985870361328, -20.585891723632812, -19.805795669555664, -19.02570152282715, -18.245607376098633, -17.465513229370117, -16.68541717529297, -15.905323028564453, -15.125227928161621, -14.345133781433105, -13.565038681030273, -12.784944534301758, -12.004850387573242, -11.224756240844727, -10.444662094116211, -9.664567947387695, -8.884472846984863, -8.104378700256348, -7.324284076690674, -6.544189453125, -5.764095306396484, -4.9840006828308105, -4.203906059265137, -3.423811435699463, -2.643717050552368, -1.8636226654052734, -1.0835280418395996, -0.3034334182739258, 0.47666072845458984, 1.2567553520202637, 2.0368499755859375, 2.8169445991516113, 3.597038984298706, 4.377133369445801, 5.157227993011475, 5.937322616577148, 6.717416763305664, 7.497511386871338, 8.277606010437012, 9.057700157165527, 9.83779525756836, 10.617889404296875, 11.39798355102539, 12.178078651428223, 12.958172798156738, 13.73826789855957, 14.518362045288086, 15.298456192016602, 16.078550338745117, 16.858646392822266, 17.63874053955078, 18.418834686279297, 19.198928833007812, 19.979022979736328, 20.759117126464844, 21.53921127319336, 22.319305419921875, 23.09939956665039, 23.87949562072754, 24.659589767456055, 25.43968391418457, 26.219778060913086, 26.999874114990234]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 4.0, 4.0, 10.0, 5.0, 9.0, 7.0, 10.0, 3.0, 20.0, 14.0, 20.0, 20.0, 26.0, 29.0, 21.0, 24.0, 35.0, 35.0, 31.0, 43.0, 35.0, 38.0, 39.0, 36.0, 36.0, 49.0, 48.0, 37.0, 35.0, 30.0, 31.0, 26.0, 28.0, 22.0, 22.0, 20.0, 19.0, 16.0, 15.0, 16.0, 10.0, 7.0, 3.0, 3.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-3.515625, -3.40960693359375, -3.3035888671875, -3.19757080078125, -3.091552734375, -2.98553466796875, -2.8795166015625, -2.77349853515625, -2.66748046875, -2.56146240234375, -2.4554443359375, -2.34942626953125, -2.243408203125, -2.13739013671875, -2.0313720703125, -1.92535400390625, -1.8193359375, -1.71331787109375, -1.6072998046875, -1.50128173828125, -1.395263671875, -1.28924560546875, -1.1832275390625, -1.07720947265625, -0.97119140625, -0.86517333984375, -0.7591552734375, -0.65313720703125, -0.547119140625, -0.44110107421875, -0.3350830078125, -0.22906494140625, -0.123046875, -0.01702880859375, 0.0889892578125, 0.19500732421875, 0.301025390625, 0.40704345703125, 0.5130615234375, 0.61907958984375, 0.72509765625, 0.83111572265625, 0.9371337890625, 1.04315185546875, 1.149169921875, 1.25518798828125, 1.3612060546875, 1.46722412109375, 1.5732421875, 1.67926025390625, 1.7852783203125, 1.89129638671875, 1.997314453125, 2.10333251953125, 2.2093505859375, 2.31536865234375, 2.42138671875, 2.52740478515625, 2.6334228515625, 2.73944091796875, 2.845458984375, 2.95147705078125, 3.0574951171875, 3.16351318359375, 3.26953125]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 9.0, 3.0, 13.0, 28.0, 20.0, 42.0, 77.0, 123.0, 194.0, 270.0, 392.0, 628.0, 906.0, 1378.0, 2096.0, 3099.0, 5029.0, 8022.0, 12552.0, 20345.0, 33143.0, 57492.0, 106304.0, 230511.0, 275157.0, 125745.0, 66042.0, 37280.0, 22821.0, 14039.0, 8925.0, 5550.0, 3755.0, 2258.0, 1498.0, 928.0, 655.0, 430.0, 261.0, 201.0, 120.0, 85.0, 39.0, 32.0, 33.0, 16.0, 4.0, 5.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.67041015625, -0.6495361328125, -0.628662109375, -0.6077880859375, -0.5869140625, -0.5660400390625, -0.545166015625, -0.5242919921875, -0.50341796875, -0.4825439453125, -0.461669921875, -0.4407958984375, -0.419921875, -0.3990478515625, -0.378173828125, -0.3572998046875, -0.33642578125, -0.3155517578125, -0.294677734375, -0.2738037109375, -0.2529296875, -0.2320556640625, -0.211181640625, -0.1903076171875, -0.16943359375, -0.1485595703125, -0.127685546875, -0.1068115234375, -0.0859375, -0.0650634765625, -0.044189453125, -0.0233154296875, -0.00244140625, 0.0184326171875, 0.039306640625, 0.0601806640625, 0.0810546875, 0.1019287109375, 0.122802734375, 0.1436767578125, 0.16455078125, 0.1854248046875, 0.206298828125, 0.2271728515625, 0.248046875, 0.2689208984375, 0.289794921875, 0.3106689453125, 0.33154296875, 0.3524169921875, 0.373291015625, 0.3941650390625, 0.4150390625, 0.4359130859375, 0.456787109375, 0.4776611328125, 0.49853515625, 0.5194091796875, 0.540283203125, 0.5611572265625, 0.58203125, 0.6029052734375, 0.623779296875, 0.6446533203125, 0.66552734375]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 3.0, 7.0, 12.0, 9.0, 12.0, 13.0, 11.0, 26.0, 25.0, 42.0, 29.0, 31.0, 44.0, 38.0, 32.0, 56.0, 57.0, 49.0, 1073.0, 58.0, 40.0, 39.0, 48.0, 31.0, 37.0, 31.0, 27.0, 28.0, 22.0, 18.0, 21.0, 10.0, 11.0, 10.0, 9.0, 4.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.8046875, -2.72064208984375, -2.6365966796875, -2.55255126953125, -2.468505859375, -2.38446044921875, -2.3004150390625, -2.21636962890625, -2.13232421875, -2.04827880859375, -1.9642333984375, -1.88018798828125, -1.796142578125, -1.71209716796875, -1.6280517578125, -1.54400634765625, -1.4599609375, -1.37591552734375, -1.2918701171875, -1.20782470703125, -1.123779296875, -1.03973388671875, -0.9556884765625, -0.87164306640625, -0.78759765625, -0.70355224609375, -0.6195068359375, -0.53546142578125, -0.451416015625, -0.36737060546875, -0.2833251953125, -0.19927978515625, -0.115234375, -0.03118896484375, 0.0528564453125, 0.13690185546875, 0.220947265625, 0.30499267578125, 0.3890380859375, 0.47308349609375, 0.55712890625, 0.64117431640625, 0.7252197265625, 0.80926513671875, 0.893310546875, 0.97735595703125, 1.0614013671875, 1.14544677734375, 1.2294921875, 1.31353759765625, 1.3975830078125, 1.48162841796875, 1.565673828125, 1.64971923828125, 1.7337646484375, 1.81781005859375, 1.90185546875, 1.98590087890625, 2.0699462890625, 2.15399169921875, 2.238037109375, 2.32208251953125, 2.4061279296875, 2.49017333984375, 2.57421875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 7.0, 11.0, 18.0, 22.0, 21.0, 38.0, 55.0, 95.0, 121.0, 213.0, 304.0, 470.0, 703.0, 1067.0, 1617.0, 2584.0, 4043.0, 6446.0, 10297.0, 16710.0, 28174.0, 49398.0, 92615.0, 206317.0, 1373086.0, 137841.0, 68475.0, 38144.0, 22234.0, 13306.0, 8332.0, 5037.0, 3262.0, 2113.0, 1328.0, 939.0, 550.0, 375.0, 248.0, 180.0, 104.0, 87.0, 51.0, 41.0, 18.0, 12.0, 10.0, 7.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.74951171875, -0.7269821166992188, -0.7044525146484375, -0.6819229125976562, -0.659393310546875, -0.6368637084960938, -0.6143341064453125, -0.5918045043945312, -0.56927490234375, -0.5467453002929688, -0.5242156982421875, -0.5016860961914062, -0.479156494140625, -0.45662689208984375, -0.4340972900390625, -0.41156768798828125, -0.3890380859375, -0.36650848388671875, -0.3439788818359375, -0.32144927978515625, -0.298919677734375, -0.27639007568359375, -0.2538604736328125, -0.23133087158203125, -0.20880126953125, -0.18627166748046875, -0.1637420654296875, -0.14121246337890625, -0.118682861328125, -0.09615325927734375, -0.0736236572265625, -0.05109405517578125, -0.028564453125, -0.00603485107421875, 0.0164947509765625, 0.03902435302734375, 0.061553955078125, 0.08408355712890625, 0.1066131591796875, 0.12914276123046875, 0.15167236328125, 0.17420196533203125, 0.1967315673828125, 0.21926116943359375, 0.241790771484375, 0.26432037353515625, 0.2868499755859375, 0.30937957763671875, 0.3319091796875, 0.35443878173828125, 0.3769683837890625, 0.39949798583984375, 0.422027587890625, 0.44455718994140625, 0.4670867919921875, 0.48961639404296875, 0.51214599609375, 0.5346755981445312, 0.5572052001953125, 0.5797348022460938, 0.602264404296875, 0.6247940063476562, 0.6473236083984375, 0.6698532104492188, 0.6923828125]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 0.0, 3.0, 3.0, 6.0, 5.0, 0.0, 8.0, 9.0, 16.0, 15.0, 22.0, 18.0, 16.0, 24.0, 34.0, 26.0, 44.0, 46.0, 38.0, 59.0, 78.0, 50.0, 59.0, 68.0, 60.0, 46.0, 47.0, 40.0, 28.0, 24.0, 27.0, 16.0, 11.0, 17.0, 3.0, 4.0, 7.0, 4.0, 4.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0], "bins": [-0.0004138946533203125, -0.0004028528928756714, -0.0003918111324310303, -0.00038076937198638916, -0.00036972761154174805, -0.00035868585109710693, -0.0003476440906524658, -0.0003366023302078247, -0.0003255605697631836, -0.0003145188093185425, -0.00030347704887390137, -0.00029243528842926025, -0.00028139352798461914, -0.00027035176753997803, -0.0002593100070953369, -0.0002482682466506958, -0.0002372264862060547, -0.00022618472576141357, -0.00021514296531677246, -0.00020410120487213135, -0.00019305944442749023, -0.00018201768398284912, -0.000170975923538208, -0.0001599341630935669, -0.00014889240264892578, -0.00013785064220428467, -0.00012680888175964355, -0.00011576712131500244, -0.00010472536087036133, -9.368360042572021e-05, -8.26418399810791e-05, -7.160007953643799e-05, -6.0558319091796875e-05, -4.951655864715576e-05, -3.847479820251465e-05, -2.7433037757873535e-05, -1.6391277313232422e-05, -5.349516868591309e-06, 5.692243576049805e-06, 1.6734004020690918e-05, 2.777576446533203e-05, 3.8817524909973145e-05, 4.985928535461426e-05, 6.090104579925537e-05, 7.194280624389648e-05, 8.29845666885376e-05, 9.402632713317871e-05, 0.00010506808757781982, 0.00011610984802246094, 0.00012715160846710205, 0.00013819336891174316, 0.00014923512935638428, 0.0001602768898010254, 0.0001713186502456665, 0.00018236041069030762, 0.00019340217113494873, 0.00020444393157958984, 0.00021548569202423096, 0.00022652745246887207, 0.00023756921291351318, 0.0002486109733581543, 0.0002596527338027954, 0.0002706944942474365, 0.00028173625469207764, 0.00029277801513671875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 8.0, 6.0, 5.0, 11.0, 9.0, 6.0, 9.0, 11.0, 17.0, 42.0, 29.0, 24.0, 45.0, 73.0, 106.0, 161.0, 221.0, 429.0, 1074.0, 89148.0, 953838.0, 1781.0, 619.0, 240.0, 165.0, 104.0, 67.0, 66.0, 49.0, 42.0, 31.0, 20.0, 24.0, 22.0, 13.0, 5.0, 6.0, 7.0, 4.0, 4.0, 6.0, 1.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.006134033203125, -0.005899786949157715, -0.00566554069519043, -0.0054312944412231445, -0.005197048187255859, -0.004962801933288574, -0.004728555679321289, -0.004494309425354004, -0.004260063171386719, -0.004025816917419434, -0.0037915706634521484, -0.0035573244094848633, -0.003323078155517578, -0.003088831901550293, -0.002854585647583008, -0.0026203393936157227, -0.0023860931396484375, -0.0021518468856811523, -0.0019176006317138672, -0.001683354377746582, -0.0014491081237792969, -0.0012148618698120117, -0.0009806156158447266, -0.0007463693618774414, -0.0005121231079101562, -0.0002778768539428711, -4.363059997558594e-05, 0.00019061565399169922, 0.0004248619079589844, 0.0006591081619262695, 0.0008933544158935547, 0.0011276006698608398, 0.001361846923828125, 0.0015960931777954102, 0.0018303394317626953, 0.0020645856857299805, 0.0022988319396972656, 0.0025330781936645508, 0.002767324447631836, 0.003001570701599121, 0.0032358169555664062, 0.0034700632095336914, 0.0037043094635009766, 0.003938555717468262, 0.004172801971435547, 0.004407048225402832, 0.004641294479370117, 0.004875540733337402, 0.0051097869873046875, 0.005344033241271973, 0.005578279495239258, 0.005812525749206543, 0.006046772003173828, 0.006281018257141113, 0.0065152645111083984, 0.006749510765075684, 0.006983757019042969, 0.007218003273010254, 0.007452249526977539, 0.007686495780944824, 0.00792074203491211, 0.008154988288879395, 0.00838923454284668, 0.008623480796813965, 0.00885772705078125]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 7.0, 17.0, 29.0, 46.0, 102.0, 148.0, 166.0, 171.0, 132.0, 95.0, 57.0, 20.0, 8.0, 6.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0002174089604523033, -0.00020824294188059866, -0.00019907692330889404, -0.0001899109047371894, -0.00018074488616548479, -0.00017157886759378016, -0.00016241284902207553, -0.0001532468304503709, -0.00014408081187866628, -0.00013491479330696166, -0.00012574877473525703, -0.0001165827561635524, -0.00010741673759184778, -9.825071902014315e-05, -8.908470044843853e-05, -7.99186818767339e-05, -7.075266330502927e-05, -6.158664473332465e-05, -5.242062616162002e-05, -4.3254607589915395e-05, -3.408858901821077e-05, -2.4922570446506143e-05, -1.5756551874801517e-05, -6.5905333030968904e-06, 2.5754852686077356e-06, 1.1741503840312362e-05, 2.0907522412016988e-05, 3.0073540983721614e-05, 3.923955955542624e-05, 4.8405578127130866e-05, 5.757159669883549e-05, 6.673761527054012e-05, 7.590363384224474e-05, 8.506965241394937e-05, 9.4235670985654e-05, 0.00010340168955735862, 0.00011256770812906325, 0.00012173372670076787, 0.0001308997452724725, 0.00014006576384417713, 0.00014923178241588175, 0.00015839780098758638, 0.000167563819559291, 0.00017672983813099563, 0.00018589585670270026, 0.00019506187527440488, 0.0002042278938461095, 0.00021339391241781414, 0.00022255993098951876, 0.0002317259495612234, 0.00024089196813292801, 0.00025005798670463264, 0.00025922400527633727, 0.0002683900238480419, 0.0002775560424197465, 0.00028672206099145114, 0.00029588807956315577, 0.0003050540981348604, 0.000314220116706565, 0.00032338613527826965, 0.0003325521538499743, 0.0003417181724216789, 0.0003508841909933835, 0.00036005020956508815, 0.0003692162281367928]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 2.0, 6.0, 5.0, 6.0, 6.0, 7.0, 12.0, 6.0, 13.0, 11.0, 14.0, 16.0, 15.0, 25.0, 27.0, 35.0, 33.0, 26.0, 47.0, 34.0, 35.0, 45.0, 46.0, 34.0, 40.0, 51.0, 22.0, 39.0, 29.0, 39.0, 37.0, 38.0, 30.0, 26.0, 31.0, 12.0, 18.0, 19.0, 12.0, 8.0, 17.0, 6.0, 3.0, 3.0, 1.0, 5.0, 7.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.0001887679100036621, -0.00018302258104085922, -0.00017727725207805634, -0.00017153192311525345, -0.00016578659415245056, -0.00016004126518964767, -0.0001542959362268448, -0.0001485506072640419, -0.00014280527830123901, -0.00013705994933843613, -0.00013131462037563324, -0.00012556929141283035, -0.00011982396245002747, -0.00011407863348722458, -0.00010833330452442169, -0.0001025879755616188, -9.684264659881592e-05, -9.109731763601303e-05, -8.535198867321014e-05, -7.960665971040726e-05, -7.386133074760437e-05, -6.811600178480148e-05, -6.23706728219986e-05, -5.662534385919571e-05, -5.088001489639282e-05, -4.5134685933589935e-05, -3.938935697078705e-05, -3.364402800798416e-05, -2.7898699045181274e-05, -2.2153370082378387e-05, -1.64080411195755e-05, -1.0662712156772614e-05, -4.9173831939697266e-06, 8.279457688331604e-07, 6.573274731636047e-06, 1.2318603694438934e-05, 1.806393265724182e-05, 2.3809261620044708e-05, 2.9554590582847595e-05, 3.529991954565048e-05, 4.104524850845337e-05, 4.6790577471256256e-05, 5.253590643405914e-05, 5.828123539686203e-05, 6.402656435966492e-05, 6.97718933224678e-05, 7.551722228527069e-05, 8.126255124807358e-05, 8.700788021087646e-05, 9.275320917367935e-05, 9.849853813648224e-05, 0.00010424386709928513, 0.00010998919606208801, 0.0001157345250248909, 0.00012147985398769379, 0.00012722518295049667, 0.00013297051191329956, 0.00013871584087610245, 0.00014446116983890533, 0.00015020649880170822, 0.0001559518277645111, 0.000161697156727314, 0.00016744248569011688, 0.00017318781465291977, 0.00017893314361572266]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 4.0, 4.0, 10.0, 5.0, 9.0, 7.0, 10.0, 3.0, 20.0, 14.0, 20.0, 20.0, 26.0, 29.0, 21.0, 24.0, 35.0, 35.0, 31.0, 43.0, 35.0, 38.0, 39.0, 36.0, 36.0, 49.0, 48.0, 37.0, 35.0, 30.0, 31.0, 26.0, 28.0, 22.0, 22.0, 20.0, 19.0, 16.0, 15.0, 16.0, 10.0, 7.0, 3.0, 3.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-3.515625, -3.40960693359375, -3.3035888671875, -3.19757080078125, -3.091552734375, -2.98553466796875, -2.8795166015625, -2.77349853515625, -2.66748046875, -2.56146240234375, -2.4554443359375, -2.34942626953125, -2.243408203125, -2.13739013671875, -2.0313720703125, -1.92535400390625, -1.8193359375, -1.71331787109375, -1.6072998046875, -1.50128173828125, -1.395263671875, -1.28924560546875, -1.1832275390625, -1.07720947265625, -0.97119140625, -0.86517333984375, -0.7591552734375, -0.65313720703125, -0.547119140625, -0.44110107421875, -0.3350830078125, -0.22906494140625, -0.123046875, -0.01702880859375, 0.0889892578125, 0.19500732421875, 0.301025390625, 0.40704345703125, 0.5130615234375, 0.61907958984375, 0.72509765625, 0.83111572265625, 0.9371337890625, 1.04315185546875, 1.149169921875, 1.25518798828125, 1.3612060546875, 1.46722412109375, 1.5732421875, 1.67926025390625, 1.7852783203125, 1.89129638671875, 1.997314453125, 2.10333251953125, 2.2093505859375, 2.31536865234375, 2.42138671875, 2.52740478515625, 2.6334228515625, 2.73944091796875, 2.845458984375, 2.95147705078125, 3.0574951171875, 3.16351318359375, 3.26953125]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 6.0, 5.0, 7.0, 8.0, 12.0, 8.0, 5.0, 11.0, 25.0, 35.0, 37.0, 52.0, 90.0, 152.0, 295.0, 609.0, 1389.0, 3409.0, 8644.0, 21195.0, 52179.0, 136748.0, 326092.0, 300045.0, 118911.0, 46449.0, 18997.0, 7566.0, 3033.0, 1291.0, 569.0, 266.0, 125.0, 89.0, 63.0, 30.0, 25.0, 16.0, 10.0, 20.0, 11.0, 3.0, 5.0, 3.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0], "bins": [-3.86328125, -3.7459716796875, -3.628662109375, -3.5113525390625, -3.39404296875, -3.2767333984375, -3.159423828125, -3.0421142578125, -2.9248046875, -2.8074951171875, -2.690185546875, -2.5728759765625, -2.45556640625, -2.3382568359375, -2.220947265625, -2.1036376953125, -1.986328125, -1.8690185546875, -1.751708984375, -1.6343994140625, -1.51708984375, -1.3997802734375, -1.282470703125, -1.1651611328125, -1.0478515625, -0.9305419921875, -0.813232421875, -0.6959228515625, -0.57861328125, -0.4613037109375, -0.343994140625, -0.2266845703125, -0.109375, 0.0079345703125, 0.125244140625, 0.2425537109375, 0.35986328125, 0.4771728515625, 0.594482421875, 0.7117919921875, 0.8291015625, 0.9464111328125, 1.063720703125, 1.1810302734375, 1.29833984375, 1.4156494140625, 1.532958984375, 1.6502685546875, 1.767578125, 1.8848876953125, 2.002197265625, 2.1195068359375, 2.23681640625, 2.3541259765625, 2.471435546875, 2.5887451171875, 2.7060546875, 2.8233642578125, 2.940673828125, 3.0579833984375, 3.17529296875, 3.2926025390625, 3.409912109375, 3.5272216796875, 3.64453125]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 6.0, 1.0, 8.0, 3.0, 6.0, 9.0, 8.0, 12.0, 18.0, 11.0, 21.0, 17.0, 13.0, 21.0, 22.0, 46.0, 42.0, 33.0, 59.0, 54.0, 68.0, 162.0, 1378.0, 416.0, 146.0, 80.0, 53.0, 37.0, 43.0, 36.0, 35.0, 27.0, 28.0, 20.0, 20.0, 14.0, 15.0, 12.0, 6.0, 10.0, 12.0, 7.0, 7.0, 1.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-11.5078125, -11.13623046875, -10.7646484375, -10.39306640625, -10.021484375, -9.64990234375, -9.2783203125, -8.90673828125, -8.53515625, -8.16357421875, -7.7919921875, -7.42041015625, -7.048828125, -6.67724609375, -6.3056640625, -5.93408203125, -5.5625, -5.19091796875, -4.8193359375, -4.44775390625, -4.076171875, -3.70458984375, -3.3330078125, -2.96142578125, -2.58984375, -2.21826171875, -1.8466796875, -1.47509765625, -1.103515625, -0.73193359375, -0.3603515625, 0.01123046875, 0.3828125, 0.75439453125, 1.1259765625, 1.49755859375, 1.869140625, 2.24072265625, 2.6123046875, 2.98388671875, 3.35546875, 3.72705078125, 4.0986328125, 4.47021484375, 4.841796875, 5.21337890625, 5.5849609375, 5.95654296875, 6.328125, 6.69970703125, 7.0712890625, 7.44287109375, 7.814453125, 8.18603515625, 8.5576171875, 8.92919921875, 9.30078125, 9.67236328125, 10.0439453125, 10.41552734375, 10.787109375, 11.15869140625, 11.5302734375, 11.90185546875, 12.2734375]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 6.0, 11.0, 10.0, 17.0, 22.0, 38.0, 31.0, 50.0, 87.0, 148.0, 267.0, 508.0, 1287.0, 31112.0, 3101959.0, 8069.0, 999.0, 467.0, 202.0, 127.0, 76.0, 57.0, 41.0, 36.0, 19.0, 16.0, 20.0, 5.0, 8.0, 3.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.53125, -28.3681640625, -27.205078125, -26.0419921875, -24.87890625, -23.7158203125, -22.552734375, -21.3896484375, -20.2265625, -19.0634765625, -17.900390625, -16.7373046875, -15.57421875, -14.4111328125, -13.248046875, -12.0849609375, -10.921875, -9.7587890625, -8.595703125, -7.4326171875, -6.26953125, -5.1064453125, -3.943359375, -2.7802734375, -1.6171875, -0.4541015625, 0.708984375, 1.8720703125, 3.03515625, 4.1982421875, 5.361328125, 6.5244140625, 7.6875, 8.8505859375, 10.013671875, 11.1767578125, 12.33984375, 13.5029296875, 14.666015625, 15.8291015625, 16.9921875, 18.1552734375, 19.318359375, 20.4814453125, 21.64453125, 22.8076171875, 23.970703125, 25.1337890625, 26.296875, 27.4599609375, 28.623046875, 29.7861328125, 30.94921875, 32.1123046875, 33.275390625, 34.4384765625, 35.6015625, 36.7646484375, 37.927734375, 39.0908203125, 40.25390625, 41.4169921875, 42.580078125, 43.7431640625, 44.90625]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 77.0, 730.0, 202.0, 6.0, 2.0, 2.0], "bins": [-184.623779296875, -181.52517700195312, -178.42657470703125, -175.32798767089844, -172.22938537597656, -169.1307830810547, -166.03219604492188, -162.93359375, -159.83499145507812, -156.73638916015625, -153.63778686523438, -150.53919982910156, -147.4405975341797, -144.3419952392578, -141.243408203125, -138.14480590820312, -135.04620361328125, -131.94760131835938, -128.8489990234375, -125.75041198730469, -122.65180969238281, -119.55320739746094, -116.4546127319336, -113.35601806640625, -110.25741577148438, -107.1588134765625, -104.06021881103516, -100.96162414550781, -97.86302185058594, -94.76441955566406, -91.66582489013672, -88.56723022460938, -85.46862030029297, -82.37002563476562, -79.27142333984375, -76.17282104492188, -73.07422637939453, -69.97563171386719, -66.87702941894531, -63.7784309387207, -60.679832458496094, -57.581233978271484, -54.482635498046875, -51.384037017822266, -48.285438537597656, -45.18684005737305, -42.08824157714844, -38.98964309692383, -35.89104461669922, -32.79244613647461, -29.69384765625, -26.59524917602539, -23.49665069580078, -20.398052215576172, -17.299453735351562, -14.200855255126953, -11.102258682250977, -8.003660202026367, -4.905061721801758, -1.8064632415771484, 1.292135238647461, 4.39073371887207, 7.48933219909668, 10.587930679321289, 13.686529159545898]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 7.0, 7.0, 4.0, 6.0, 12.0, 13.0, 11.0, 9.0, 18.0, 24.0, 29.0, 30.0, 24.0, 37.0, 33.0, 41.0, 44.0, 37.0, 43.0, 44.0, 39.0, 34.0, 45.0, 39.0, 42.0, 36.0, 40.0, 33.0, 32.0, 22.0, 19.0, 18.0, 25.0, 23.0, 9.0, 12.0, 13.0, 9.0, 13.0, 6.0, 5.0, 4.0, 4.0, 7.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-29.117712020874023, -28.188800811767578, -27.2598876953125, -26.330976486206055, -25.40206527709961, -24.47315216064453, -23.544240951538086, -22.61532974243164, -21.686416625976562, -20.757505416870117, -19.82859230041504, -18.899681091308594, -17.97076988220215, -17.04185676574707, -16.112945556640625, -15.184033393859863, -14.255122184753418, -13.326210021972656, -12.397298812866211, -11.46838665008545, -10.539474487304688, -9.610563278198242, -8.68165111541748, -7.752738952636719, -6.823827266693115, -5.894915580749512, -4.96600341796875, -4.0370917320251465, -3.108179807662964, -2.1792678833007812, -1.2503561973571777, -0.321444034576416, 0.6074676513671875, 1.5363795757293701, 2.4652915000915527, 3.3942031860351562, 4.323115348815918, 5.2520270347595215, 6.180938720703125, 7.109850883483887, 8.038763046264648, 8.96767520904541, 9.896586418151855, 10.825498580932617, 11.754410743713379, 12.68332290649414, 13.612234115600586, 14.541146278381348, 15.470057487487793, 16.398969650268555, 17.327880859375, 18.256793975830078, 19.185705184936523, 20.11461639404297, 21.043529510498047, 21.972440719604492, 22.901351928710938, 23.830263137817383, 24.75917625427246, 25.688087463378906, 26.61699867248535, 27.54591178894043, 28.474822998046875, 29.403736114501953, 30.3326473236084]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 1.0, 5.0, 4.0, 8.0, 4.0, 8.0, 12.0, 13.0, 16.0, 10.0, 29.0, 17.0, 15.0, 25.0, 25.0, 31.0, 26.0, 36.0, 37.0, 27.0, 59.0, 40.0, 49.0, 40.0, 34.0, 34.0, 38.0, 36.0, 31.0, 37.0, 37.0, 36.0, 21.0, 30.0, 22.0, 21.0, 9.0, 14.0, 19.0, 12.0, 6.0, 6.0, 7.0, 7.0, 3.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-3.990234375, -3.873260498046875, -3.75628662109375, -3.639312744140625, -3.5223388671875, -3.405364990234375, -3.28839111328125, -3.171417236328125, -3.054443359375, -2.937469482421875, -2.82049560546875, -2.703521728515625, -2.5865478515625, -2.469573974609375, -2.35260009765625, -2.235626220703125, -2.11865234375, -2.001678466796875, -1.88470458984375, -1.767730712890625, -1.6507568359375, -1.533782958984375, -1.41680908203125, -1.299835205078125, -1.182861328125, -1.065887451171875, -0.94891357421875, -0.831939697265625, -0.7149658203125, -0.597991943359375, -0.48101806640625, -0.364044189453125, -0.2470703125, -0.130096435546875, -0.01312255859375, 0.103851318359375, 0.2208251953125, 0.337799072265625, 0.45477294921875, 0.571746826171875, 0.688720703125, 0.805694580078125, 0.92266845703125, 1.039642333984375, 1.1566162109375, 1.273590087890625, 1.39056396484375, 1.507537841796875, 1.62451171875, 1.741485595703125, 1.85845947265625, 1.975433349609375, 2.0924072265625, 2.209381103515625, 2.32635498046875, 2.443328857421875, 2.560302734375, 2.677276611328125, 2.79425048828125, 2.911224365234375, 3.0281982421875, 3.145172119140625, 3.26214599609375, 3.379119873046875, 3.49609375]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 0.0, 5.0, 9.0, 10.0, 9.0, 6.0, 11.0, 15.0, 21.0, 18.0, 17.0, 28.0, 34.0, 56.0, 64.0, 72.0, 107.0, 167.0, 343.0, 1573.0, 69515.0, 2964696.0, 1143881.0, 12046.0, 764.0, 224.0, 151.0, 83.0, 69.0, 68.0, 40.0, 31.0, 23.0, 24.0, 18.0, 17.0, 13.0, 15.0, 8.0, 12.0, 6.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9375, -12.53076171875, -12.1240234375, -11.71728515625, -11.310546875, -10.90380859375, -10.4970703125, -10.09033203125, -9.68359375, -9.27685546875, -8.8701171875, -8.46337890625, -8.056640625, -7.64990234375, -7.2431640625, -6.83642578125, -6.4296875, -6.02294921875, -5.6162109375, -5.20947265625, -4.802734375, -4.39599609375, -3.9892578125, -3.58251953125, -3.17578125, -2.76904296875, -2.3623046875, -1.95556640625, -1.548828125, -1.14208984375, -0.7353515625, -0.32861328125, 0.078125, 0.48486328125, 0.8916015625, 1.29833984375, 1.705078125, 2.11181640625, 2.5185546875, 2.92529296875, 3.33203125, 3.73876953125, 4.1455078125, 4.55224609375, 4.958984375, 5.36572265625, 5.7724609375, 6.17919921875, 6.5859375, 6.99267578125, 7.3994140625, 7.80615234375, 8.212890625, 8.61962890625, 9.0263671875, 9.43310546875, 9.83984375, 10.24658203125, 10.6533203125, 11.06005859375, 11.466796875, 11.87353515625, 12.2802734375, 12.68701171875, 13.09375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 7.0, 9.0, 27.0, 19.0, 43.0, 71.0, 73.0, 103.0, 210.0, 302.0, 411.0, 574.0, 620.0, 530.0, 374.0, 267.0, 165.0, 100.0, 63.0, 43.0, 24.0, 4.0, 11.0, 8.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-12.03125, -11.765625, -11.5, -11.234375, -10.96875, -10.703125, -10.4375, -10.171875, -9.90625, -9.640625, -9.375, -9.109375, -8.84375, -8.578125, -8.3125, -8.046875, -7.78125, -7.515625, -7.25, -6.984375, -6.71875, -6.453125, -6.1875, -5.921875, -5.65625, -5.390625, -5.125, -4.859375, -4.59375, -4.328125, -4.0625, -3.796875, -3.53125, -3.265625, -3.0, -2.734375, -2.46875, -2.203125, -1.9375, -1.671875, -1.40625, -1.140625, -0.875, -0.609375, -0.34375, -0.078125, 0.1875, 0.453125, 0.71875, 0.984375, 1.25, 1.515625, 1.78125, 2.046875, 2.3125, 2.578125, 2.84375, 3.109375, 3.375, 3.640625, 3.90625, 4.171875, 4.4375, 4.703125, 4.96875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 5.0, 14.0, 8.0, 17.0, 24.0, 46.0, 50.0, 84.0, 139.0, 195.0, 313.0, 500.0, 1223.0, 16487.0, 3858583.0, 312329.0, 2390.0, 707.0, 380.0, 241.0, 160.0, 130.0, 92.0, 55.0, 36.0, 26.0, 18.0, 9.0, 14.0, 5.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.0625, -15.205078125, -14.34765625, -13.490234375, -12.6328125, -11.775390625, -10.91796875, -10.060546875, -9.203125, -8.345703125, -7.48828125, -6.630859375, -5.7734375, -4.916015625, -4.05859375, -3.201171875, -2.34375, -1.486328125, -0.62890625, 0.228515625, 1.0859375, 1.943359375, 2.80078125, 3.658203125, 4.515625, 5.373046875, 6.23046875, 7.087890625, 7.9453125, 8.802734375, 9.66015625, 10.517578125, 11.375, 12.232421875, 13.08984375, 13.947265625, 14.8046875, 15.662109375, 16.51953125, 17.376953125, 18.234375, 19.091796875, 19.94921875, 20.806640625, 21.6640625, 22.521484375, 23.37890625, 24.236328125, 25.09375, 25.951171875, 26.80859375, 27.666015625, 28.5234375, 29.380859375, 30.23828125, 31.095703125, 31.953125, 32.810546875, 33.66796875, 34.525390625, 35.3828125, 36.240234375, 37.09765625, 37.955078125, 38.8125]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 52.0, 519.0, 401.0, 41.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-192.8626251220703, -188.92396545410156, -184.98529052734375, -181.046630859375, -177.10797119140625, -173.16929626464844, -169.2306365966797, -165.29196166992188, -161.35330200195312, -157.41464233398438, -153.47596740722656, -149.5373077392578, -145.5986328125, -141.65997314453125, -137.7213134765625, -133.7826385498047, -129.84397888183594, -125.90531158447266, -121.96664428710938, -118.02798461914062, -114.08931732177734, -110.15065002441406, -106.21199035644531, -102.27332305908203, -98.33465576171875, -94.39598846435547, -90.45732116699219, -86.51866149902344, -82.57999420166016, -78.64132690429688, -74.70266723632812, -70.76399993896484, -66.8253402709961, -62.88667297363281, -58.9480094909668, -55.00934600830078, -51.0706787109375, -47.13201141357422, -43.1933479309082, -39.25468444824219, -35.316017150878906, -31.377351760864258, -27.43868637084961, -23.50002098083496, -19.561355590820312, -15.622690200805664, -11.684024810791016, -7.745359420776367, -3.8066940307617188, 0.1319713592529297, 4.070636749267578, 8.009302139282227, 11.947967529296875, 15.886632919311523, 19.825298309326172, 23.76396369934082, 27.70262908935547, 31.641294479370117, 35.579959869384766, 39.51862335205078, 43.45729064941406, 47.395957946777344, 51.33462142944336, 55.273284912109375, 59.211952209472656]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 1.0, 7.0, 4.0, 9.0, 11.0, 12.0, 12.0, 12.0, 19.0, 33.0, 35.0, 36.0, 20.0, 42.0, 39.0, 37.0, 41.0, 47.0, 48.0, 34.0, 50.0, 53.0, 39.0, 43.0, 52.0, 29.0, 31.0, 33.0, 18.0, 31.0, 25.0, 15.0, 12.0, 14.0, 9.0, 10.0, 7.0, 9.0, 8.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-25.860363006591797, -25.138200759887695, -24.416038513183594, -23.693878173828125, -22.971715927124023, -22.249553680419922, -21.52739143371582, -20.80522918701172, -20.08306884765625, -19.36090660095215, -18.638744354248047, -17.916584014892578, -17.194421768188477, -16.472259521484375, -15.750097274780273, -15.027935981750488, -14.305773735046387, -13.583611488342285, -12.8614501953125, -12.139287948608398, -11.417126655578613, -10.694964408874512, -9.972803115844727, -9.250640869140625, -8.528478622436523, -7.80631685256958, -7.084155082702637, -6.361992835998535, -5.63983154296875, -4.917669296264648, -4.195507526397705, -3.4733457565307617, -2.7511844635009766, -2.029022693634033, -1.3068608045578003, -0.5846989154815674, 0.13746285438537598, 0.8596246242523193, 1.5817866325378418, 2.303948402404785, 3.0261101722717285, 3.748271942138672, 4.470433712005615, 5.192595481872559, 5.91475772857666, 6.636919021606445, 7.359081268310547, 8.081243515014648, 8.803404808044434, 9.525567054748535, 10.24772834777832, 10.969890594482422, 11.692051887512207, 12.414214134216309, 13.136375427246094, 13.858537673950195, 14.580699920654297, 15.302862167358398, 16.0250244140625, 16.74718475341797, 17.46934700012207, 18.191509246826172, 18.913671493530273, 19.635833740234375, 20.357994079589844]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 7.0, 6.0, 4.0, 8.0, 5.0, 6.0, 13.0, 15.0, 13.0, 17.0, 17.0, 23.0, 38.0, 36.0, 48.0, 49.0, 38.0, 35.0, 53.0, 48.0, 45.0, 37.0, 31.0, 34.0, 35.0, 29.0, 33.0, 41.0, 44.0, 24.0, 30.0, 26.0, 19.0, 19.0, 23.0, 13.0, 8.0, 10.0, 3.0, 8.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.51171875, -4.388824462890625, -4.26593017578125, -4.143035888671875, -4.0201416015625, -3.897247314453125, -3.77435302734375, -3.651458740234375, -3.528564453125, -3.405670166015625, -3.28277587890625, -3.159881591796875, -3.0369873046875, -2.914093017578125, -2.79119873046875, -2.668304443359375, -2.54541015625, -2.422515869140625, -2.29962158203125, -2.176727294921875, -2.0538330078125, -1.930938720703125, -1.80804443359375, -1.685150146484375, -1.562255859375, -1.439361572265625, -1.31646728515625, -1.193572998046875, -1.0706787109375, -0.947784423828125, -0.82489013671875, -0.701995849609375, -0.5791015625, -0.456207275390625, -0.33331298828125, -0.210418701171875, -0.0875244140625, 0.035369873046875, 0.15826416015625, 0.281158447265625, 0.404052734375, 0.526947021484375, 0.64984130859375, 0.772735595703125, 0.8956298828125, 1.018524169921875, 1.14141845703125, 1.264312744140625, 1.38720703125, 1.510101318359375, 1.63299560546875, 1.755889892578125, 1.8787841796875, 2.001678466796875, 2.12457275390625, 2.247467041015625, 2.370361328125, 2.493255615234375, 2.61614990234375, 2.739044189453125, 2.8619384765625, 2.984832763671875, 3.10772705078125, 3.230621337890625, 3.353515625]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 11.0, 16.0, 20.0, 18.0, 31.0, 68.0, 94.0, 124.0, 223.0, 308.0, 491.0, 591.0, 1013.0, 1415.0, 2239.0, 3340.0, 5172.0, 8046.0, 12707.0, 20244.0, 34400.0, 60229.0, 108519.0, 227893.0, 269785.0, 125269.0, 66140.0, 38119.0, 22790.0, 13873.0, 8703.0, 5658.0, 3721.0, 2397.0, 1582.0, 1091.0, 746.0, 491.0, 327.0, 233.0, 118.0, 112.0, 50.0, 55.0, 28.0, 22.0, 22.0, 7.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.7119140625, -0.6904067993164062, -0.6688995361328125, -0.6473922729492188, -0.625885009765625, -0.6043777465820312, -0.5828704833984375, -0.5613632202148438, -0.53985595703125, -0.5183486938476562, -0.4968414306640625, -0.47533416748046875, -0.453826904296875, -0.43231964111328125, -0.4108123779296875, -0.38930511474609375, -0.3677978515625, -0.34629058837890625, -0.3247833251953125, -0.30327606201171875, -0.281768798828125, -0.26026153564453125, -0.2387542724609375, -0.21724700927734375, -0.19573974609375, -0.17423248291015625, -0.1527252197265625, -0.13121795654296875, -0.109710693359375, -0.08820343017578125, -0.0666961669921875, -0.04518890380859375, -0.023681640625, -0.00217437744140625, 0.0193328857421875, 0.04084014892578125, 0.062347412109375, 0.08385467529296875, 0.1053619384765625, 0.12686920166015625, 0.14837646484375, 0.16988372802734375, 0.1913909912109375, 0.21289825439453125, 0.234405517578125, 0.25591278076171875, 0.2774200439453125, 0.29892730712890625, 0.3204345703125, 0.34194183349609375, 0.3634490966796875, 0.38495635986328125, 0.406463623046875, 0.42797088623046875, 0.4494781494140625, 0.47098541259765625, 0.49249267578125, 0.5139999389648438, 0.5355072021484375, 0.5570144653320312, 0.578521728515625, 0.6000289916992188, 0.6215362548828125, 0.6430435180664062, 0.66455078125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 4.0, 9.0, 6.0, 5.0, 8.0, 10.0, 9.0, 16.0, 12.0, 15.0, 16.0, 32.0, 18.0, 22.0, 27.0, 35.0, 32.0, 36.0, 34.0, 44.0, 37.0, 30.0, 1072.0, 35.0, 37.0, 39.0, 28.0, 38.0, 29.0, 29.0, 32.0, 27.0, 22.0, 20.0, 20.0, 23.0, 18.0, 12.0, 15.0, 18.0, 8.0, 8.0, 10.0, 5.0, 5.0, 6.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0], "bins": [-2.1328125, -2.067962646484375, -2.00311279296875, -1.938262939453125, -1.8734130859375, -1.808563232421875, -1.74371337890625, -1.678863525390625, -1.614013671875, -1.549163818359375, -1.48431396484375, -1.419464111328125, -1.3546142578125, -1.289764404296875, -1.22491455078125, -1.160064697265625, -1.09521484375, -1.030364990234375, -0.96551513671875, -0.900665283203125, -0.8358154296875, -0.770965576171875, -0.70611572265625, -0.641265869140625, -0.576416015625, -0.511566162109375, -0.44671630859375, -0.381866455078125, -0.3170166015625, -0.252166748046875, -0.18731689453125, -0.122467041015625, -0.0576171875, 0.007232666015625, 0.07208251953125, 0.136932373046875, 0.2017822265625, 0.266632080078125, 0.33148193359375, 0.396331787109375, 0.461181640625, 0.526031494140625, 0.59088134765625, 0.655731201171875, 0.7205810546875, 0.785430908203125, 0.85028076171875, 0.915130615234375, 0.97998046875, 1.044830322265625, 1.10968017578125, 1.174530029296875, 1.2393798828125, 1.304229736328125, 1.36907958984375, 1.433929443359375, 1.498779296875, 1.563629150390625, 1.62847900390625, 1.693328857421875, 1.7581787109375, 1.823028564453125, 1.88787841796875, 1.952728271484375, 2.017578125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 4.0, 7.0, 8.0, 8.0, 10.0, 29.0, 48.0, 67.0, 69.0, 101.0, 193.0, 261.0, 374.0, 521.0, 735.0, 1092.0, 1587.0, 2173.0, 3001.0, 4478.0, 6365.0, 9204.0, 14080.0, 20772.0, 32225.0, 52201.0, 87497.0, 170813.0, 1333718.0, 143218.0, 77321.0, 46323.0, 29155.0, 18954.0, 12593.0, 8440.0, 5884.0, 4102.0, 2749.0, 2101.0, 1400.0, 980.0, 687.0, 475.0, 373.0, 256.0, 157.0, 102.0, 72.0, 62.0, 34.0, 25.0, 16.0, 7.0, 10.0, 3.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.57421875, -0.556488037109375, -0.53875732421875, -0.521026611328125, -0.5032958984375, -0.485565185546875, -0.46783447265625, -0.450103759765625, -0.432373046875, -0.414642333984375, -0.39691162109375, -0.379180908203125, -0.3614501953125, -0.343719482421875, -0.32598876953125, -0.308258056640625, -0.29052734375, -0.272796630859375, -0.25506591796875, -0.237335205078125, -0.2196044921875, -0.201873779296875, -0.18414306640625, -0.166412353515625, -0.148681640625, -0.130950927734375, -0.11322021484375, -0.095489501953125, -0.0777587890625, -0.060028076171875, -0.04229736328125, -0.024566650390625, -0.0068359375, 0.010894775390625, 0.02862548828125, 0.046356201171875, 0.0640869140625, 0.081817626953125, 0.09954833984375, 0.117279052734375, 0.135009765625, 0.152740478515625, 0.17047119140625, 0.188201904296875, 0.2059326171875, 0.223663330078125, 0.24139404296875, 0.259124755859375, 0.27685546875, 0.294586181640625, 0.31231689453125, 0.330047607421875, 0.3477783203125, 0.365509033203125, 0.38323974609375, 0.400970458984375, 0.418701171875, 0.436431884765625, 0.45416259765625, 0.471893310546875, 0.4896240234375, 0.507354736328125, 0.52508544921875, 0.542816162109375, 0.560546875]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 7.0, 2.0, 1.0, 2.0, 5.0, 10.0, 15.0, 18.0, 14.0, 19.0, 13.0, 26.0, 28.0, 33.0, 40.0, 43.0, 50.0, 43.0, 70.0, 66.0, 67.0, 50.0, 41.0, 59.0, 45.0, 57.0, 34.0, 32.0, 17.0, 22.0, 12.0, 10.0, 10.0, 5.0, 12.0, 9.0, 6.0, 3.0, 3.0, 3.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0004227161407470703, -0.0004104338586330414, -0.00039815157651901245, -0.0003858692944049835, -0.0003735870122909546, -0.00036130473017692566, -0.00034902244806289673, -0.0003367401659488678, -0.00032445788383483887, -0.00031217560172080994, -0.000299893319606781, -0.0002876110374927521, -0.00027532875537872314, -0.0002630464732646942, -0.0002507641911506653, -0.00023848190903663635, -0.00022619962692260742, -0.0002139173448085785, -0.00020163506269454956, -0.00018935278058052063, -0.0001770704984664917, -0.00016478821635246277, -0.00015250593423843384, -0.0001402236521244049, -0.00012794137001037598, -0.00011565908789634705, -0.00010337680578231812, -9.109452366828918e-05, -7.881224155426025e-05, -6.652995944023132e-05, -5.424767732620239e-05, -4.196539521217346e-05, -2.968311309814453e-05, -1.74008309841156e-05, -5.11854887008667e-06, 7.163733243942261e-06, 1.944601535797119e-05, 3.172829747200012e-05, 4.401057958602905e-05, 5.6292861700057983e-05, 6.857514381408691e-05, 8.085742592811584e-05, 9.313970804214478e-05, 0.0001054219901561737, 0.00011770427227020264, 0.00012998655438423157, 0.0001422688364982605, 0.00015455111861228943, 0.00016683340072631836, 0.0001791156828403473, 0.00019139796495437622, 0.00020368024706840515, 0.00021596252918243408, 0.000228244811296463, 0.00024052709341049194, 0.0002528093755245209, 0.0002650916576385498, 0.00027737393975257874, 0.00028965622186660767, 0.0003019385039806366, 0.00031422078609466553, 0.00032650306820869446, 0.0003387853503227234, 0.0003510676324367523, 0.00036334991455078125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 3.0, 4.0, 8.0, 8.0, 10.0, 13.0, 12.0, 18.0, 18.0, 22.0, 30.0, 39.0, 63.0, 74.0, 114.0, 179.0, 312.0, 554.0, 2123.0, 1018539.0, 24327.0, 921.0, 378.0, 210.0, 148.0, 88.0, 79.0, 57.0, 36.0, 30.0, 27.0, 28.0, 15.0, 21.0, 13.0, 10.0, 7.0, 3.0, 2.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00717926025390625, -0.0069200992584228516, -0.006660938262939453, -0.006401777267456055, -0.006142616271972656, -0.005883455276489258, -0.005624294281005859, -0.005365133285522461, -0.0051059722900390625, -0.004846811294555664, -0.004587650299072266, -0.004328489303588867, -0.004069328308105469, -0.0038101673126220703, -0.003551006317138672, -0.0032918453216552734, -0.003032684326171875, -0.0027735233306884766, -0.002514362335205078, -0.0022552013397216797, -0.0019960403442382812, -0.0017368793487548828, -0.0014777183532714844, -0.001218557357788086, -0.0009593963623046875, -0.0007002353668212891, -0.0004410743713378906, -0.0001819133758544922, 7.724761962890625e-05, 0.0003364086151123047, 0.0005955696105957031, 0.0008547306060791016, 0.0011138916015625, 0.0013730525970458984, 0.0016322135925292969, 0.0018913745880126953, 0.0021505355834960938, 0.002409696578979492, 0.0026688575744628906, 0.002928018569946289, 0.0031871795654296875, 0.003446340560913086, 0.0037055015563964844, 0.003964662551879883, 0.004223823547363281, 0.00448298454284668, 0.004742145538330078, 0.0050013065338134766, 0.005260467529296875, 0.0055196285247802734, 0.005778789520263672, 0.00603795051574707, 0.006297111511230469, 0.006556272506713867, 0.006815433502197266, 0.007074594497680664, 0.0073337554931640625, 0.007592916488647461, 0.00785207748413086, 0.008111238479614258, 0.008370399475097656, 0.008629560470581055, 0.008888721466064453, 0.009147882461547852, 0.00940704345703125]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 12.0, 51.0, 151.0, 318.0, 270.0, 146.0, 55.0, 8.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005862560938112438, -0.0005699560279026628, -0.0005536559037864208, -0.0005373557796701789, -0.0005210557137615979, -0.0005047556478530169, -0.0004884555237367749, -0.00047215542872436345, -0.00045585533371195197, -0.0004395552386995405, -0.000423255143687129, -0.00040695504867471755, -0.00039065495366230607, -0.0003743548586498946, -0.0003580547636374831, -0.00034175466862507164, -0.00032545457361266017, -0.0003091544786002487, -0.0002928543835878372, -0.00027655428857542574, -0.00026025419356301427, -0.0002439540985506028, -0.00022765400353819132, -0.00021135390852577984, -0.00019505381351336837, -0.0001787537185009569, -0.00016245362348854542, -0.00014615352847613394, -0.00012985343346372247, -0.00011355333845131099, -9.725324343889952e-05, -8.095314842648804e-05, -6.465302431024611e-05, -4.8352929297834635e-05, -3.205283428542316e-05, -1.5752739273011684e-05, 5.473557393997908e-07, 1.6847450751811266e-05, 3.314754576422274e-05, 4.9447640776634216e-05, 6.574773578904569e-05, 8.204783080145717e-05, 9.834792581386864e-05, 0.00011464802082628012, 0.0001309481158386916, 0.00014724821085110307, 0.00016354830586351454, 0.00017984840087592602, 0.0001961484958883375, 0.00021244859090074897, 0.00022874868591316044, 0.0002450487809255719, 0.0002613488759379834, 0.00027764897095039487, 0.00029394906596280634, 0.0003102491609752178, 0.0003265492559876293, 0.00034284935100004077, 0.00035914944601245224, 0.0003754495410248637, 0.0003917496360372752, 0.00040804973104968667, 0.00042434982606209815, 0.0004406499210745096, 0.0004569500160869211]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 5.0, 9.0, 10.0, 11.0, 11.0, 21.0, 28.0, 19.0, 31.0, 34.0, 44.0, 37.0, 48.0, 45.0, 41.0, 38.0, 50.0, 36.0, 49.0, 51.0, 42.0, 42.0, 54.0, 44.0, 18.0, 21.0, 30.0, 22.0, 23.0, 17.0, 17.0, 12.0, 12.0, 7.0, 7.0, 6.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00025659799575805664, -0.0002493634819984436, -0.00024212896823883057, -0.00023489445447921753, -0.0002276599407196045, -0.00022042542695999146, -0.00021319091320037842, -0.00020595639944076538, -0.00019872188568115234, -0.0001914873719215393, -0.00018425285816192627, -0.00017701834440231323, -0.0001697838306427002, -0.00016254931688308716, -0.00015531480312347412, -0.00014808028936386108, -0.00014084577560424805, -0.000133611261844635, -0.00012637674808502197, -0.00011914223432540894, -0.0001119077205657959, -0.00010467320680618286, -9.743869304656982e-05, -9.020417928695679e-05, -8.296966552734375e-05, -7.573515176773071e-05, -6.850063800811768e-05, -6.126612424850464e-05, -5.40316104888916e-05, -4.6797096729278564e-05, -3.956258296966553e-05, -3.232806921005249e-05, -2.5093555450439453e-05, -1.7859041690826416e-05, -1.0624527931213379e-05, -3.390014171600342e-06, 3.844499588012695e-06, 1.1079013347625732e-05, 1.831352710723877e-05, 2.5548040866851807e-05, 3.2782554626464844e-05, 4.001706838607788e-05, 4.725158214569092e-05, 5.4486095905303955e-05, 6.172060966491699e-05, 6.895512342453003e-05, 7.618963718414307e-05, 8.34241509437561e-05, 9.065866470336914e-05, 9.789317846298218e-05, 0.00010512769222259521, 0.00011236220598220825, 0.00011959671974182129, 0.00012683123350143433, 0.00013406574726104736, 0.0001413002610206604, 0.00014853477478027344, 0.00015576928853988647, 0.0001630038022994995, 0.00017023831605911255, 0.00017747282981872559, 0.00018470734357833862, 0.00019194185733795166, 0.0001991763710975647, 0.00020641088485717773]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 7.0, 6.0, 4.0, 8.0, 5.0, 6.0, 13.0, 15.0, 13.0, 17.0, 17.0, 23.0, 38.0, 36.0, 48.0, 49.0, 38.0, 35.0, 53.0, 48.0, 45.0, 37.0, 31.0, 34.0, 35.0, 29.0, 33.0, 41.0, 44.0, 25.0, 29.0, 26.0, 19.0, 19.0, 23.0, 13.0, 8.0, 10.0, 3.0, 8.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.51171875, -4.388824462890625, -4.26593017578125, -4.143035888671875, -4.0201416015625, -3.897247314453125, -3.77435302734375, -3.651458740234375, -3.528564453125, -3.405670166015625, -3.28277587890625, -3.159881591796875, -3.0369873046875, -2.914093017578125, -2.79119873046875, -2.668304443359375, -2.54541015625, -2.422515869140625, -2.29962158203125, -2.176727294921875, -2.0538330078125, -1.930938720703125, -1.80804443359375, -1.685150146484375, -1.562255859375, -1.439361572265625, -1.31646728515625, -1.193572998046875, -1.0706787109375, -0.947784423828125, -0.82489013671875, -0.701995849609375, -0.5791015625, -0.456207275390625, -0.33331298828125, -0.210418701171875, -0.0875244140625, 0.035369873046875, 0.15826416015625, 0.281158447265625, 0.404052734375, 0.526947021484375, 0.64984130859375, 0.772735595703125, 0.8956298828125, 1.018524169921875, 1.14141845703125, 1.264312744140625, 1.38720703125, 1.510101318359375, 1.63299560546875, 1.755889892578125, 1.8787841796875, 2.001678466796875, 2.12457275390625, 2.247467041015625, 2.370361328125, 2.493255615234375, 2.61614990234375, 2.739044189453125, 2.8619384765625, 2.984832763671875, 3.10772705078125, 3.230621337890625, 3.353515625]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 2.0, 1.0, 8.0, 5.0, 14.0, 13.0, 16.0, 18.0, 22.0, 36.0, 56.0, 60.0, 102.0, 112.0, 166.0, 246.0, 334.0, 644.0, 2070.0, 9036.0, 46324.0, 310888.0, 558504.0, 96448.0, 17400.0, 3628.0, 942.0, 450.0, 278.0, 188.0, 134.0, 94.0, 80.0, 64.0, 34.0, 36.0, 20.0, 21.0, 19.0, 12.0, 12.0, 4.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 3.0], "bins": [-7.9609375, -7.7469482421875, -7.532958984375, -7.3189697265625, -7.10498046875, -6.8909912109375, -6.677001953125, -6.4630126953125, -6.2490234375, -6.0350341796875, -5.821044921875, -5.6070556640625, -5.39306640625, -5.1790771484375, -4.965087890625, -4.7510986328125, -4.537109375, -4.3231201171875, -4.109130859375, -3.8951416015625, -3.68115234375, -3.4671630859375, -3.253173828125, -3.0391845703125, -2.8251953125, -2.6112060546875, -2.397216796875, -2.1832275390625, -1.96923828125, -1.7552490234375, -1.541259765625, -1.3272705078125, -1.11328125, -0.8992919921875, -0.685302734375, -0.4713134765625, -0.25732421875, -0.0433349609375, 0.170654296875, 0.3846435546875, 0.5986328125, 0.8126220703125, 1.026611328125, 1.2406005859375, 1.45458984375, 1.6685791015625, 1.882568359375, 2.0965576171875, 2.310546875, 2.5245361328125, 2.738525390625, 2.9525146484375, 3.16650390625, 3.3804931640625, 3.594482421875, 3.8084716796875, 4.0224609375, 4.2364501953125, 4.450439453125, 4.6644287109375, 4.87841796875, 5.0924072265625, 5.306396484375, 5.5203857421875, 5.734375]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 4.0, 4.0, 3.0, 1.0, 12.0, 8.0, 9.0, 16.0, 15.0, 15.0, 13.0, 13.0, 17.0, 21.0, 29.0, 24.0, 34.0, 34.0, 43.0, 47.0, 58.0, 77.0, 211.0, 1548.0, 288.0, 97.0, 75.0, 39.0, 47.0, 28.0, 28.0, 31.0, 30.0, 22.0, 17.0, 14.0, 19.0, 15.0, 12.0, 11.0, 9.0, 5.0, 2.0, 4.0, 3.0, 3.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-14.515625, -14.108154296875, -13.70068359375, -13.293212890625, -12.8857421875, -12.478271484375, -12.07080078125, -11.663330078125, -11.255859375, -10.848388671875, -10.44091796875, -10.033447265625, -9.6259765625, -9.218505859375, -8.81103515625, -8.403564453125, -7.99609375, -7.588623046875, -7.18115234375, -6.773681640625, -6.3662109375, -5.958740234375, -5.55126953125, -5.143798828125, -4.736328125, -4.328857421875, -3.92138671875, -3.513916015625, -3.1064453125, -2.698974609375, -2.29150390625, -1.884033203125, -1.4765625, -1.069091796875, -0.66162109375, -0.254150390625, 0.1533203125, 0.560791015625, 0.96826171875, 1.375732421875, 1.783203125, 2.190673828125, 2.59814453125, 3.005615234375, 3.4130859375, 3.820556640625, 4.22802734375, 4.635498046875, 5.04296875, 5.450439453125, 5.85791015625, 6.265380859375, 6.6728515625, 7.080322265625, 7.48779296875, 7.895263671875, 8.302734375, 8.710205078125, 9.11767578125, 9.525146484375, 9.9326171875, 10.340087890625, 10.74755859375, 11.155029296875, 11.5625]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 5.0, 6.0, 9.0, 9.0, 12.0, 12.0, 18.0, 22.0, 26.0, 35.0, 48.0, 40.0, 67.0, 90.0, 113.0, 193.0, 319.0, 765.0, 2632.0, 212936.0, 2919316.0, 6657.0, 1047.0, 419.0, 276.0, 161.0, 125.0, 52.0, 56.0, 42.0, 33.0, 28.0, 25.0, 17.0, 23.0, 21.0, 10.0, 6.0, 12.0, 4.0, 4.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-29.3125, -28.37255859375, -27.4326171875, -26.49267578125, -25.552734375, -24.61279296875, -23.6728515625, -22.73291015625, -21.79296875, -20.85302734375, -19.9130859375, -18.97314453125, -18.033203125, -17.09326171875, -16.1533203125, -15.21337890625, -14.2734375, -13.33349609375, -12.3935546875, -11.45361328125, -10.513671875, -9.57373046875, -8.6337890625, -7.69384765625, -6.75390625, -5.81396484375, -4.8740234375, -3.93408203125, -2.994140625, -2.05419921875, -1.1142578125, -0.17431640625, 0.765625, 1.70556640625, 2.6455078125, 3.58544921875, 4.525390625, 5.46533203125, 6.4052734375, 7.34521484375, 8.28515625, 9.22509765625, 10.1650390625, 11.10498046875, 12.044921875, 12.98486328125, 13.9248046875, 14.86474609375, 15.8046875, 16.74462890625, 17.6845703125, 18.62451171875, 19.564453125, 20.50439453125, 21.4443359375, 22.38427734375, 23.32421875, 24.26416015625, 25.2041015625, 26.14404296875, 27.083984375, 28.02392578125, 28.9638671875, 29.90380859375, 30.84375]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 39.0, 301.0, 507.0, 144.0, 21.0, 2.0], "bins": [-116.11796569824219, -114.19007873535156, -112.26219177246094, -110.33430480957031, -108.40641784667969, -106.47853088378906, -104.55064392089844, -102.62275695800781, -100.69486999511719, -98.76698303222656, -96.83909606933594, -94.91120910644531, -92.98332214355469, -91.05543518066406, -89.12754821777344, -87.19966125488281, -85.27177429199219, -83.34388732910156, -81.41600036621094, -79.48811340332031, -77.56022644042969, -75.63233947753906, -73.70445251464844, -71.77656555175781, -69.84867858886719, -67.92079162597656, -65.99290466308594, -64.06501770019531, -62.13713073730469, -60.20924377441406, -58.28135681152344, -56.35346984863281, -54.42558288574219, -52.49769592285156, -50.56980895996094, -48.64192199707031, -46.71403503417969, -44.78614807128906, -42.85826110839844, -40.93037414550781, -39.00248718261719, -37.07460021972656, -35.14671325683594, -33.21882629394531, -31.290939331054688, -29.363052368164062, -27.435165405273438, -25.507278442382812, -23.579391479492188, -21.651504516601562, -19.723617553710938, -17.795730590820312, -15.867843627929688, -13.939956665039062, -12.012069702148438, -10.084182739257812, -8.156296730041504, -6.228409767150879, -4.300522804260254, -2.372635841369629, -0.4447488784790039, 1.483138084411621, 3.411025047302246, 5.338912010192871, 7.266798973083496]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 3.0, 6.0, 2.0, 3.0, 7.0, 6.0, 5.0, 8.0, 8.0, 2.0, 10.0, 6.0, 17.0, 9.0, 18.0, 19.0, 17.0, 22.0, 35.0, 36.0, 26.0, 36.0, 34.0, 19.0, 36.0, 44.0, 48.0, 37.0, 42.0, 37.0, 33.0, 41.0, 32.0, 37.0, 22.0, 30.0, 26.0, 27.0, 13.0, 21.0, 19.0, 17.0, 15.0, 18.0, 11.0, 6.0, 8.0, 11.0, 8.0, 8.0, 1.0, 2.0, 5.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-25.790145874023438, -24.929243087768555, -24.068342208862305, -23.207439422607422, -22.346538543701172, -21.48563575744629, -20.624732971191406, -19.763832092285156, -18.902929306030273, -18.04202651977539, -17.18112564086914, -16.320222854614258, -15.459321022033691, -14.598419189453125, -13.737516403198242, -12.876614570617676, -12.01571273803711, -11.154810905456543, -10.293909072875977, -9.433006286621094, -8.572104454040527, -7.711202621459961, -6.850300312042236, -5.989398002624512, -5.128496170043945, -4.267594337463379, -3.4066920280456543, -2.545789957046509, -1.6848878860473633, -0.8239860534667969, 0.036916255950927734, 0.8978185653686523, 1.7587223052978516, 2.619624376296997, 3.4805264472961426, 4.341428756713867, 5.202330589294434, 6.063232421875, 6.924134731292725, 7.785037040710449, 8.645938873291016, 9.506840705871582, 10.367742538452148, 11.228645324707031, 12.089547157287598, 12.950448989868164, 13.811351776123047, 14.672253608703613, 15.53315544128418, 16.394058227539062, 17.254959106445312, 18.115861892700195, 18.976764678955078, 19.837665557861328, 20.69856834411621, 21.559471130371094, 22.420372009277344, 23.281274795532227, 24.142175674438477, 25.00307846069336, 25.86397933959961, 26.724882125854492, 27.585784912109375, 28.446685791015625, 29.307588577270508]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 3.0, 6.0, 9.0, 2.0, 10.0, 12.0, 9.0, 13.0, 13.0, 17.0, 21.0, 25.0, 34.0, 46.0, 40.0, 42.0, 43.0, 50.0, 40.0, 41.0, 47.0, 33.0, 44.0, 42.0, 40.0, 28.0, 34.0, 36.0, 33.0, 33.0, 26.0, 37.0, 20.0, 19.0, 8.0, 11.0, 16.0, 4.0, 4.0, 6.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.9453125, -4.806671142578125, -4.66802978515625, -4.529388427734375, -4.3907470703125, -4.252105712890625, -4.11346435546875, -3.974822998046875, -3.836181640625, -3.697540283203125, -3.55889892578125, -3.420257568359375, -3.2816162109375, -3.142974853515625, -3.00433349609375, -2.865692138671875, -2.72705078125, -2.588409423828125, -2.44976806640625, -2.311126708984375, -2.1724853515625, -2.033843994140625, -1.89520263671875, -1.756561279296875, -1.617919921875, -1.479278564453125, -1.34063720703125, -1.201995849609375, -1.0633544921875, -0.924713134765625, -0.78607177734375, -0.647430419921875, -0.5087890625, -0.370147705078125, -0.23150634765625, -0.092864990234375, 0.0457763671875, 0.184417724609375, 0.32305908203125, 0.461700439453125, 0.600341796875, 0.738983154296875, 0.87762451171875, 1.016265869140625, 1.1549072265625, 1.293548583984375, 1.43218994140625, 1.570831298828125, 1.70947265625, 1.848114013671875, 1.98675537109375, 2.125396728515625, 2.2640380859375, 2.402679443359375, 2.54132080078125, 2.679962158203125, 2.818603515625, 2.957244873046875, 3.09588623046875, 3.234527587890625, 3.3731689453125, 3.511810302734375, 3.65045166015625, 3.789093017578125, 3.927734375]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 1.0, 6.0, 6.0, 7.0, 9.0, 10.0, 19.0, 13.0, 19.0, 29.0, 27.0, 41.0, 57.0, 82.0, 104.0, 168.0, 432.0, 1369.0, 22604.0, 1271267.0, 2771432.0, 122150.0, 3113.0, 607.0, 236.0, 123.0, 74.0, 52.0, 41.0, 43.0, 29.0, 28.0, 19.0, 21.0, 12.0, 10.0, 9.0, 8.0, 3.0, 5.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.859375, -11.490966796875, -11.12255859375, -10.754150390625, -10.3857421875, -10.017333984375, -9.64892578125, -9.280517578125, -8.912109375, -8.543701171875, -8.17529296875, -7.806884765625, -7.4384765625, -7.070068359375, -6.70166015625, -6.333251953125, -5.96484375, -5.596435546875, -5.22802734375, -4.859619140625, -4.4912109375, -4.122802734375, -3.75439453125, -3.385986328125, -3.017578125, -2.649169921875, -2.28076171875, -1.912353515625, -1.5439453125, -1.175537109375, -0.80712890625, -0.438720703125, -0.0703125, 0.298095703125, 0.66650390625, 1.034912109375, 1.4033203125, 1.771728515625, 2.14013671875, 2.508544921875, 2.876953125, 3.245361328125, 3.61376953125, 3.982177734375, 4.3505859375, 4.718994140625, 5.08740234375, 5.455810546875, 5.82421875, 6.192626953125, 6.56103515625, 6.929443359375, 7.2978515625, 7.666259765625, 8.03466796875, 8.403076171875, 8.771484375, 9.139892578125, 9.50830078125, 9.876708984375, 10.2451171875, 10.613525390625, 10.98193359375, 11.350341796875, 11.71875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 4.0, 9.0, 8.0, 15.0, 21.0, 32.0, 29.0, 64.0, 85.0, 112.0, 159.0, 239.0, 303.0, 384.0, 504.0, 502.0, 413.0, 350.0, 241.0, 187.0, 132.0, 90.0, 56.0, 37.0, 28.0, 12.0, 15.0, 10.0, 4.0, 8.0, 6.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.734375, -7.52655029296875, -7.3187255859375, -7.11090087890625, -6.903076171875, -6.69525146484375, -6.4874267578125, -6.27960205078125, -6.07177734375, -5.86395263671875, -5.6561279296875, -5.44830322265625, -5.240478515625, -5.03265380859375, -4.8248291015625, -4.61700439453125, -4.4091796875, -4.20135498046875, -3.9935302734375, -3.78570556640625, -3.577880859375, -3.37005615234375, -3.1622314453125, -2.95440673828125, -2.74658203125, -2.53875732421875, -2.3309326171875, -2.12310791015625, -1.915283203125, -1.70745849609375, -1.4996337890625, -1.29180908203125, -1.083984375, -0.87615966796875, -0.6683349609375, -0.46051025390625, -0.252685546875, -0.04486083984375, 0.1629638671875, 0.37078857421875, 0.57861328125, 0.78643798828125, 0.9942626953125, 1.20208740234375, 1.409912109375, 1.61773681640625, 1.8255615234375, 2.03338623046875, 2.2412109375, 2.44903564453125, 2.6568603515625, 2.86468505859375, 3.072509765625, 3.28033447265625, 3.4881591796875, 3.69598388671875, 3.90380859375, 4.11163330078125, 4.3194580078125, 4.52728271484375, 4.735107421875, 4.94293212890625, 5.1507568359375, 5.35858154296875, 5.56640625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 6.0, 7.0, 16.0, 14.0, 27.0, 22.0, 48.0, 63.0, 84.0, 120.0, 119.0, 258.0, 344.0, 598.0, 1553.0, 9364.0, 340108.0, 3670567.0, 161856.0, 6065.0, 1301.0, 557.0, 341.0, 242.0, 158.0, 130.0, 90.0, 53.0, 43.0, 38.0, 26.0, 12.0, 11.0, 13.0, 9.0, 7.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.5859375, -14.0726318359375, -13.559326171875, -13.0460205078125, -12.53271484375, -12.0194091796875, -11.506103515625, -10.9927978515625, -10.4794921875, -9.9661865234375, -9.452880859375, -8.9395751953125, -8.42626953125, -7.9129638671875, -7.399658203125, -6.8863525390625, -6.373046875, -5.8597412109375, -5.346435546875, -4.8331298828125, -4.31982421875, -3.8065185546875, -3.293212890625, -2.7799072265625, -2.2666015625, -1.7532958984375, -1.239990234375, -0.7266845703125, -0.21337890625, 0.2999267578125, 0.813232421875, 1.3265380859375, 1.83984375, 2.3531494140625, 2.866455078125, 3.3797607421875, 3.89306640625, 4.4063720703125, 4.919677734375, 5.4329833984375, 5.9462890625, 6.4595947265625, 6.972900390625, 7.4862060546875, 7.99951171875, 8.5128173828125, 9.026123046875, 9.5394287109375, 10.052734375, 10.5660400390625, 11.079345703125, 11.5926513671875, 12.10595703125, 12.6192626953125, 13.132568359375, 13.6458740234375, 14.1591796875, 14.6724853515625, 15.185791015625, 15.6990966796875, 16.21240234375, 16.7257080078125, 17.239013671875, 17.7523193359375, 18.265625]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 9.0, 42.0, 150.0, 266.0, 317.0, 159.0, 50.0, 16.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.89935302734375, -65.1007080078125, -63.30207061767578, -61.5034294128418, -59.70478820800781, -57.90614700317383, -56.107505798339844, -54.30886459350586, -52.510223388671875, -50.71158218383789, -48.912940979003906, -47.11429977416992, -45.31565856933594, -43.51701736450195, -41.71837615966797, -39.919734954833984, -38.12109375, -36.322452545166016, -34.52381134033203, -32.72517013549805, -30.926528930664062, -29.127887725830078, -27.329246520996094, -25.53060531616211, -23.73196029663086, -21.933319091796875, -20.13467788696289, -18.336036682128906, -16.537395477294922, -14.738753318786621, -12.940112113952637, -11.141470909118652, -9.342830657958984, -7.544189453125, -5.745548248291016, -3.946906566619873, -2.1482653617858887, -0.3496236801147461, 1.4490175247192383, 3.2476587295532227, 5.046299934387207, 6.844941139221191, 8.643582344055176, 10.442224502563477, 12.240865707397461, 14.039506912231445, 15.83814811706543, 17.636789321899414, 19.4354305267334, 21.234071731567383, 23.032712936401367, 24.83135414123535, 26.629995346069336, 28.428638458251953, 30.227279663085938, 32.02592086791992, 33.824562072753906, 35.62320327758789, 37.421844482421875, 39.22048568725586, 41.019126892089844, 42.81776809692383, 44.61640930175781, 46.4150505065918, 48.21369171142578]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 8.0, 7.0, 9.0, 14.0, 16.0, 19.0, 29.0, 20.0, 25.0, 20.0, 29.0, 42.0, 32.0, 37.0, 46.0, 41.0, 48.0, 40.0, 40.0, 38.0, 43.0, 39.0, 46.0, 36.0, 28.0, 36.0, 35.0, 33.0, 19.0, 11.0, 19.0, 14.0, 19.0, 14.0, 14.0, 9.0, 10.0, 2.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.433757781982422, -21.74953269958496, -21.065309524536133, -20.381084442138672, -19.696861267089844, -19.012636184692383, -18.328411102294922, -17.644187927246094, -16.959962844848633, -16.275737762451172, -15.591514587402344, -14.907289505004883, -14.223065376281738, -13.538841247558594, -12.854616165161133, -12.170392036437988, -11.486167907714844, -10.8019437789917, -10.117719650268555, -9.433494567871094, -8.74927043914795, -8.065046310424805, -7.380821704864502, -6.696597099304199, -6.012372970581055, -5.32814884185791, -4.643924236297607, -3.959699869155884, -3.27547550201416, -2.5912511348724365, -1.907026767730713, -1.2228021621704102, -0.5385780334472656, 0.145646333694458, 0.8298707008361816, 1.5140950679779053, 2.198319435119629, 2.8825438022613525, 3.566768169403076, 4.250992774963379, 4.935216903686523, 5.619441032409668, 6.303665637969971, 6.987890243530273, 7.672114372253418, 8.356338500976562, 9.040563583374023, 9.724787712097168, 10.409011840820312, 11.093235969543457, 11.777460098266602, 12.461685180664062, 13.145909309387207, 13.830133438110352, 14.514358520507812, 15.198582649230957, 15.882806777954102, 16.567031860351562, 17.25125503540039, 17.93548011779785, 18.619705200195312, 19.30392837524414, 19.9881534576416, 20.672378540039062, 21.35660171508789]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 7.0, 4.0, 3.0, 6.0, 9.0, 10.0, 14.0, 16.0, 17.0, 21.0, 26.0, 19.0, 36.0, 24.0, 33.0, 27.0, 35.0, 40.0, 39.0, 41.0, 38.0, 45.0, 38.0, 53.0, 26.0, 40.0, 29.0, 31.0, 36.0, 36.0, 26.0, 30.0, 22.0, 24.0, 22.0, 13.0, 14.0, 14.0, 12.0, 6.0, 6.0, 6.0, 1.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.98828125, -3.86309814453125, -3.7379150390625, -3.61273193359375, -3.487548828125, -3.36236572265625, -3.2371826171875, -3.11199951171875, -2.98681640625, -2.86163330078125, -2.7364501953125, -2.61126708984375, -2.486083984375, -2.36090087890625, -2.2357177734375, -2.11053466796875, -1.9853515625, -1.86016845703125, -1.7349853515625, -1.60980224609375, -1.484619140625, -1.35943603515625, -1.2342529296875, -1.10906982421875, -0.98388671875, -0.85870361328125, -0.7335205078125, -0.60833740234375, -0.483154296875, -0.35797119140625, -0.2327880859375, -0.10760498046875, 0.017578125, 0.14276123046875, 0.2679443359375, 0.39312744140625, 0.518310546875, 0.64349365234375, 0.7686767578125, 0.89385986328125, 1.01904296875, 1.14422607421875, 1.2694091796875, 1.39459228515625, 1.519775390625, 1.64495849609375, 1.7701416015625, 1.89532470703125, 2.0205078125, 2.14569091796875, 2.2708740234375, 2.39605712890625, 2.521240234375, 2.64642333984375, 2.7716064453125, 2.89678955078125, 3.02197265625, 3.14715576171875, 3.2723388671875, 3.39752197265625, 3.522705078125, 3.64788818359375, 3.7730712890625, 3.89825439453125, 4.0234375]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 7.0, 7.0, 5.0, 9.0, 22.0, 29.0, 39.0, 71.0, 104.0, 126.0, 232.0, 377.0, 617.0, 989.0, 1568.0, 2436.0, 4054.0, 6472.0, 10800.0, 17945.0, 29946.0, 52393.0, 97591.0, 236002.0, 314240.0, 122082.0, 61900.0, 35485.0, 20680.0, 12501.0, 7597.0, 4594.0, 2875.0, 1751.0, 1125.0, 680.0, 448.0, 261.0, 177.0, 119.0, 65.0, 42.0, 35.0, 19.0, 15.0, 14.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.84619140625, -0.8206634521484375, -0.795135498046875, -0.7696075439453125, -0.74407958984375, -0.7185516357421875, -0.693023681640625, -0.6674957275390625, -0.6419677734375, -0.6164398193359375, -0.590911865234375, -0.5653839111328125, -0.53985595703125, -0.5143280029296875, -0.488800048828125, -0.4632720947265625, -0.437744140625, -0.4122161865234375, -0.386688232421875, -0.3611602783203125, -0.33563232421875, -0.3101043701171875, -0.284576416015625, -0.2590484619140625, -0.2335205078125, -0.2079925537109375, -0.182464599609375, -0.1569366455078125, -0.13140869140625, -0.1058807373046875, -0.080352783203125, -0.0548248291015625, -0.029296875, -0.0037689208984375, 0.021759033203125, 0.0472869873046875, 0.07281494140625, 0.0983428955078125, 0.123870849609375, 0.1493988037109375, 0.1749267578125, 0.2004547119140625, 0.225982666015625, 0.2515106201171875, 0.27703857421875, 0.3025665283203125, 0.328094482421875, 0.3536224365234375, 0.379150390625, 0.4046783447265625, 0.430206298828125, 0.4557342529296875, 0.48126220703125, 0.5067901611328125, 0.532318115234375, 0.5578460693359375, 0.5833740234375, 0.6089019775390625, 0.634429931640625, 0.6599578857421875, 0.68548583984375, 0.7110137939453125, 0.736541748046875, 0.7620697021484375, 0.78759765625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 5.0, 3.0, 4.0, 2.0, 6.0, 6.0, 10.0, 9.0, 7.0, 15.0, 11.0, 9.0, 8.0, 13.0, 15.0, 29.0, 31.0, 14.0, 22.0, 29.0, 24.0, 34.0, 25.0, 28.0, 37.0, 38.0, 28.0, 38.0, 1050.0, 32.0, 39.0, 38.0, 37.0, 31.0, 31.0, 38.0, 26.0, 25.0, 20.0, 24.0, 19.0, 11.0, 23.0, 14.0, 13.0, 15.0, 10.0, 12.0, 10.0, 4.0, 2.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.0703125, -2.00360107421875, -1.9368896484375, -1.87017822265625, -1.803466796875, -1.73675537109375, -1.6700439453125, -1.60333251953125, -1.53662109375, -1.46990966796875, -1.4031982421875, -1.33648681640625, -1.269775390625, -1.20306396484375, -1.1363525390625, -1.06964111328125, -1.0029296875, -0.93621826171875, -0.8695068359375, -0.80279541015625, -0.736083984375, -0.66937255859375, -0.6026611328125, -0.53594970703125, -0.46923828125, -0.40252685546875, -0.3358154296875, -0.26910400390625, -0.202392578125, -0.13568115234375, -0.0689697265625, -0.00225830078125, 0.064453125, 0.13116455078125, 0.1978759765625, 0.26458740234375, 0.331298828125, 0.39801025390625, 0.4647216796875, 0.53143310546875, 0.59814453125, 0.66485595703125, 0.7315673828125, 0.79827880859375, 0.864990234375, 0.93170166015625, 0.9984130859375, 1.06512451171875, 1.1318359375, 1.19854736328125, 1.2652587890625, 1.33197021484375, 1.398681640625, 1.46539306640625, 1.5321044921875, 1.59881591796875, 1.66552734375, 1.73223876953125, 1.7989501953125, 1.86566162109375, 1.932373046875, 1.99908447265625, 2.0657958984375, 2.13250732421875, 2.19921875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 5.0, 3.0, 8.0, 11.0, 9.0, 18.0, 39.0, 53.0, 52.0, 103.0, 158.0, 253.0, 330.0, 469.0, 743.0, 1016.0, 1511.0, 2075.0, 3073.0, 4284.0, 6291.0, 9141.0, 13337.0, 19867.0, 30493.0, 47845.0, 78366.0, 142936.0, 1306025.0, 175759.0, 92696.0, 54916.0, 34461.0, 22846.0, 14815.0, 10109.0, 6943.0, 4952.0, 3418.0, 2405.0, 1604.0, 1220.0, 807.0, 516.0, 416.0, 243.0, 163.0, 120.0, 81.0, 53.0, 28.0, 23.0, 16.0, 10.0, 3.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.59814453125, -0.5792465209960938, -0.5603485107421875, -0.5414505004882812, -0.522552490234375, -0.5036544799804688, -0.4847564697265625, -0.46585845947265625, -0.44696044921875, -0.42806243896484375, -0.4091644287109375, -0.39026641845703125, -0.371368408203125, -0.35247039794921875, -0.3335723876953125, -0.31467437744140625, -0.2957763671875, -0.27687835693359375, -0.2579803466796875, -0.23908233642578125, -0.220184326171875, -0.20128631591796875, -0.1823883056640625, -0.16349029541015625, -0.14459228515625, -0.12569427490234375, -0.1067962646484375, -0.08789825439453125, -0.069000244140625, -0.05010223388671875, -0.0312042236328125, -0.01230621337890625, 0.006591796875, 0.02548980712890625, 0.0443878173828125, 0.06328582763671875, 0.082183837890625, 0.10108184814453125, 0.1199798583984375, 0.13887786865234375, 0.15777587890625, 0.17667388916015625, 0.1955718994140625, 0.21446990966796875, 0.233367919921875, 0.25226593017578125, 0.2711639404296875, 0.29006195068359375, 0.3089599609375, 0.32785797119140625, 0.3467559814453125, 0.36565399169921875, 0.384552001953125, 0.40345001220703125, 0.4223480224609375, 0.44124603271484375, 0.46014404296875, 0.47904205322265625, 0.4979400634765625, 0.5168380737304688, 0.535736083984375, 0.5546340942382812, 0.5735321044921875, 0.5924301147460938, 0.611328125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 3.0, 4.0, 2.0, 11.0, 12.0, 11.0, 12.0, 10.0, 19.0, 26.0, 25.0, 33.0, 33.0, 37.0, 43.0, 43.0, 45.0, 34.0, 70.0, 40.0, 59.0, 44.0, 54.0, 47.0, 42.0, 41.0, 27.0, 36.0, 19.0, 23.0, 18.0, 9.0, 13.0, 15.0, 7.0, 8.0, 6.0, 4.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0], "bins": [-0.0004208087921142578, -0.00040893256664276123, -0.00039705634117126465, -0.00038518011569976807, -0.0003733038902282715, -0.0003614276647567749, -0.0003495514392852783, -0.00033767521381378174, -0.00032579898834228516, -0.0003139227628707886, -0.000302046537399292, -0.0002901703119277954, -0.00027829408645629883, -0.00026641786098480225, -0.00025454163551330566, -0.00024266541004180908, -0.0002307891845703125, -0.00021891295909881592, -0.00020703673362731934, -0.00019516050815582275, -0.00018328428268432617, -0.0001714080572128296, -0.000159531831741333, -0.00014765560626983643, -0.00013577938079833984, -0.00012390315532684326, -0.00011202692985534668, -0.0001001507043838501, -8.827447891235352e-05, -7.639825344085693e-05, -6.452202796936035e-05, -5.264580249786377e-05, -4.076957702636719e-05, -2.8893351554870605e-05, -1.7017126083374023e-05, -5.140900611877441e-06, 6.735324859619141e-06, 1.8611550331115723e-05, 3.0487775802612305e-05, 4.236400127410889e-05, 5.424022674560547e-05, 6.611645221710205e-05, 7.799267768859863e-05, 8.986890316009521e-05, 0.0001017451286315918, 0.00011362135410308838, 0.00012549757957458496, 0.00013737380504608154, 0.00014925003051757812, 0.0001611262559890747, 0.0001730024814605713, 0.00018487870693206787, 0.00019675493240356445, 0.00020863115787506104, 0.00022050738334655762, 0.0002323836088180542, 0.0002442598342895508, 0.00025613605976104736, 0.00026801228523254395, 0.00027988851070404053, 0.0002917647361755371, 0.0003036409616470337, 0.0003155171871185303, 0.00032739341259002686, 0.00033926963806152344]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 4.0, 7.0, 6.0, 6.0, 7.0, 9.0, 11.0, 14.0, 15.0, 21.0, 30.0, 33.0, 42.0, 52.0, 76.0, 91.0, 108.0, 212.0, 310.0, 559.0, 1446.0, 627563.0, 415057.0, 1296.0, 577.0, 299.0, 162.0, 119.0, 96.0, 68.0, 52.0, 48.0, 28.0, 27.0, 21.0, 16.0, 16.0, 18.0, 9.0, 8.0, 4.0, 6.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007129669189453125, -0.006883561611175537, -0.006637454032897949, -0.006391346454620361, -0.0061452388763427734, -0.0058991312980651855, -0.005653023719787598, -0.00540691614151001, -0.005160808563232422, -0.004914700984954834, -0.004668593406677246, -0.004422485828399658, -0.00417637825012207, -0.003930270671844482, -0.0036841630935668945, -0.0034380555152893066, -0.0031919479370117188, -0.002945840358734131, -0.002699732780456543, -0.002453625202178955, -0.002207517623901367, -0.0019614100456237793, -0.0017153024673461914, -0.0014691948890686035, -0.0012230873107910156, -0.0009769797325134277, -0.0007308721542358398, -0.00048476457595825195, -0.00023865699768066406, 7.450580596923828e-06, 0.0002535581588745117, 0.0004996657371520996, 0.0007457733154296875, 0.0009918808937072754, 0.0012379884719848633, 0.0014840960502624512, 0.001730203628540039, 0.001976311206817627, 0.002222418785095215, 0.0024685263633728027, 0.0027146339416503906, 0.0029607415199279785, 0.0032068490982055664, 0.0034529566764831543, 0.003699064254760742, 0.00394517183303833, 0.004191279411315918, 0.004437386989593506, 0.004683494567871094, 0.004929602146148682, 0.0051757097244262695, 0.005421817302703857, 0.005667924880981445, 0.005914032459259033, 0.006160140037536621, 0.006406247615814209, 0.006652355194091797, 0.006898462772369385, 0.007144570350646973, 0.0073906779289245605, 0.0076367855072021484, 0.007882893085479736, 0.008129000663757324, 0.008375108242034912, 0.0086212158203125]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 57.0, 706.0, 243.0, 8.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015413217479363084, -0.0014942148700356483, -0.0014471081085503101, -0.00140000123064965, -0.00135289435274899, -0.00130578747484833, -0.00125868059694767, -0.0012115738354623318, -0.0011644669575616717, -0.0011173600796610117, -0.0010702533181756735, -0.0010231464402750134, -0.0009760395623743534, -0.0009289326844736934, -0.0008818258647806942, -0.0008347190450876951, -0.0007876121671870351, -0.000740505289286375, -0.0006933984695933759, -0.0006462916499003768, -0.0005991847719997168, -0.0005520778940990567, -0.0005049710744060576, -0.000457864225609228, -0.00041075737681239843, -0.00036365052801556885, -0.00031654367921873927, -0.0002694368304219097, -0.0002223299816250801, -0.00017522313282825053, -0.00012811628403142095, -8.100943523459136e-05, -3.390270285308361e-05, 1.320414594374597e-05, 6.031099474057555e-05, 0.00010741784353740513, 0.00015452469233423471, 0.0002016315411310643, 0.0002487383899278939, 0.00029584523872472346, 0.00034295208752155304, 0.0003900589363183826, 0.0004371657851152122, 0.0004842726339120418, 0.0005313794827088714, 0.0005784863606095314, 0.0006255931803025305, 0.0006726999999955297, 0.0007198068778961897, 0.0007669137557968497, 0.0008140205754898489, 0.000861127395182848, 0.000908234273083508, 0.000955341150984168, 0.0010024479124695063, 0.0010495547903701663, 0.0010966616682708263, 0.0011437685461714864, 0.0011908754240721464, 0.0012379821855574846, 0.0012850890634581447, 0.0013321959413588047, 0.001379302702844143, 0.001426409580744803, 0.001473516458645463]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 3.0, 5.0, 7.0, 7.0, 11.0, 18.0, 23.0, 23.0, 23.0, 19.0, 35.0, 35.0, 43.0, 43.0, 32.0, 39.0, 42.0, 37.0, 50.0, 49.0, 28.0, 44.0, 42.0, 45.0, 37.0, 34.0, 36.0, 27.0, 27.0, 25.0, 18.0, 23.0, 17.0, 12.0, 9.0, 5.0, 4.0, 4.0, 5.0, 3.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002117156982421875, -0.00020445510745048523, -0.00019719451665878296, -0.0001899339258670807, -0.00018267333507537842, -0.00017541274428367615, -0.00016815215349197388, -0.0001608915627002716, -0.00015363097190856934, -0.00014637038111686707, -0.0001391097903251648, -0.00013184919953346252, -0.00012458860874176025, -0.00011732801795005798, -0.00011006742715835571, -0.00010280683636665344, -9.554624557495117e-05, -8.82856547832489e-05, -8.102506399154663e-05, -7.376447319984436e-05, -6.650388240814209e-05, -5.924329161643982e-05, -5.198270082473755e-05, -4.472211003303528e-05, -3.746151924133301e-05, -3.0200928449630737e-05, -2.2940337657928467e-05, -1.5679746866226196e-05, -8.419156074523926e-06, -1.1585652828216553e-06, 6.102025508880615e-06, 1.3362616300582886e-05, 2.0623207092285156e-05, 2.7883797883987427e-05, 3.51443886756897e-05, 4.240497946739197e-05, 4.966557025909424e-05, 5.692616105079651e-05, 6.418675184249878e-05, 7.144734263420105e-05, 7.870793342590332e-05, 8.596852421760559e-05, 9.322911500930786e-05, 0.00010048970580101013, 0.0001077502965927124, 0.00011501088738441467, 0.00012227147817611694, 0.00012953206896781921, 0.00013679265975952148, 0.00014405325055122375, 0.00015131384134292603, 0.0001585744321346283, 0.00016583502292633057, 0.00017309561371803284, 0.0001803562045097351, 0.00018761679530143738, 0.00019487738609313965, 0.00020213797688484192, 0.0002093985676765442, 0.00021665915846824646, 0.00022391974925994873, 0.000231180340051651, 0.00023844093084335327, 0.00024570152163505554, 0.0002529621124267578]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 7.0, 4.0, 3.0, 6.0, 9.0, 10.0, 14.0, 16.0, 17.0, 21.0, 26.0, 19.0, 36.0, 24.0, 33.0, 27.0, 35.0, 40.0, 39.0, 41.0, 38.0, 45.0, 38.0, 53.0, 26.0, 40.0, 29.0, 31.0, 36.0, 36.0, 26.0, 30.0, 22.0, 24.0, 22.0, 13.0, 14.0, 14.0, 12.0, 6.0, 6.0, 6.0, 1.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.98828125, -3.86309814453125, -3.7379150390625, -3.61273193359375, -3.487548828125, -3.36236572265625, -3.2371826171875, -3.11199951171875, -2.98681640625, -2.86163330078125, -2.7364501953125, -2.61126708984375, -2.486083984375, -2.36090087890625, -2.2357177734375, -2.11053466796875, -1.9853515625, -1.86016845703125, -1.7349853515625, -1.60980224609375, -1.484619140625, -1.35943603515625, -1.2342529296875, -1.10906982421875, -0.98388671875, -0.85870361328125, -0.7335205078125, -0.60833740234375, -0.483154296875, -0.35797119140625, -0.2327880859375, -0.10760498046875, 0.017578125, 0.14276123046875, 0.2679443359375, 0.39312744140625, 0.518310546875, 0.64349365234375, 0.7686767578125, 0.89385986328125, 1.01904296875, 1.14422607421875, 1.2694091796875, 1.39459228515625, 1.519775390625, 1.64495849609375, 1.7701416015625, 1.89532470703125, 2.0205078125, 2.14569091796875, 2.2708740234375, 2.39605712890625, 2.521240234375, 2.64642333984375, 2.7716064453125, 2.89678955078125, 3.02197265625, 3.14715576171875, 3.2723388671875, 3.39752197265625, 3.522705078125, 3.64788818359375, 3.7730712890625, 3.89825439453125, 4.0234375]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 4.0, 8.0, 7.0, 11.0, 9.0, 20.0, 24.0, 39.0, 44.0, 60.0, 91.0, 98.0, 151.0, 219.0, 269.0, 346.0, 485.0, 742.0, 1425.0, 4955.0, 28368.0, 311394.0, 638872.0, 48429.0, 7709.0, 1858.0, 820.0, 544.0, 404.0, 321.0, 221.0, 141.0, 113.0, 100.0, 65.0, 44.0, 37.0, 29.0, 25.0, 19.0, 9.0, 6.0, 2.0, 6.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.0546875, -9.7418212890625, -9.428955078125, -9.1160888671875, -8.80322265625, -8.4903564453125, -8.177490234375, -7.8646240234375, -7.5517578125, -7.2388916015625, -6.926025390625, -6.6131591796875, -6.30029296875, -5.9874267578125, -5.674560546875, -5.3616943359375, -5.048828125, -4.7359619140625, -4.423095703125, -4.1102294921875, -3.79736328125, -3.4844970703125, -3.171630859375, -2.8587646484375, -2.5458984375, -2.2330322265625, -1.920166015625, -1.6072998046875, -1.29443359375, -0.9815673828125, -0.668701171875, -0.3558349609375, -0.04296875, 0.2698974609375, 0.582763671875, 0.8956298828125, 1.20849609375, 1.5213623046875, 1.834228515625, 2.1470947265625, 2.4599609375, 2.7728271484375, 3.085693359375, 3.3985595703125, 3.71142578125, 4.0242919921875, 4.337158203125, 4.6500244140625, 4.962890625, 5.2757568359375, 5.588623046875, 5.9014892578125, 6.21435546875, 6.5272216796875, 6.840087890625, 7.1529541015625, 7.4658203125, 7.7786865234375, 8.091552734375, 8.4044189453125, 8.71728515625, 9.0301513671875, 9.343017578125, 9.6558837890625, 9.96875]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 2.0, 11.0, 5.0, 16.0, 16.0, 18.0, 20.0, 32.0, 23.0, 39.0, 30.0, 34.0, 39.0, 59.0, 56.0, 86.0, 180.0, 1621.0, 274.0, 94.0, 74.0, 39.0, 45.0, 39.0, 43.0, 26.0, 27.0, 20.0, 14.0, 13.0, 17.0, 7.0, 11.0, 11.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.5078125, -15.0604248046875, -14.613037109375, -14.1656494140625, -13.71826171875, -13.2708740234375, -12.823486328125, -12.3760986328125, -11.9287109375, -11.4813232421875, -11.033935546875, -10.5865478515625, -10.13916015625, -9.6917724609375, -9.244384765625, -8.7969970703125, -8.349609375, -7.9022216796875, -7.454833984375, -7.0074462890625, -6.56005859375, -6.1126708984375, -5.665283203125, -5.2178955078125, -4.7705078125, -4.3231201171875, -3.875732421875, -3.4283447265625, -2.98095703125, -2.5335693359375, -2.086181640625, -1.6387939453125, -1.19140625, -0.7440185546875, -0.296630859375, 0.1507568359375, 0.59814453125, 1.0455322265625, 1.492919921875, 1.9403076171875, 2.3876953125, 2.8350830078125, 3.282470703125, 3.7298583984375, 4.17724609375, 4.6246337890625, 5.072021484375, 5.5194091796875, 5.966796875, 6.4141845703125, 6.861572265625, 7.3089599609375, 7.75634765625, 8.2037353515625, 8.651123046875, 9.0985107421875, 9.5458984375, 9.9932861328125, 10.440673828125, 10.8880615234375, 11.33544921875, 11.7828369140625, 12.230224609375, 12.6776123046875, 13.125]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 6.0, 9.0, 13.0, 15.0, 10.0, 21.0, 16.0, 21.0, 40.0, 53.0, 49.0, 75.0, 111.0, 193.0, 307.0, 769.0, 3352.0, 1588569.0, 1546780.0, 3514.0, 732.0, 324.0, 209.0, 125.0, 85.0, 58.0, 52.0, 40.0, 25.0, 32.0, 17.0, 10.0, 22.0, 12.0, 11.0, 9.0, 9.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.4375, -33.28955078125, -32.1416015625, -30.99365234375, -29.845703125, -28.69775390625, -27.5498046875, -26.40185546875, -25.25390625, -24.10595703125, -22.9580078125, -21.81005859375, -20.662109375, -19.51416015625, -18.3662109375, -17.21826171875, -16.0703125, -14.92236328125, -13.7744140625, -12.62646484375, -11.478515625, -10.33056640625, -9.1826171875, -8.03466796875, -6.88671875, -5.73876953125, -4.5908203125, -3.44287109375, -2.294921875, -1.14697265625, 0.0009765625, 1.14892578125, 2.296875, 3.44482421875, 4.5927734375, 5.74072265625, 6.888671875, 8.03662109375, 9.1845703125, 10.33251953125, 11.48046875, 12.62841796875, 13.7763671875, 14.92431640625, 16.072265625, 17.22021484375, 18.3681640625, 19.51611328125, 20.6640625, 21.81201171875, 22.9599609375, 24.10791015625, 25.255859375, 26.40380859375, 27.5517578125, 28.69970703125, 29.84765625, 30.99560546875, 32.1435546875, 33.29150390625, 34.439453125, 35.58740234375, 36.7353515625, 37.88330078125, 39.03125]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 9.0, 46.0, 157.0, 291.0, 281.0, 162.0, 50.0, 13.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.175193786621094, -38.2205810546875, -37.26596450805664, -36.31134796142578, -35.35673522949219, -34.402122497558594, -33.447505950927734, -32.492889404296875, -31.53827667236328, -30.583662033081055, -29.629047393798828, -28.6744327545166, -27.719818115234375, -26.76520347595215, -25.810588836669922, -24.855974197387695, -23.90135955810547, -22.946744918823242, -21.992130279541016, -21.03751564025879, -20.082901000976562, -19.128286361694336, -18.17367172241211, -17.219057083129883, -16.264442443847656, -15.30982780456543, -14.355213165283203, -13.400598526000977, -12.44598388671875, -11.491369247436523, -10.536754608154297, -9.58213996887207, -8.627527236938477, -7.67291259765625, -6.718297958374023, -5.763683319091797, -4.80906867980957, -3.8544540405273438, -2.899839401245117, -1.9452247619628906, -0.9906101226806641, -0.0359954833984375, 0.9186191558837891, 1.8732337951660156, 2.827848434448242, 3.7824630737304688, 4.737077713012695, 5.691692352294922, 6.646306991577148, 7.600921630859375, 8.555536270141602, 9.510150909423828, 10.464765548706055, 11.419380187988281, 12.373994827270508, 13.328609466552734, 14.283224105834961, 15.237838745117188, 16.192453384399414, 17.14706802368164, 18.101682662963867, 19.056297302246094, 20.01091194152832, 20.965526580810547, 21.920141220092773]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 1.0, 6.0, 7.0, 4.0, 6.0, 8.0, 15.0, 11.0, 13.0, 14.0, 12.0, 26.0, 15.0, 19.0, 29.0, 26.0, 34.0, 29.0, 38.0, 37.0, 45.0, 34.0, 47.0, 32.0, 40.0, 48.0, 39.0, 34.0, 36.0, 33.0, 35.0, 23.0, 37.0, 17.0, 24.0, 24.0, 14.0, 17.0, 13.0, 15.0, 19.0, 3.0, 4.0, 3.0, 5.0, 5.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-26.897613525390625, -25.985258102416992, -25.07290267944336, -24.16054916381836, -23.248193740844727, -22.335838317871094, -21.42348289489746, -20.511127471923828, -19.598772048950195, -18.686416625976562, -17.77406120300293, -16.861705780029297, -15.94935131072998, -15.036996841430664, -14.124641418457031, -13.212285995483398, -12.299931526184082, -11.38757610321045, -10.475221633911133, -9.5628662109375, -8.650510787963867, -7.738155841827393, -6.825800895690918, -5.913445472717285, -5.0010905265808105, -4.088735580444336, -3.176380157470703, -2.2640252113342285, -1.3516700267791748, -0.4393148422241211, 0.4730401039123535, 1.3853955268859863, 2.297750473022461, 3.2101056575775146, 4.122460842132568, 5.034815788269043, 5.947171211242676, 6.85952615737915, 7.771881103515625, 8.684236526489258, 9.59659194946289, 10.508947372436523, 11.42130184173584, 12.333657264709473, 13.246012687683105, 14.158367156982422, 15.070722579956055, 15.983078002929688, 16.895431518554688, 17.80778694152832, 18.720142364501953, 19.632495880126953, 20.544851303100586, 21.45720672607422, 22.36956214904785, 23.281917572021484, 24.194272994995117, 25.10662841796875, 26.018983840942383, 26.931339263916016, 27.843692779541016, 28.75604820251465, 29.66840362548828, 30.580759048461914, 31.493114471435547]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 2.0, 10.0, 8.0, 10.0, 11.0, 6.0, 8.0, 26.0, 13.0, 17.0, 24.0, 28.0, 37.0, 31.0, 33.0, 35.0, 40.0, 36.0, 46.0, 43.0, 47.0, 44.0, 48.0, 43.0, 32.0, 40.0, 26.0, 27.0, 35.0, 26.0, 25.0, 29.0, 19.0, 14.0, 17.0, 8.0, 15.0, 12.0, 10.0, 8.0, 7.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.1328125, -3.9979248046875, -3.863037109375, -3.7281494140625, -3.59326171875, -3.4583740234375, -3.323486328125, -3.1885986328125, -3.0537109375, -2.9188232421875, -2.783935546875, -2.6490478515625, -2.51416015625, -2.3792724609375, -2.244384765625, -2.1094970703125, -1.974609375, -1.8397216796875, -1.704833984375, -1.5699462890625, -1.43505859375, -1.3001708984375, -1.165283203125, -1.0303955078125, -0.8955078125, -0.7606201171875, -0.625732421875, -0.4908447265625, -0.35595703125, -0.2210693359375, -0.086181640625, 0.0487060546875, 0.18359375, 0.3184814453125, 0.453369140625, 0.5882568359375, 0.72314453125, 0.8580322265625, 0.992919921875, 1.1278076171875, 1.2626953125, 1.3975830078125, 1.532470703125, 1.6673583984375, 1.80224609375, 1.9371337890625, 2.072021484375, 2.2069091796875, 2.341796875, 2.4766845703125, 2.611572265625, 2.7464599609375, 2.88134765625, 3.0162353515625, 3.151123046875, 3.2860107421875, 3.4208984375, 3.5557861328125, 3.690673828125, 3.8255615234375, 3.96044921875, 4.0953369140625, 4.230224609375, 4.3651123046875, 4.5]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 7.0, 11.0, 12.0, 14.0, 23.0, 29.0, 28.0, 35.0, 56.0, 68.0, 87.0, 104.0, 166.0, 212.0, 311.0, 498.0, 1098.0, 5178.0, 79619.0, 1155950.0, 2472550.0, 449604.0, 23942.0, 2449.0, 768.0, 430.0, 261.0, 186.0, 143.0, 86.0, 78.0, 58.0, 62.0, 29.0, 32.0, 24.0, 20.0, 15.0, 9.0, 8.0, 4.0, 3.0, 7.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.171875, -7.9107666015625, -7.649658203125, -7.3885498046875, -7.12744140625, -6.8663330078125, -6.605224609375, -6.3441162109375, -6.0830078125, -5.8218994140625, -5.560791015625, -5.2996826171875, -5.03857421875, -4.7774658203125, -4.516357421875, -4.2552490234375, -3.994140625, -3.7330322265625, -3.471923828125, -3.2108154296875, -2.94970703125, -2.6885986328125, -2.427490234375, -2.1663818359375, -1.9052734375, -1.6441650390625, -1.383056640625, -1.1219482421875, -0.86083984375, -0.5997314453125, -0.338623046875, -0.0775146484375, 0.18359375, 0.4447021484375, 0.705810546875, 0.9669189453125, 1.22802734375, 1.4891357421875, 1.750244140625, 2.0113525390625, 2.2724609375, 2.5335693359375, 2.794677734375, 3.0557861328125, 3.31689453125, 3.5780029296875, 3.839111328125, 4.1002197265625, 4.361328125, 4.6224365234375, 4.883544921875, 5.1446533203125, 5.40576171875, 5.6668701171875, 5.927978515625, 6.1890869140625, 6.4501953125, 6.7113037109375, 6.972412109375, 7.2335205078125, 7.49462890625, 7.7557373046875, 8.016845703125, 8.2779541015625, 8.5390625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 0.0, 4.0, 7.0, 5.0, 6.0, 12.0, 12.0, 30.0, 35.0, 47.0, 57.0, 80.0, 111.0, 148.0, 217.0, 273.0, 351.0, 418.0, 436.0, 387.0, 399.0, 281.0, 202.0, 153.0, 106.0, 75.0, 45.0, 48.0, 31.0, 26.0, 22.0, 10.0, 7.0, 5.0, 7.0, 2.0, 5.0, 4.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.2890625, -6.1016845703125, -5.914306640625, -5.7269287109375, -5.53955078125, -5.3521728515625, -5.164794921875, -4.9774169921875, -4.7900390625, -4.6026611328125, -4.415283203125, -4.2279052734375, -4.04052734375, -3.8531494140625, -3.665771484375, -3.4783935546875, -3.291015625, -3.1036376953125, -2.916259765625, -2.7288818359375, -2.54150390625, -2.3541259765625, -2.166748046875, -1.9793701171875, -1.7919921875, -1.6046142578125, -1.417236328125, -1.2298583984375, -1.04248046875, -0.8551025390625, -0.667724609375, -0.4803466796875, -0.29296875, -0.1055908203125, 0.081787109375, 0.2691650390625, 0.45654296875, 0.6439208984375, 0.831298828125, 1.0186767578125, 1.2060546875, 1.3934326171875, 1.580810546875, 1.7681884765625, 1.95556640625, 2.1429443359375, 2.330322265625, 2.5177001953125, 2.705078125, 2.8924560546875, 3.079833984375, 3.2672119140625, 3.45458984375, 3.6419677734375, 3.829345703125, 4.0167236328125, 4.2041015625, 4.3914794921875, 4.578857421875, 4.7662353515625, 4.95361328125, 5.1409912109375, 5.328369140625, 5.5157470703125, 5.703125]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 6.0, 6.0, 6.0, 7.0, 7.0, 11.0, 15.0, 20.0, 36.0, 44.0, 64.0, 84.0, 109.0, 175.0, 284.0, 469.0, 784.0, 1983.0, 9690.0, 201338.0, 3544626.0, 414776.0, 14974.0, 2391.0, 880.0, 474.0, 325.0, 190.0, 141.0, 95.0, 83.0, 45.0, 33.0, 30.0, 29.0, 12.0, 10.0, 7.0, 11.0, 4.0, 7.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-14.8046875, -14.3360595703125, -13.867431640625, -13.3988037109375, -12.93017578125, -12.4615478515625, -11.992919921875, -11.5242919921875, -11.0556640625, -10.5870361328125, -10.118408203125, -9.6497802734375, -9.18115234375, -8.7125244140625, -8.243896484375, -7.7752685546875, -7.306640625, -6.8380126953125, -6.369384765625, -5.9007568359375, -5.43212890625, -4.9635009765625, -4.494873046875, -4.0262451171875, -3.5576171875, -3.0889892578125, -2.620361328125, -2.1517333984375, -1.68310546875, -1.2144775390625, -0.745849609375, -0.2772216796875, 0.19140625, 0.6600341796875, 1.128662109375, 1.5972900390625, 2.06591796875, 2.5345458984375, 3.003173828125, 3.4718017578125, 3.9404296875, 4.4090576171875, 4.877685546875, 5.3463134765625, 5.81494140625, 6.2835693359375, 6.752197265625, 7.2208251953125, 7.689453125, 8.1580810546875, 8.626708984375, 9.0953369140625, 9.56396484375, 10.0325927734375, 10.501220703125, 10.9698486328125, 11.4384765625, 11.9071044921875, 12.375732421875, 12.8443603515625, 13.31298828125, 13.7816162109375, 14.250244140625, 14.7188720703125, 15.1875]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 298.0, 716.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-725.9168701171875, -710.8220825195312, -695.727294921875, -680.6325073242188, -665.5377197265625, -650.4429321289062, -635.34814453125, -620.2533569335938, -605.1585693359375, -590.0637817382812, -574.968994140625, -559.8742065429688, -544.7794189453125, -529.6846313476562, -514.58984375, -499.49505615234375, -484.4002380371094, -469.3054504394531, -454.2106628417969, -439.1158752441406, -424.0210876464844, -408.9263000488281, -393.83148193359375, -378.7366943359375, -363.64190673828125, -348.547119140625, -333.45233154296875, -318.3575439453125, -303.26275634765625, -288.16796875, -273.07318115234375, -257.9783935546875, -242.88357543945312, -227.78878784179688, -212.69400024414062, -197.59921264648438, -182.50442504882812, -167.40963745117188, -152.31483459472656, -137.2200469970703, -122.12525939941406, -107.03047180175781, -91.93568420410156, -76.84088897705078, -61.74610137939453, -46.65131378173828, -31.5565185546875, -16.46173095703125, -1.366943359375, 13.727846145629883, 28.822635650634766, 43.91742706298828, 59.01221466064453, 74.10700225830078, 89.20179748535156, 104.29658508300781, 119.39137268066406, 134.4861602783203, 149.58094787597656, 164.67575073242188, 179.77053833007812, 194.86532592773438, 209.96011352539062, 225.05490112304688, 240.14968872070312]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 9.0, 7.0, 17.0, 11.0, 18.0, 26.0, 29.0, 23.0, 42.0, 37.0, 36.0, 48.0, 56.0, 65.0, 68.0, 62.0, 46.0, 55.0, 56.0, 49.0, 46.0, 34.0, 36.0, 34.0, 26.0, 21.0, 16.0, 13.0, 7.0, 12.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.70359992980957, -19.747283935546875, -18.790969848632812, -17.834653854370117, -16.878337860107422, -15.922021865844727, -14.965706825256348, -14.009391784667969, -13.053075790405273, -12.096759796142578, -11.1404447555542, -10.18412971496582, -9.227813720703125, -8.27149772644043, -7.315182685852051, -6.358867168426514, -5.402551651000977, -4.4462361335754395, -3.4899206161499023, -2.5336050987243652, -1.5772895812988281, -0.620974063873291, 0.3353414535522461, 1.2916569709777832, 2.2479724884033203, 3.2042880058288574, 4.1606035232543945, 5.116919040679932, 6.073234558105469, 7.029550075531006, 7.985865592956543, 8.942180633544922, 9.89849853515625, 10.854814529418945, 11.811129570007324, 12.767444610595703, 13.723760604858398, 14.680076599121094, 15.636391639709473, 16.59270668029785, 17.549022674560547, 18.505338668823242, 19.461654663085938, 20.41796875, 21.374284744262695, 22.33060073852539, 23.286914825439453, 24.24323081970215, 25.199546813964844, 26.15586280822754, 27.112178802490234, 28.068492889404297, 29.024808883666992, 29.981124877929688, 30.93743896484375, 31.893754959106445, 32.85007095336914, 33.8063850402832, 34.76270294189453, 35.719017028808594, 36.675331115722656, 37.631649017333984, 38.58796310424805, 39.544281005859375, 40.50059509277344]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 4.0, 2.0, 8.0, 13.0, 13.0, 14.0, 12.0, 17.0, 20.0, 18.0, 20.0, 29.0, 34.0, 47.0, 35.0, 31.0, 39.0, 36.0, 46.0, 40.0, 38.0, 50.0, 54.0, 42.0, 37.0, 30.0, 44.0, 35.0, 23.0, 29.0, 23.0, 21.0, 15.0, 15.0, 14.0, 13.0, 10.0, 6.0, 11.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.94921875, -3.8138427734375, -3.678466796875, -3.5430908203125, -3.40771484375, -3.2723388671875, -3.136962890625, -3.0015869140625, -2.8662109375, -2.7308349609375, -2.595458984375, -2.4600830078125, -2.32470703125, -2.1893310546875, -2.053955078125, -1.9185791015625, -1.783203125, -1.6478271484375, -1.512451171875, -1.3770751953125, -1.24169921875, -1.1063232421875, -0.970947265625, -0.8355712890625, -0.7001953125, -0.5648193359375, -0.429443359375, -0.2940673828125, -0.15869140625, -0.0233154296875, 0.112060546875, 0.2474365234375, 0.3828125, 0.5181884765625, 0.653564453125, 0.7889404296875, 0.92431640625, 1.0596923828125, 1.195068359375, 1.3304443359375, 1.4658203125, 1.6011962890625, 1.736572265625, 1.8719482421875, 2.00732421875, 2.1427001953125, 2.278076171875, 2.4134521484375, 2.548828125, 2.6842041015625, 2.819580078125, 2.9549560546875, 3.09033203125, 3.2257080078125, 3.361083984375, 3.4964599609375, 3.6318359375, 3.7672119140625, 3.902587890625, 4.0379638671875, 4.17333984375, 4.3087158203125, 4.444091796875, 4.5794677734375, 4.71484375]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 6.0, 4.0, 12.0, 8.0, 18.0, 26.0, 35.0, 57.0, 79.0, 114.0, 187.0, 290.0, 414.0, 590.0, 915.0, 1372.0, 2047.0, 3087.0, 4781.0, 7158.0, 11249.0, 17985.0, 29475.0, 49940.0, 89441.0, 179743.0, 298882.0, 154125.0, 79053.0, 44694.0, 26497.0, 16564.0, 10206.0, 6581.0, 4342.0, 2820.0, 1944.0, 1249.0, 832.0, 593.0, 375.0, 227.0, 180.0, 120.0, 75.0, 49.0, 39.0, 29.0, 19.0, 11.0, 9.0, 7.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.82958984375, -0.8054733276367188, -0.7813568115234375, -0.7572402954101562, -0.733123779296875, -0.7090072631835938, -0.6848907470703125, -0.6607742309570312, -0.63665771484375, -0.6125411987304688, -0.5884246826171875, -0.5643081665039062, -0.540191650390625, -0.5160751342773438, -0.4919586181640625, -0.46784210205078125, -0.4437255859375, -0.41960906982421875, -0.3954925537109375, -0.37137603759765625, -0.347259521484375, -0.32314300537109375, -0.2990264892578125, -0.27490997314453125, -0.25079345703125, -0.22667694091796875, -0.2025604248046875, -0.17844390869140625, -0.154327392578125, -0.13021087646484375, -0.1060943603515625, -0.08197784423828125, -0.057861328125, -0.03374481201171875, -0.0096282958984375, 0.01448822021484375, 0.038604736328125, 0.06272125244140625, 0.0868377685546875, 0.11095428466796875, 0.13507080078125, 0.15918731689453125, 0.1833038330078125, 0.20742034912109375, 0.231536865234375, 0.25565338134765625, 0.2797698974609375, 0.30388641357421875, 0.3280029296875, 0.35211944580078125, 0.3762359619140625, 0.40035247802734375, 0.424468994140625, 0.44858551025390625, 0.4727020263671875, 0.49681854248046875, 0.52093505859375, 0.5450515747070312, 0.5691680908203125, 0.5932846069335938, 0.617401123046875, 0.6415176391601562, 0.6656341552734375, 0.6897506713867188, 0.7138671875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 5.0, 2.0, 3.0, 3.0, 6.0, 6.0, 4.0, 6.0, 4.0, 13.0, 12.0, 14.0, 14.0, 6.0, 19.0, 14.0, 18.0, 32.0, 31.0, 28.0, 29.0, 44.0, 41.0, 28.0, 35.0, 41.0, 36.0, 1060.0, 51.0, 43.0, 38.0, 36.0, 34.0, 35.0, 37.0, 25.0, 32.0, 22.0, 14.0, 13.0, 15.0, 13.0, 13.0, 11.0, 17.0, 7.0, 7.0, 8.0, 6.0, 4.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.455078125, -2.374176025390625, -2.29327392578125, -2.212371826171875, -2.1314697265625, -2.050567626953125, -1.96966552734375, -1.888763427734375, -1.807861328125, -1.726959228515625, -1.64605712890625, -1.565155029296875, -1.4842529296875, -1.403350830078125, -1.32244873046875, -1.241546630859375, -1.16064453125, -1.079742431640625, -0.99884033203125, -0.917938232421875, -0.8370361328125, -0.756134033203125, -0.67523193359375, -0.594329833984375, -0.513427734375, -0.432525634765625, -0.35162353515625, -0.270721435546875, -0.1898193359375, -0.108917236328125, -0.02801513671875, 0.052886962890625, 0.1337890625, 0.214691162109375, 0.29559326171875, 0.376495361328125, 0.4573974609375, 0.538299560546875, 0.61920166015625, 0.700103759765625, 0.781005859375, 0.861907958984375, 0.94281005859375, 1.023712158203125, 1.1046142578125, 1.185516357421875, 1.26641845703125, 1.347320556640625, 1.42822265625, 1.509124755859375, 1.59002685546875, 1.670928955078125, 1.7518310546875, 1.832733154296875, 1.91363525390625, 1.994537353515625, 2.075439453125, 2.156341552734375, 2.23724365234375, 2.318145751953125, 2.3990478515625, 2.479949951171875, 2.56085205078125, 2.641754150390625, 2.72265625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 8.0, 6.0, 13.0, 16.0, 32.0, 45.0, 56.0, 91.0, 125.0, 195.0, 281.0, 416.0, 547.0, 822.0, 1167.0, 1771.0, 2484.0, 3607.0, 5179.0, 7815.0, 11739.0, 18111.0, 28713.0, 47456.0, 83202.0, 159637.0, 1352769.0, 158230.0, 82793.0, 46882.0, 28580.0, 18002.0, 11600.0, 7689.0, 5158.0, 3730.0, 2492.0, 1848.0, 1242.0, 805.0, 566.0, 424.0, 255.0, 196.0, 119.0, 69.0, 54.0, 48.0, 18.0, 11.0, 10.0, 6.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.68701171875, -0.6644821166992188, -0.6419525146484375, -0.6194229125976562, -0.596893310546875, -0.5743637084960938, -0.5518341064453125, -0.5293045043945312, -0.50677490234375, -0.48424530029296875, -0.4617156982421875, -0.43918609619140625, -0.416656494140625, -0.39412689208984375, -0.3715972900390625, -0.34906768798828125, -0.3265380859375, -0.30400848388671875, -0.2814788818359375, -0.25894927978515625, -0.236419677734375, -0.21389007568359375, -0.1913604736328125, -0.16883087158203125, -0.14630126953125, -0.12377166748046875, -0.1012420654296875, -0.07871246337890625, -0.056182861328125, -0.03365325927734375, -0.0111236572265625, 0.01140594482421875, 0.033935546875, 0.05646514892578125, 0.0789947509765625, 0.10152435302734375, 0.124053955078125, 0.14658355712890625, 0.1691131591796875, 0.19164276123046875, 0.21417236328125, 0.23670196533203125, 0.2592315673828125, 0.28176116943359375, 0.304290771484375, 0.32682037353515625, 0.3493499755859375, 0.37187957763671875, 0.3944091796875, 0.41693878173828125, 0.4394683837890625, 0.46199798583984375, 0.484527587890625, 0.5070571899414062, 0.5295867919921875, 0.5521163940429688, 0.57464599609375, 0.5971755981445312, 0.6197052001953125, 0.6422348022460938, 0.664764404296875, 0.6872940063476562, 0.7098236083984375, 0.7323532104492188, 0.7548828125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 7.0, 12.0, 10.0, 9.0, 10.0, 12.0, 15.0, 18.0, 16.0, 31.0, 22.0, 32.0, 29.0, 33.0, 46.0, 44.0, 52.0, 48.0, 52.0, 54.0, 52.0, 39.0, 49.0, 38.0, 35.0, 35.0, 35.0, 18.0, 26.0, 25.0, 11.0, 17.0, 7.0, 17.0, 4.0, 6.0, 9.0, 7.0, 6.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.00043773651123046875, -0.0004251226782798767, -0.00041250884532928467, -0.0003998950123786926, -0.0003872811794281006, -0.00037466734647750854, -0.0003620535135269165, -0.00034943968057632446, -0.0003368258476257324, -0.0003242120146751404, -0.00031159818172454834, -0.0002989843487739563, -0.00028637051582336426, -0.0002737566828727722, -0.0002611428499221802, -0.00024852901697158813, -0.0002359151840209961, -0.00022330135107040405, -0.000210687518119812, -0.00019807368516921997, -0.00018545985221862793, -0.0001728460192680359, -0.00016023218631744385, -0.0001476183533668518, -0.00013500452041625977, -0.00012239068746566772, -0.00010977685451507568, -9.716302156448364e-05, -8.45491886138916e-05, -7.193535566329956e-05, -5.932152271270752e-05, -4.670768976211548e-05, -3.409385681152344e-05, -2.1480023860931396e-05, -8.866190910339355e-06, 3.7476420402526855e-06, 1.6361474990844727e-05, 2.8975307941436768e-05, 4.158914089202881e-05, 5.420297384262085e-05, 6.681680679321289e-05, 7.943063974380493e-05, 9.204447269439697e-05, 0.00010465830564498901, 0.00011727213859558105, 0.0001298859715461731, 0.00014249980449676514, 0.00015511363744735718, 0.00016772747039794922, 0.00018034130334854126, 0.0001929551362991333, 0.00020556896924972534, 0.00021818280220031738, 0.00023079663515090942, 0.00024341046810150146, 0.0002560243010520935, 0.00026863813400268555, 0.0002812519669532776, 0.00029386579990386963, 0.00030647963285446167, 0.0003190934658050537, 0.00033170729875564575, 0.0003443211317062378, 0.00035693496465682983, 0.0003695487976074219]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 3.0, 8.0, 12.0, 14.0, 8.0, 8.0, 23.0, 23.0, 27.0, 27.0, 36.0, 39.0, 55.0, 73.0, 84.0, 131.0, 179.0, 228.0, 418.0, 700.0, 2545.0, 970600.0, 70479.0, 1149.0, 527.0, 342.0, 193.0, 138.0, 94.0, 71.0, 60.0, 48.0, 36.0, 40.0, 25.0, 29.0, 17.0, 21.0, 9.0, 4.0, 10.0, 5.0, 4.0, 3.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.007114410400390625, -0.006867110729217529, -0.006619811058044434, -0.006372511386871338, -0.006125211715698242, -0.0058779120445251465, -0.005630612373352051, -0.005383312702178955, -0.005136013031005859, -0.004888713359832764, -0.004641413688659668, -0.004394114017486572, -0.0041468143463134766, -0.003899514675140381, -0.003652215003967285, -0.0034049153327941895, -0.0031576156616210938, -0.002910315990447998, -0.0026630163192749023, -0.0024157166481018066, -0.002168416976928711, -0.0019211173057556152, -0.0016738176345825195, -0.0014265179634094238, -0.0011792182922363281, -0.0009319186210632324, -0.0006846189498901367, -0.000437319278717041, -0.0001900196075439453, 5.728006362915039e-05, 0.0003045797348022461, 0.0005518794059753418, 0.0007991790771484375, 0.0010464787483215332, 0.001293778419494629, 0.0015410780906677246, 0.0017883777618408203, 0.002035677433013916, 0.0022829771041870117, 0.0025302767753601074, 0.002777576446533203, 0.003024876117706299, 0.0032721757888793945, 0.0035194754600524902, 0.003766775131225586, 0.004014074802398682, 0.004261374473571777, 0.004508674144744873, 0.004755973815917969, 0.0050032734870910645, 0.00525057315826416, 0.005497872829437256, 0.0057451725006103516, 0.005992472171783447, 0.006239771842956543, 0.006487071514129639, 0.006734371185302734, 0.00698167085647583, 0.007228970527648926, 0.0074762701988220215, 0.007723569869995117, 0.007970869541168213, 0.008218169212341309, 0.008465468883514404, 0.0087127685546875]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 31.0, 435.0, 511.0, 37.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.002659361809492111, -0.002613550052046776, -0.002567738527432084, -0.0025219267699867487, -0.002476115245372057, -0.0024303034879267216, -0.00238449196331203, -0.0023386802058666945, -0.0022928686812520027, -0.0022470569238066673, -0.0022012453991919756, -0.00215543364174664, -0.0021096221171319485, -0.002063810359686613, -0.0020179988350719213, -0.001972187077626586, -0.0019263753201812506, -0.001880563679151237, -0.0018347520381212234, -0.0017889403970912099, -0.0017431287560611963, -0.001697316998615861, -0.0016515054740011692, -0.0016056937165558338, -0.001559882191941142, -0.0015140705509111285, -0.001468258909881115, -0.0014224472688511014, -0.0013766356278210878, -0.0013308238703757524, -0.0012850123457610607, -0.0012392005883157253, -0.00119338883087039, -0.0011475771898403764, -0.0011017655488103628, -0.0010559539077803493, -0.0010101422667503357, -0.0009643305675126612, -0.0009185189264826477, -0.0008727072272449732, -0.0008268957026302814, -0.0007810840616002679, -0.0007352724205702543, -0.0006894607795402408, -0.0006436490803025663, -0.0005978374392725527, -0.0005520257982425392, -0.0005062140990048647, -0.00046040245797485113, -0.00041459081694483757, -0.00036877914681099355, -0.00032296750578098, -0.000277155835647136, -0.0002313441946171224, -0.00018553255358710885, -0.00013972088345326483, -9.390924242325127e-05, -4.809759047930129e-05, -2.285938535351306e-06, 4.352570977061987e-05, 8.933736535254866e-05, 0.00013514902093447745, 0.000180960661964491, 0.00022677233209833503, 0.0002725839731283486]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 6.0, 8.0, 5.0, 11.0, 7.0, 5.0, 17.0, 22.0, 16.0, 25.0, 16.0, 23.0, 24.0, 37.0, 33.0, 33.0, 41.0, 61.0, 36.0, 37.0, 51.0, 38.0, 50.0, 54.0, 48.0, 34.0, 32.0, 28.0, 35.0, 31.0, 23.0, 15.0, 22.0, 15.0, 14.0, 9.0, 7.0, 7.0, 9.0, 7.0, 5.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022673606872558594, -0.00021886080503463745, -0.00021098554134368896, -0.00020311027765274048, -0.000195235013961792, -0.0001873597502708435, -0.00017948448657989502, -0.00017160922288894653, -0.00016373395919799805, -0.00015585869550704956, -0.00014798343181610107, -0.0001401081681251526, -0.0001322329044342041, -0.00012435764074325562, -0.00011648237705230713, -0.00010860711336135864, -0.00010073184967041016, -9.285658597946167e-05, -8.498132228851318e-05, -7.71060585975647e-05, -6.923079490661621e-05, -6.135553121566772e-05, -5.348026752471924e-05, -4.560500383377075e-05, -3.7729740142822266e-05, -2.985447645187378e-05, -2.1979212760925293e-05, -1.4103949069976807e-05, -6.22868537902832e-06, 1.646578311920166e-06, 9.521842002868652e-06, 1.739710569381714e-05, 2.5272369384765625e-05, 3.314763307571411e-05, 4.10228967666626e-05, 4.8898160457611084e-05, 5.677342414855957e-05, 6.464868783950806e-05, 7.252395153045654e-05, 8.039921522140503e-05, 8.827447891235352e-05, 9.6149742603302e-05, 0.00010402500629425049, 0.00011190026998519897, 0.00011977553367614746, 0.00012765079736709595, 0.00013552606105804443, 0.00014340132474899292, 0.0001512765884399414, 0.0001591518521308899, 0.00016702711582183838, 0.00017490237951278687, 0.00018277764320373535, 0.00019065290689468384, 0.00019852817058563232, 0.0002064034342765808, 0.0002142786979675293, 0.00022215396165847778, 0.00023002922534942627, 0.00023790448904037476, 0.00024577975273132324, 0.00025365501642227173, 0.0002615302801132202, 0.0002694055438041687, 0.0002772808074951172]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 4.0, 2.0, 8.0, 13.0, 13.0, 14.0, 12.0, 17.0, 20.0, 18.0, 20.0, 29.0, 34.0, 47.0, 35.0, 31.0, 39.0, 36.0, 46.0, 40.0, 38.0, 50.0, 54.0, 42.0, 37.0, 30.0, 43.0, 36.0, 23.0, 29.0, 23.0, 21.0, 15.0, 15.0, 14.0, 13.0, 10.0, 6.0, 11.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.94921875, -3.8138427734375, -3.678466796875, -3.5430908203125, -3.40771484375, -3.2723388671875, -3.136962890625, -3.0015869140625, -2.8662109375, -2.7308349609375, -2.595458984375, -2.4600830078125, -2.32470703125, -2.1893310546875, -2.053955078125, -1.9185791015625, -1.783203125, -1.6478271484375, -1.512451171875, -1.3770751953125, -1.24169921875, -1.1063232421875, -0.970947265625, -0.8355712890625, -0.7001953125, -0.5648193359375, -0.429443359375, -0.2940673828125, -0.15869140625, -0.0233154296875, 0.112060546875, 0.2474365234375, 0.3828125, 0.5181884765625, 0.653564453125, 0.7889404296875, 0.92431640625, 1.0596923828125, 1.195068359375, 1.3304443359375, 1.4658203125, 1.6011962890625, 1.736572265625, 1.8719482421875, 2.00732421875, 2.1427001953125, 2.278076171875, 2.4134521484375, 2.548828125, 2.6842041015625, 2.819580078125, 2.9549560546875, 3.09033203125, 3.2257080078125, 3.361083984375, 3.4964599609375, 3.6318359375, 3.7672119140625, 3.902587890625, 4.0379638671875, 4.17333984375, 4.3087158203125, 4.444091796875, 4.5794677734375, 4.71484375]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 12.0, 15.0, 10.0, 15.0, 23.0, 48.0, 40.0, 57.0, 75.0, 99.0, 120.0, 169.0, 290.0, 421.0, 893.0, 1683.0, 3709.0, 9712.0, 28017.0, 83446.0, 264314.0, 415483.0, 159047.0, 51508.0, 17206.0, 6406.0, 2625.0, 1260.0, 609.0, 389.0, 225.0, 174.0, 103.0, 91.0, 60.0, 52.0, 40.0, 27.0, 29.0, 14.0, 8.0, 9.0, 5.0, 6.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6484375, -4.48406982421875, -4.3197021484375, -4.15533447265625, -3.990966796875, -3.82659912109375, -3.6622314453125, -3.49786376953125, -3.33349609375, -3.16912841796875, -3.0047607421875, -2.84039306640625, -2.676025390625, -2.51165771484375, -2.3472900390625, -2.18292236328125, -2.0185546875, -1.85418701171875, -1.6898193359375, -1.52545166015625, -1.361083984375, -1.19671630859375, -1.0323486328125, -0.86798095703125, -0.70361328125, -0.53924560546875, -0.3748779296875, -0.21051025390625, -0.046142578125, 0.11822509765625, 0.2825927734375, 0.44696044921875, 0.611328125, 0.77569580078125, 0.9400634765625, 1.10443115234375, 1.268798828125, 1.43316650390625, 1.5975341796875, 1.76190185546875, 1.92626953125, 2.09063720703125, 2.2550048828125, 2.41937255859375, 2.583740234375, 2.74810791015625, 2.9124755859375, 3.07684326171875, 3.2412109375, 3.40557861328125, 3.5699462890625, 3.73431396484375, 3.898681640625, 4.06304931640625, 4.2274169921875, 4.39178466796875, 4.55615234375, 4.72052001953125, 4.8848876953125, 5.04925537109375, 5.213623046875, 5.37799072265625, 5.5423583984375, 5.70672607421875, 5.87109375]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 7.0, 9.0, 6.0, 6.0, 16.0, 23.0, 13.0, 20.0, 15.0, 26.0, 30.0, 31.0, 35.0, 30.0, 41.0, 43.0, 71.0, 105.0, 254.0, 1463.0, 230.0, 125.0, 82.0, 55.0, 45.0, 29.0, 32.0, 24.0, 32.0, 28.0, 22.0, 19.0, 19.0, 7.0, 6.0, 9.0, 7.0, 3.0, 6.0, 5.0, 8.0, 2.0, 2.0, 2.0, 6.0, 1.0, 1.0, 2.0], "bins": [-13.9453125, -13.552490234375, -13.15966796875, -12.766845703125, -12.3740234375, -11.981201171875, -11.58837890625, -11.195556640625, -10.802734375, -10.409912109375, -10.01708984375, -9.624267578125, -9.2314453125, -8.838623046875, -8.44580078125, -8.052978515625, -7.66015625, -7.267333984375, -6.87451171875, -6.481689453125, -6.0888671875, -5.696044921875, -5.30322265625, -4.910400390625, -4.517578125, -4.124755859375, -3.73193359375, -3.339111328125, -2.9462890625, -2.553466796875, -2.16064453125, -1.767822265625, -1.375, -0.982177734375, -0.58935546875, -0.196533203125, 0.1962890625, 0.589111328125, 0.98193359375, 1.374755859375, 1.767578125, 2.160400390625, 2.55322265625, 2.946044921875, 3.3388671875, 3.731689453125, 4.12451171875, 4.517333984375, 4.91015625, 5.302978515625, 5.69580078125, 6.088623046875, 6.4814453125, 6.874267578125, 7.26708984375, 7.659912109375, 8.052734375, 8.445556640625, 8.83837890625, 9.231201171875, 9.6240234375, 10.016845703125, 10.40966796875, 10.802490234375, 11.1953125]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 4.0, 2.0, 7.0, 4.0, 12.0, 10.0, 13.0, 21.0, 22.0, 44.0, 56.0, 67.0, 101.0, 145.0, 240.0, 353.0, 608.0, 1188.0, 9514.0, 2306540.0, 818212.0, 5825.0, 1095.0, 563.0, 341.0, 223.0, 134.0, 91.0, 68.0, 60.0, 27.0, 22.0, 13.0, 15.0, 18.0, 6.0, 7.0, 11.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-24.765625, -23.989990234375, -23.21435546875, -22.438720703125, -21.6630859375, -20.887451171875, -20.11181640625, -19.336181640625, -18.560546875, -17.784912109375, -17.00927734375, -16.233642578125, -15.4580078125, -14.682373046875, -13.90673828125, -13.131103515625, -12.35546875, -11.579833984375, -10.80419921875, -10.028564453125, -9.2529296875, -8.477294921875, -7.70166015625, -6.926025390625, -6.150390625, -5.374755859375, -4.59912109375, -3.823486328125, -3.0478515625, -2.272216796875, -1.49658203125, -0.720947265625, 0.0546875, 0.830322265625, 1.60595703125, 2.381591796875, 3.1572265625, 3.932861328125, 4.70849609375, 5.484130859375, 6.259765625, 7.035400390625, 7.81103515625, 8.586669921875, 9.3623046875, 10.137939453125, 10.91357421875, 11.689208984375, 12.46484375, 13.240478515625, 14.01611328125, 14.791748046875, 15.5673828125, 16.343017578125, 17.11865234375, 17.894287109375, 18.669921875, 19.445556640625, 20.22119140625, 20.996826171875, 21.7724609375, 22.548095703125, 23.32373046875, 24.099365234375, 24.875]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 7.0, 680.0, 331.0, 0.0, 0.0, 1.0], "bins": [-405.9640197753906, -399.18408203125, -392.4041442871094, -385.62420654296875, -378.84423828125, -372.0643005371094, -365.28436279296875, -358.5044250488281, -351.7244873046875, -344.9445495605469, -338.16461181640625, -331.3846435546875, -324.6047058105469, -317.82476806640625, -311.0448303222656, -304.264892578125, -297.48492431640625, -290.7049865722656, -283.925048828125, -277.14508056640625, -270.3651428222656, -263.585205078125, -256.8052673339844, -250.02532958984375, -243.24539184570312, -236.4654541015625, -229.6855010986328, -222.9055633544922, -216.12562561035156, -209.34567260742188, -202.56573486328125, -195.78579711914062, -189.005859375, -182.22592163085938, -175.4459686279297, -168.66603088378906, -161.88609313964844, -155.10614013671875, -148.32620239257812, -141.5462646484375, -134.7663116455078, -127.98636627197266, -121.20642852783203, -114.42648315429688, -107.64654541015625, -100.8666000366211, -94.08665466308594, -87.30671691894531, -80.52677154541016, -73.746826171875, -66.96688842773438, -60.18694305419922, -53.40700149536133, -46.62705993652344, -39.84711456298828, -33.06717300415039, -26.287233352661133, -19.50728988647461, -12.727348327636719, -5.947404861450195, 0.8325366973876953, 7.612478256225586, 14.392423629760742, 21.172365188598633, 27.952306747436523]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 5.0, 4.0, 12.0, 12.0, 12.0, 13.0, 16.0, 29.0, 17.0, 27.0, 26.0, 27.0, 34.0, 43.0, 50.0, 39.0, 37.0, 47.0, 47.0, 47.0, 45.0, 40.0, 37.0, 43.0, 32.0, 40.0, 38.0, 22.0, 27.0, 25.0, 19.0, 16.0, 15.0, 15.0, 9.0, 5.0, 7.0, 8.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.35944366455078, -23.451749801635742, -22.544055938720703, -21.63636016845703, -20.728666305541992, -19.820972442626953, -18.913278579711914, -18.005584716796875, -17.097890853881836, -16.190196990966797, -15.282502174377441, -14.374808311462402, -13.467114448547363, -12.559419631958008, -11.651725769042969, -10.74403190612793, -9.836337089538574, -8.928643226623535, -8.02094841003418, -7.113254547119141, -6.205560684204102, -5.297866344451904, -4.390172004699707, -3.482478141784668, -2.5747838020324707, -1.6670897006988525, -0.7593954801559448, 0.1482987403869629, 1.055992841720581, 1.9636869430541992, 2.8713812828063965, 3.7790751457214355, 4.686769485473633, 5.59446382522583, 6.502157688140869, 7.409852027893066, 8.317545890808105, 9.225240707397461, 10.1329345703125, 11.040628433227539, 11.948322296142578, 12.856016159057617, 13.763710975646973, 14.671404838562012, 15.57909870147705, 16.486793518066406, 17.394487380981445, 18.302181243896484, 19.209877014160156, 20.117570877075195, 21.025264739990234, 21.932960510253906, 22.840654373168945, 23.748348236083984, 24.656042098999023, 25.563735961914062, 26.4714298248291, 27.37912368774414, 28.28681755065918, 29.19451141357422, 30.10220718383789, 31.00990104675293, 31.91759490966797, 32.825286865234375, 33.73298263549805]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 1.0, 3.0, 5.0, 9.0, 14.0, 5.0, 7.0, 8.0, 14.0, 18.0, 23.0, 21.0, 24.0, 20.0, 24.0, 33.0, 28.0, 33.0, 29.0, 38.0, 37.0, 37.0, 48.0, 47.0, 40.0, 48.0, 43.0, 35.0, 35.0, 36.0, 26.0, 26.0, 26.0, 23.0, 32.0, 8.0, 24.0, 17.0, 12.0, 6.0, 12.0, 8.0, 3.0, 7.0, 3.0, 5.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.748046875, -3.620086669921875, -3.49212646484375, -3.364166259765625, -3.2362060546875, -3.108245849609375, -2.98028564453125, -2.852325439453125, -2.724365234375, -2.596405029296875, -2.46844482421875, -2.340484619140625, -2.2125244140625, -2.084564208984375, -1.95660400390625, -1.828643798828125, -1.70068359375, -1.572723388671875, -1.44476318359375, -1.316802978515625, -1.1888427734375, -1.060882568359375, -0.93292236328125, -0.804962158203125, -0.677001953125, -0.549041748046875, -0.42108154296875, -0.293121337890625, -0.1651611328125, -0.037200927734375, 0.09075927734375, 0.218719482421875, 0.3466796875, 0.474639892578125, 0.60260009765625, 0.730560302734375, 0.8585205078125, 0.986480712890625, 1.11444091796875, 1.242401123046875, 1.370361328125, 1.498321533203125, 1.62628173828125, 1.754241943359375, 1.8822021484375, 2.010162353515625, 2.13812255859375, 2.266082763671875, 2.39404296875, 2.522003173828125, 2.64996337890625, 2.777923583984375, 2.9058837890625, 3.033843994140625, 3.16180419921875, 3.289764404296875, 3.417724609375, 3.545684814453125, 3.67364501953125, 3.801605224609375, 3.9295654296875, 4.057525634765625, 4.18548583984375, 4.313446044921875, 4.44140625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 5.0, 8.0, 5.0, 6.0, 5.0, 8.0, 8.0, 9.0, 9.0, 19.0, 25.0, 36.0, 23.0, 40.0, 69.0, 80.0, 129.0, 206.0, 360.0, 563.0, 1405.0, 4516.0, 20905.0, 122263.0, 625253.0, 1673659.0, 1301606.0, 363675.0, 63353.0, 10911.0, 2817.0, 1002.0, 481.0, 229.0, 171.0, 89.0, 73.0, 64.0, 49.0, 28.0, 29.0, 24.0, 15.0, 8.0, 17.0, 5.0, 10.0, 4.0, 4.0, 5.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.44140625, -4.28173828125, -4.1220703125, -3.96240234375, -3.802734375, -3.64306640625, -3.4833984375, -3.32373046875, -3.1640625, -3.00439453125, -2.8447265625, -2.68505859375, -2.525390625, -2.36572265625, -2.2060546875, -2.04638671875, -1.88671875, -1.72705078125, -1.5673828125, -1.40771484375, -1.248046875, -1.08837890625, -0.9287109375, -0.76904296875, -0.609375, -0.44970703125, -0.2900390625, -0.13037109375, 0.029296875, 0.18896484375, 0.3486328125, 0.50830078125, 0.66796875, 0.82763671875, 0.9873046875, 1.14697265625, 1.306640625, 1.46630859375, 1.6259765625, 1.78564453125, 1.9453125, 2.10498046875, 2.2646484375, 2.42431640625, 2.583984375, 2.74365234375, 2.9033203125, 3.06298828125, 3.22265625, 3.38232421875, 3.5419921875, 3.70166015625, 3.861328125, 4.02099609375, 4.1806640625, 4.34033203125, 4.5, 4.65966796875, 4.8193359375, 4.97900390625, 5.138671875, 5.29833984375, 5.4580078125, 5.61767578125, 5.77734375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 3.0, 3.0, 9.0, 14.0, 10.0, 21.0, 27.0, 30.0, 43.0, 54.0, 77.0, 129.0, 170.0, 241.0, 324.0, 429.0, 461.0, 450.0, 391.0, 311.0, 245.0, 171.0, 116.0, 75.0, 55.0, 47.0, 46.0, 29.0, 19.0, 18.0, 12.0, 8.0, 7.0, 6.0, 7.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.1953125, -5.0218505859375, -4.848388671875, -4.6749267578125, -4.50146484375, -4.3280029296875, -4.154541015625, -3.9810791015625, -3.8076171875, -3.6341552734375, -3.460693359375, -3.2872314453125, -3.11376953125, -2.9403076171875, -2.766845703125, -2.5933837890625, -2.419921875, -2.2464599609375, -2.072998046875, -1.8995361328125, -1.72607421875, -1.5526123046875, -1.379150390625, -1.2056884765625, -1.0322265625, -0.8587646484375, -0.685302734375, -0.5118408203125, -0.33837890625, -0.1649169921875, 0.008544921875, 0.1820068359375, 0.35546875, 0.5289306640625, 0.702392578125, 0.8758544921875, 1.04931640625, 1.2227783203125, 1.396240234375, 1.5697021484375, 1.7431640625, 1.9166259765625, 2.090087890625, 2.2635498046875, 2.43701171875, 2.6104736328125, 2.783935546875, 2.9573974609375, 3.130859375, 3.3043212890625, 3.477783203125, 3.6512451171875, 3.82470703125, 3.9981689453125, 4.171630859375, 4.3450927734375, 4.5185546875, 4.6920166015625, 4.865478515625, 5.0389404296875, 5.21240234375, 5.3858642578125, 5.559326171875, 5.7327880859375, 5.90625]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 2.0, 3.0, 10.0, 4.0, 7.0, 15.0, 14.0, 16.0, 27.0, 47.0, 43.0, 61.0, 93.0, 153.0, 229.0, 431.0, 889.0, 2595.0, 11772.0, 82810.0, 1055865.0, 2727464.0, 273268.0, 29895.0, 5487.0, 1616.0, 612.0, 293.0, 190.0, 125.0, 63.0, 47.0, 36.0, 37.0, 16.0, 11.0, 18.0, 5.0, 7.0, 5.0, 0.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.40625, -7.1129150390625, -6.819580078125, -6.5262451171875, -6.23291015625, -5.9395751953125, -5.646240234375, -5.3529052734375, -5.0595703125, -4.7662353515625, -4.472900390625, -4.1795654296875, -3.88623046875, -3.5928955078125, -3.299560546875, -3.0062255859375, -2.712890625, -2.4195556640625, -2.126220703125, -1.8328857421875, -1.53955078125, -1.2462158203125, -0.952880859375, -0.6595458984375, -0.3662109375, -0.0728759765625, 0.220458984375, 0.5137939453125, 0.80712890625, 1.1004638671875, 1.393798828125, 1.6871337890625, 1.98046875, 2.2738037109375, 2.567138671875, 2.8604736328125, 3.15380859375, 3.4471435546875, 3.740478515625, 4.0338134765625, 4.3271484375, 4.6204833984375, 4.913818359375, 5.2071533203125, 5.50048828125, 5.7938232421875, 6.087158203125, 6.3804931640625, 6.673828125, 6.9671630859375, 7.260498046875, 7.5538330078125, 7.84716796875, 8.1405029296875, 8.433837890625, 8.7271728515625, 9.0205078125, 9.3138427734375, 9.607177734375, 9.9005126953125, 10.19384765625, 10.4871826171875, 10.780517578125, 11.0738525390625, 11.3671875]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 12.0, 89.0, 265.0, 371.0, 221.0, 41.0, 10.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.562997817993164, -20.562423706054688, -18.56184959411621, -16.561275482177734, -14.560702323913574, -12.560128211975098, -10.559555053710938, -8.558980941772461, -6.558406829833984, -4.557832717895508, -2.5572590827941895, -0.5566854476928711, 1.4438886642456055, 3.444462776184082, 5.445035934448242, 7.445610046386719, 9.446184158325195, 11.446758270263672, 13.447332382202148, 15.447905540466309, 17.44847869873047, 19.449054718017578, 21.449626922607422, 23.4502010345459, 25.450775146484375, 27.45134925842285, 29.451923370361328, 31.452495574951172, 33.45307159423828, 35.453643798828125, 37.45421600341797, 39.45479202270508, 41.45536804199219, 43.45594024658203, 45.45651626586914, 47.457088470458984, 49.457664489746094, 51.45823669433594, 53.45880889892578, 55.45938491821289, 57.4599609375, 59.460533142089844, 61.46110916137695, 63.4616813659668, 65.4622573852539, 67.46282958984375, 69.4634017944336, 71.46397399902344, 73.46455383300781, 75.46512603759766, 77.4656982421875, 79.46627807617188, 81.46685028076172, 83.46742248535156, 85.4679946899414, 87.46856689453125, 89.4691390991211, 91.46971130371094, 93.47028350830078, 95.47086334228516, 97.471435546875, 99.47200775146484, 101.47257995605469, 103.47315979003906, 105.4737319946289]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 6.0, 1.0, 4.0, 4.0, 3.0, 9.0, 9.0, 6.0, 10.0, 16.0, 9.0, 18.0, 13.0, 24.0, 21.0, 24.0, 34.0, 35.0, 32.0, 29.0, 40.0, 41.0, 41.0, 38.0, 47.0, 33.0, 40.0, 29.0, 42.0, 40.0, 49.0, 32.0, 22.0, 35.0, 29.0, 26.0, 19.0, 20.0, 20.0, 15.0, 8.0, 7.0, 10.0, 9.0, 5.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.538654327392578, -19.92561149597168, -19.31256866455078, -18.699525833129883, -18.086483001708984, -17.473440170288086, -16.860397338867188, -16.24735450744629, -15.63431167602539, -15.021268844604492, -14.408226013183594, -13.795183181762695, -13.182140350341797, -12.569097518920898, -11.9560546875, -11.343011856079102, -10.729969024658203, -10.116926193237305, -9.503883361816406, -8.890840530395508, -8.27779769897461, -7.664754867553711, -7.0517120361328125, -6.438669204711914, -5.825626373291016, -5.212583541870117, -4.599540710449219, -3.9864978790283203, -3.373455047607422, -2.7604122161865234, -2.147369384765625, -1.5343265533447266, -0.9212818145751953, -0.3082389831542969, 0.30480384826660156, 0.9178466796875, 1.5308895111083984, 2.143932342529297, 2.7569751739501953, 3.3700180053710938, 3.983060836791992, 4.596103668212891, 5.209146499633789, 5.8221893310546875, 6.435232162475586, 7.048274993896484, 7.661317825317383, 8.274360656738281, 8.88740348815918, 9.500446319580078, 10.113489151000977, 10.726531982421875, 11.339574813842773, 11.952617645263672, 12.56566047668457, 13.178703308105469, 13.791746139526367, 14.404788970947266, 15.017831802368164, 15.630874633789062, 16.24391746520996, 16.85696029663086, 17.470003128051758, 18.083045959472656, 18.696088790893555]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 12.0, 10.0, 6.0, 12.0, 9.0, 15.0, 16.0, 17.0, 17.0, 33.0, 21.0, 28.0, 27.0, 33.0, 33.0, 30.0, 41.0, 43.0, 32.0, 51.0, 44.0, 36.0, 37.0, 33.0, 42.0, 36.0, 36.0, 31.0, 28.0, 29.0, 27.0, 19.0, 20.0, 19.0, 10.0, 13.0, 8.0, 14.0, 10.0, 7.0, 4.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.8671875, -3.74310302734375, -3.6190185546875, -3.49493408203125, -3.370849609375, -3.24676513671875, -3.1226806640625, -2.99859619140625, -2.87451171875, -2.75042724609375, -2.6263427734375, -2.50225830078125, -2.378173828125, -2.25408935546875, -2.1300048828125, -2.00592041015625, -1.8818359375, -1.75775146484375, -1.6336669921875, -1.50958251953125, -1.385498046875, -1.26141357421875, -1.1373291015625, -1.01324462890625, -0.88916015625, -0.76507568359375, -0.6409912109375, -0.51690673828125, -0.392822265625, -0.26873779296875, -0.1446533203125, -0.02056884765625, 0.103515625, 0.22760009765625, 0.3516845703125, 0.47576904296875, 0.599853515625, 0.72393798828125, 0.8480224609375, 0.97210693359375, 1.09619140625, 1.22027587890625, 1.3443603515625, 1.46844482421875, 1.592529296875, 1.71661376953125, 1.8406982421875, 1.96478271484375, 2.0888671875, 2.21295166015625, 2.3370361328125, 2.46112060546875, 2.585205078125, 2.70928955078125, 2.8333740234375, 2.95745849609375, 3.08154296875, 3.20562744140625, 3.3297119140625, 3.45379638671875, 3.577880859375, 3.70196533203125, 3.8260498046875, 3.95013427734375, 4.07421875]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 2.0, 2.0, 5.0, 8.0, 5.0, 16.0, 27.0, 21.0, 41.0, 60.0, 98.0, 134.0, 196.0, 292.0, 438.0, 632.0, 910.0, 1434.0, 2152.0, 3368.0, 4951.0, 7604.0, 11870.0, 18129.0, 29093.0, 46800.0, 79641.0, 145977.0, 277181.0, 177911.0, 93070.0, 54157.0, 33106.0, 20708.0, 13486.0, 8556.0, 5490.0, 3783.0, 2454.0, 1504.0, 1018.0, 710.0, 517.0, 305.0, 223.0, 169.0, 90.0, 69.0, 45.0, 43.0, 21.0, 17.0, 6.0, 11.0, 4.0, 1.0, 6.0, 0.0, 0.0, 3.0], "bins": [-0.734375, -0.7118759155273438, -0.6893768310546875, -0.6668777465820312, -0.644378662109375, -0.6218795776367188, -0.5993804931640625, -0.5768814086914062, -0.55438232421875, -0.5318832397460938, -0.5093841552734375, -0.48688507080078125, -0.464385986328125, -0.44188690185546875, -0.4193878173828125, -0.39688873291015625, -0.3743896484375, -0.35189056396484375, -0.3293914794921875, -0.30689239501953125, -0.284393310546875, -0.26189422607421875, -0.2393951416015625, -0.21689605712890625, -0.19439697265625, -0.17189788818359375, -0.1493988037109375, -0.12689971923828125, -0.104400634765625, -0.08190155029296875, -0.0594024658203125, -0.03690338134765625, -0.014404296875, 0.00809478759765625, 0.0305938720703125, 0.05309295654296875, 0.075592041015625, 0.09809112548828125, 0.1205902099609375, 0.14308929443359375, 0.16558837890625, 0.18808746337890625, 0.2105865478515625, 0.23308563232421875, 0.255584716796875, 0.27808380126953125, 0.3005828857421875, 0.32308197021484375, 0.3455810546875, 0.36808013916015625, 0.3905792236328125, 0.41307830810546875, 0.435577392578125, 0.45807647705078125, 0.4805755615234375, 0.5030746459960938, 0.52557373046875, 0.5480728149414062, 0.5705718994140625, 0.5930709838867188, 0.615570068359375, 0.6380691528320312, 0.6605682373046875, 0.6830673217773438, 0.70556640625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 7.0, 9.0, 8.0, 9.0, 5.0, 12.0, 15.0, 9.0, 15.0, 23.0, 35.0, 23.0, 28.0, 41.0, 41.0, 35.0, 38.0, 35.0, 31.0, 49.0, 36.0, 1071.0, 40.0, 40.0, 36.0, 35.0, 41.0, 28.0, 24.0, 37.0, 26.0, 32.0, 20.0, 14.0, 21.0, 16.0, 8.0, 8.0, 9.0, 6.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.83203125, -2.747344970703125, -2.66265869140625, -2.577972412109375, -2.4932861328125, -2.408599853515625, -2.32391357421875, -2.239227294921875, -2.154541015625, -2.069854736328125, -1.98516845703125, -1.900482177734375, -1.8157958984375, -1.731109619140625, -1.64642333984375, -1.561737060546875, -1.47705078125, -1.392364501953125, -1.30767822265625, -1.222991943359375, -1.1383056640625, -1.053619384765625, -0.96893310546875, -0.884246826171875, -0.799560546875, -0.714874267578125, -0.63018798828125, -0.545501708984375, -0.4608154296875, -0.376129150390625, -0.29144287109375, -0.206756591796875, -0.1220703125, -0.037384033203125, 0.04730224609375, 0.131988525390625, 0.2166748046875, 0.301361083984375, 0.38604736328125, 0.470733642578125, 0.555419921875, 0.640106201171875, 0.72479248046875, 0.809478759765625, 0.8941650390625, 0.978851318359375, 1.06353759765625, 1.148223876953125, 1.23291015625, 1.317596435546875, 1.40228271484375, 1.486968994140625, 1.5716552734375, 1.656341552734375, 1.74102783203125, 1.825714111328125, 1.910400390625, 1.995086669921875, 2.07977294921875, 2.164459228515625, 2.2491455078125, 2.333831787109375, 2.41851806640625, 2.503204345703125, 2.587890625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 7.0, 13.0, 19.0, 28.0, 39.0, 61.0, 93.0, 155.0, 211.0, 334.0, 491.0, 703.0, 1066.0, 1593.0, 2403.0, 3568.0, 5539.0, 8612.0, 13501.0, 21433.0, 34299.0, 58389.0, 104573.0, 218118.0, 1319128.0, 124744.0, 68872.0, 40489.0, 24676.0, 15432.0, 9776.0, 6370.0, 4159.0, 2762.0, 1890.0, 1277.0, 814.0, 529.0, 345.0, 218.0, 149.0, 99.0, 56.0, 28.0, 33.0, 18.0, 5.0, 11.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.7587890625, -0.7358932495117188, -0.7129974365234375, -0.6901016235351562, -0.667205810546875, -0.6443099975585938, -0.6214141845703125, -0.5985183715820312, -0.57562255859375, -0.5527267456054688, -0.5298309326171875, -0.5069351196289062, -0.484039306640625, -0.46114349365234375, -0.4382476806640625, -0.41535186767578125, -0.3924560546875, -0.36956024169921875, -0.3466644287109375, -0.32376861572265625, -0.300872802734375, -0.27797698974609375, -0.2550811767578125, -0.23218536376953125, -0.20928955078125, -0.18639373779296875, -0.1634979248046875, -0.14060211181640625, -0.117706298828125, -0.09481048583984375, -0.0719146728515625, -0.04901885986328125, -0.026123046875, -0.00322723388671875, 0.0196685791015625, 0.04256439208984375, 0.065460205078125, 0.08835601806640625, 0.1112518310546875, 0.13414764404296875, 0.15704345703125, 0.17993927001953125, 0.2028350830078125, 0.22573089599609375, 0.248626708984375, 0.27152252197265625, 0.2944183349609375, 0.31731414794921875, 0.3402099609375, 0.36310577392578125, 0.3860015869140625, 0.40889739990234375, 0.431793212890625, 0.45468902587890625, 0.4775848388671875, 0.5004806518554688, 0.52337646484375, 0.5462722778320312, 0.5691680908203125, 0.5920639038085938, 0.614959716796875, 0.6378555297851562, 0.6607513427734375, 0.6836471557617188, 0.70654296875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 8.0, 5.0, 10.0, 14.0, 11.0, 13.0, 17.0, 19.0, 32.0, 32.0, 41.0, 56.0, 57.0, 63.0, 65.0, 78.0, 84.0, 71.0, 53.0, 33.0, 46.0, 41.0, 36.0, 22.0, 18.0, 15.0, 12.0, 8.0, 3.0, 15.0, 4.0, 5.0, 1.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004181861877441406, -0.000403478741645813, -0.00038877129554748535, -0.0003740638494491577, -0.0003593564033508301, -0.00034464895725250244, -0.0003299415111541748, -0.00031523406505584717, -0.00030052661895751953, -0.0002858191728591919, -0.00027111172676086426, -0.0002564042806625366, -0.00024169683456420898, -0.00022698938846588135, -0.0002122819423675537, -0.00019757449626922607, -0.00018286705017089844, -0.0001681596040725708, -0.00015345215797424316, -0.00013874471187591553, -0.0001240372657775879, -0.00010932981967926025, -9.462237358093262e-05, -7.991492748260498e-05, -6.520748138427734e-05, -5.050003528594971e-05, -3.579258918762207e-05, -2.1085143089294434e-05, -6.377696990966797e-06, 8.32974910736084e-06, 2.3037195205688477e-05, 3.774464130401611e-05, 5.245208740234375e-05, 6.715953350067139e-05, 8.186697959899902e-05, 9.657442569732666e-05, 0.0001112818717956543, 0.00012598931789398193, 0.00014069676399230957, 0.0001554042100906372, 0.00017011165618896484, 0.00018481910228729248, 0.00019952654838562012, 0.00021423399448394775, 0.0002289414405822754, 0.00024364888668060303, 0.00025835633277893066, 0.0002730637788772583, 0.00028777122497558594, 0.0003024786710739136, 0.0003171861171722412, 0.00033189356327056885, 0.0003466010093688965, 0.0003613084554672241, 0.00037601590156555176, 0.0003907233476638794, 0.00040543079376220703, 0.00042013823986053467, 0.0004348456859588623, 0.00044955313205718994, 0.0004642605781555176, 0.0004789680242538452, 0.0004936754703521729, 0.0005083829164505005, 0.0005230903625488281]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 7.0, 6.0, 3.0, 4.0, 5.0, 6.0, 13.0, 17.0, 20.0, 21.0, 21.0, 38.0, 41.0, 66.0, 94.0, 135.0, 198.0, 283.0, 555.0, 1271.0, 362612.0, 680038.0, 1544.0, 603.0, 303.0, 187.0, 130.0, 80.0, 67.0, 31.0, 35.0, 28.0, 26.0, 17.0, 13.0, 11.0, 6.0, 4.0, 6.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.01032257080078125, -0.010043919086456299, -0.009765267372131348, -0.009486615657806396, -0.009207963943481445, -0.008929312229156494, -0.008650660514831543, -0.008372008800506592, -0.00809335708618164, -0.00781470537185669, -0.007536053657531738, -0.007257401943206787, -0.006978750228881836, -0.006700098514556885, -0.006421446800231934, -0.006142795085906982, -0.005864143371582031, -0.00558549165725708, -0.005306839942932129, -0.005028188228607178, -0.0047495365142822266, -0.004470884799957275, -0.004192233085632324, -0.003913581371307373, -0.003634929656982422, -0.0033562779426574707, -0.0030776262283325195, -0.0027989745140075684, -0.002520322799682617, -0.002241671085357666, -0.001963019371032715, -0.0016843676567077637, -0.0014057159423828125, -0.0011270642280578613, -0.0008484125137329102, -0.000569760799407959, -0.0002911090850830078, -1.245737075805664e-05, 0.00026619434356689453, 0.0005448460578918457, 0.0008234977722167969, 0.001102149486541748, 0.0013808012008666992, 0.0016594529151916504, 0.0019381046295166016, 0.0022167563438415527, 0.002495408058166504, 0.002774059772491455, 0.0030527114868164062, 0.0033313632011413574, 0.0036100149154663086, 0.0038886666297912598, 0.004167318344116211, 0.004445970058441162, 0.004724621772766113, 0.0050032734870910645, 0.005281925201416016, 0.005560576915740967, 0.005839228630065918, 0.006117880344390869, 0.00639653205871582, 0.0066751837730407715, 0.006953835487365723, 0.007232487201690674, 0.007511138916015625]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 14.0, 49.0, 103.0, 199.0, 230.0, 177.0, 139.0, 57.0, 20.0, 15.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0006207413389347494, -0.0006061834865249693, -0.0005916256923228502, -0.0005770678399130702, -0.0005625099875032902, -0.0005479521350935102, -0.0005333942826837301, -0.000518836488481611, -0.000504278636071831, -0.000489720783662051, -0.0004751629603561014, -0.0004606051370501518, -0.0004460472846403718, -0.0004314894322305918, -0.0004169316089246422, -0.00040237378561869264, -0.0003878159332089126, -0.0003732580807991326, -0.000358700257493183, -0.00034414243418723345, -0.0003295845817774534, -0.0003150267293676734, -0.00030046890606172383, -0.00028591108275577426, -0.00027135323034599423, -0.0002567953779362142, -0.00024223755463026464, -0.00022767971677239984, -0.00021312187891453505, -0.00019856404105667025, -0.00018400620319880545, -0.00016944836534094065, -0.00015489052748307586, -0.00014033268962521106, -0.00012577485176734626, -0.00011121701390948147, -9.665917605161667e-05, -8.210133819375187e-05, -6.754350033588707e-05, -5.298566247802228e-05, -3.842782462015748e-05, -2.3869986762292683e-05, -9.312148904427886e-06, 5.245688953436911e-06, 1.9803526811301708e-05, 3.4361364669166505e-05, 4.89192025270313e-05, 6.34770403848961e-05, 7.80348782427609e-05, 9.25927161006257e-05, 0.00010715055395849049, 0.00012170839181635529, 0.00013626622967422009, 0.00015082406753208488, 0.00016538190538994968, 0.00017993974324781448, 0.00019449758110567927, 0.00020905541896354407, 0.00022361325682140887, 0.00023817109467927366, 0.00025272893253713846, 0.0002672867849469185, 0.00028184460825286806, 0.0002964024315588176, 0.00031096028396859765]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 0.0, 3.0, 6.0, 7.0, 9.0, 3.0, 6.0, 11.0, 10.0, 13.0, 10.0, 17.0, 15.0, 17.0, 30.0, 32.0, 35.0, 35.0, 32.0, 24.0, 38.0, 49.0, 45.0, 29.0, 35.0, 36.0, 32.0, 35.0, 34.0, 41.0, 35.0, 30.0, 33.0, 29.0, 34.0, 21.0, 20.0, 29.0, 18.0, 13.0, 19.0, 6.0, 8.0, 3.0, 7.0, 8.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00019699335098266602, -0.0001905057579278946, -0.00018401816487312317, -0.00017753057181835175, -0.00017104297876358032, -0.0001645553857088089, -0.00015806779265403748, -0.00015158019959926605, -0.00014509260654449463, -0.0001386050134897232, -0.00013211742043495178, -0.00012562982738018036, -0.00011914223432540894, -0.00011265464127063751, -0.00010616704821586609, -9.967945516109467e-05, -9.319186210632324e-05, -8.670426905155182e-05, -8.02166759967804e-05, -7.372908294200897e-05, -6.724148988723755e-05, -6.0753896832466125e-05, -5.42663037776947e-05, -4.777871072292328e-05, -4.1291117668151855e-05, -3.480352461338043e-05, -2.831593155860901e-05, -2.1828338503837585e-05, -1.5340745449066162e-05, -8.853152394294739e-06, -2.3655593395233154e-06, 4.122033715248108e-06, 1.0609626770019531e-05, 1.7097219824790955e-05, 2.3584812879562378e-05, 3.00724059343338e-05, 3.6559998989105225e-05, 4.304759204387665e-05, 4.953518509864807e-05, 5.6022778153419495e-05, 6.251037120819092e-05, 6.899796426296234e-05, 7.548555731773376e-05, 8.197315037250519e-05, 8.846074342727661e-05, 9.494833648204803e-05, 0.00010143592953681946, 0.00010792352259159088, 0.0001144111156463623, 0.00012089870870113373, 0.00012738630175590515, 0.00013387389481067657, 0.000140361487865448, 0.00014684908092021942, 0.00015333667397499084, 0.00015982426702976227, 0.0001663118600845337, 0.00017279945313930511, 0.00017928704619407654, 0.00018577463924884796, 0.00019226223230361938, 0.0001987498253583908, 0.00020523741841316223, 0.00021172501146793365, 0.00021821260452270508]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 12.0, 10.0, 6.0, 12.0, 9.0, 15.0, 16.0, 17.0, 17.0, 33.0, 21.0, 28.0, 27.0, 33.0, 33.0, 30.0, 41.0, 43.0, 32.0, 51.0, 44.0, 36.0, 37.0, 33.0, 42.0, 36.0, 36.0, 31.0, 28.0, 29.0, 27.0, 19.0, 20.0, 19.0, 10.0, 13.0, 8.0, 14.0, 10.0, 7.0, 4.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.8671875, -3.74310302734375, -3.6190185546875, -3.49493408203125, -3.370849609375, -3.24676513671875, -3.1226806640625, -2.99859619140625, -2.87451171875, -2.75042724609375, -2.6263427734375, -2.50225830078125, -2.378173828125, -2.25408935546875, -2.1300048828125, -2.00592041015625, -1.8818359375, -1.75775146484375, -1.6336669921875, -1.50958251953125, -1.385498046875, -1.26141357421875, -1.1373291015625, -1.01324462890625, -0.88916015625, -0.76507568359375, -0.6409912109375, -0.51690673828125, -0.392822265625, -0.26873779296875, -0.1446533203125, -0.02056884765625, 0.103515625, 0.22760009765625, 0.3516845703125, 0.47576904296875, 0.599853515625, 0.72393798828125, 0.8480224609375, 0.97210693359375, 1.09619140625, 1.22027587890625, 1.3443603515625, 1.46844482421875, 1.592529296875, 1.71661376953125, 1.8406982421875, 1.96478271484375, 2.0888671875, 2.21295166015625, 2.3370361328125, 2.46112060546875, 2.585205078125, 2.70928955078125, 2.8333740234375, 2.95745849609375, 3.08154296875, 3.20562744140625, 3.3297119140625, 3.45379638671875, 3.577880859375, 3.70196533203125, 3.8260498046875, 3.95013427734375, 4.07421875]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 4.0, 8.0, 3.0, 6.0, 9.0, 15.0, 22.0, 30.0, 39.0, 57.0, 61.0, 64.0, 97.0, 124.0, 192.0, 253.0, 346.0, 500.0, 767.0, 1344.0, 2880.0, 6768.0, 20609.0, 68648.0, 207210.0, 379909.0, 237712.0, 81141.0, 24673.0, 7712.0, 3034.0, 1558.0, 868.0, 510.0, 351.0, 267.0, 177.0, 140.0, 102.0, 107.0, 65.0, 39.0, 41.0, 23.0, 18.0, 19.0, 18.0, 6.0, 9.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.0390625, -4.87945556640625, -4.7198486328125, -4.56024169921875, -4.400634765625, -4.24102783203125, -4.0814208984375, -3.92181396484375, -3.76220703125, -3.60260009765625, -3.4429931640625, -3.28338623046875, -3.123779296875, -2.96417236328125, -2.8045654296875, -2.64495849609375, -2.4853515625, -2.32574462890625, -2.1661376953125, -2.00653076171875, -1.846923828125, -1.68731689453125, -1.5277099609375, -1.36810302734375, -1.20849609375, -1.04888916015625, -0.8892822265625, -0.72967529296875, -0.570068359375, -0.41046142578125, -0.2508544921875, -0.09124755859375, 0.068359375, 0.22796630859375, 0.3875732421875, 0.54718017578125, 0.706787109375, 0.86639404296875, 1.0260009765625, 1.18560791015625, 1.34521484375, 1.50482177734375, 1.6644287109375, 1.82403564453125, 1.983642578125, 2.14324951171875, 2.3028564453125, 2.46246337890625, 2.6220703125, 2.78167724609375, 2.9412841796875, 3.10089111328125, 3.260498046875, 3.42010498046875, 3.5797119140625, 3.73931884765625, 3.89892578125, 4.05853271484375, 4.2181396484375, 4.37774658203125, 4.537353515625, 4.69696044921875, 4.8565673828125, 5.01617431640625, 5.17578125]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 6.0, 7.0, 10.0, 7.0, 16.0, 14.0, 16.0, 23.0, 27.0, 27.0, 30.0, 33.0, 41.0, 52.0, 54.0, 77.0, 162.0, 323.0, 1413.0, 185.0, 87.0, 73.0, 57.0, 48.0, 39.0, 44.0, 38.0, 22.0, 27.0, 22.0, 14.0, 13.0, 5.0, 8.0, 4.0, 4.0, 4.0, 6.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-11.8125, -11.4320068359375, -11.051513671875, -10.6710205078125, -10.29052734375, -9.9100341796875, -9.529541015625, -9.1490478515625, -8.7685546875, -8.3880615234375, -8.007568359375, -7.6270751953125, -7.24658203125, -6.8660888671875, -6.485595703125, -6.1051025390625, -5.724609375, -5.3441162109375, -4.963623046875, -4.5831298828125, -4.20263671875, -3.8221435546875, -3.441650390625, -3.0611572265625, -2.6806640625, -2.3001708984375, -1.919677734375, -1.5391845703125, -1.15869140625, -0.7781982421875, -0.397705078125, -0.0172119140625, 0.36328125, 0.7437744140625, 1.124267578125, 1.5047607421875, 1.88525390625, 2.2657470703125, 2.646240234375, 3.0267333984375, 3.4072265625, 3.7877197265625, 4.168212890625, 4.5487060546875, 4.92919921875, 5.3096923828125, 5.690185546875, 6.0706787109375, 6.451171875, 6.8316650390625, 7.212158203125, 7.5926513671875, 7.97314453125, 8.3536376953125, 8.734130859375, 9.1146240234375, 9.4951171875, 9.8756103515625, 10.256103515625, 10.6365966796875, 11.01708984375, 11.3975830078125, 11.778076171875, 12.1585693359375, 12.5390625]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 6.0, 8.0, 3.0, 15.0, 12.0, 17.0, 30.0, 40.0, 49.0, 71.0, 86.0, 132.0, 249.0, 356.0, 612.0, 1252.0, 6442.0, 2666720.0, 463996.0, 3304.0, 896.0, 480.0, 305.0, 208.0, 135.0, 85.0, 55.0, 42.0, 33.0, 15.0, 25.0, 9.0, 10.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.953125, -30.09033203125, -29.2275390625, -28.36474609375, -27.501953125, -26.63916015625, -25.7763671875, -24.91357421875, -24.05078125, -23.18798828125, -22.3251953125, -21.46240234375, -20.599609375, -19.73681640625, -18.8740234375, -18.01123046875, -17.1484375, -16.28564453125, -15.4228515625, -14.56005859375, -13.697265625, -12.83447265625, -11.9716796875, -11.10888671875, -10.24609375, -9.38330078125, -8.5205078125, -7.65771484375, -6.794921875, -5.93212890625, -5.0693359375, -4.20654296875, -3.34375, -2.48095703125, -1.6181640625, -0.75537109375, 0.107421875, 0.97021484375, 1.8330078125, 2.69580078125, 3.55859375, 4.42138671875, 5.2841796875, 6.14697265625, 7.009765625, 7.87255859375, 8.7353515625, 9.59814453125, 10.4609375, 11.32373046875, 12.1865234375, 13.04931640625, 13.912109375, 14.77490234375, 15.6376953125, 16.50048828125, 17.36328125, 18.22607421875, 19.0888671875, 19.95166015625, 20.814453125, 21.67724609375, 22.5400390625, 23.40283203125, 24.265625]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 8.0, 91.0, 584.0, 316.0, 17.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.23248291015625, -66.64657592773438, -64.0606689453125, -61.474761962890625, -58.888858795166016, -56.30295181274414, -53.717044830322266, -51.131141662597656, -48.54523468017578, -45.959327697753906, -43.37342071533203, -40.787513732910156, -38.20161056518555, -35.61570358276367, -33.0297966003418, -30.443891525268555, -27.857982635498047, -25.272075653076172, -22.68617057800293, -20.100263595581055, -17.514358520507812, -14.928451538085938, -12.342544555664062, -9.75663948059082, -7.170732498168945, -4.584826469421387, -1.99891996383667, 0.5869865417480469, 3.1728925704956055, 5.758798599243164, 8.344705581665039, 10.930610656738281, 13.516517639160156, 16.10242462158203, 18.688329696655273, 21.27423667907715, 23.86014175415039, 26.446048736572266, 29.03195571899414, 31.617860794067383, 34.203765869140625, 36.7896728515625, 39.375579833984375, 41.96148681640625, 44.54738998413086, 47.133296966552734, 49.71920394897461, 52.30510711669922, 54.89101791381836, 57.476924896240234, 60.06283187866211, 62.64873504638672, 65.2346420288086, 67.82054901123047, 70.40645599365234, 72.99236297607422, 75.5782699584961, 78.16417694091797, 80.75008392333984, 83.33599090576172, 85.9218978881836, 88.50779724121094, 91.09370422363281, 93.67961120605469, 96.26551818847656]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 3.0, 4.0, 2.0, 1.0, 7.0, 9.0, 7.0, 11.0, 16.0, 25.0, 24.0, 25.0, 22.0, 30.0, 31.0, 36.0, 43.0, 41.0, 43.0, 45.0, 49.0, 59.0, 38.0, 54.0, 54.0, 42.0, 35.0, 35.0, 25.0, 23.0, 38.0, 27.0, 21.0, 14.0, 18.0, 12.0, 13.0, 9.0, 9.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.111183166503906, -21.219919204711914, -20.328655242919922, -19.437393188476562, -18.54612922668457, -17.654865264892578, -16.76360321044922, -15.872339248657227, -14.981075286865234, -14.089811325073242, -13.198548316955566, -12.30728530883789, -11.416021347045898, -10.524757385253906, -9.63349437713623, -8.742231369018555, -7.8509674072265625, -6.9597039222717285, -6.0684404373168945, -5.1771769523620605, -4.285913467407227, -3.3946499824523926, -2.5033864974975586, -1.6121230125427246, -0.7208595275878906, 0.17040395736694336, 1.0616674423217773, 1.9529309272766113, 2.8441944122314453, 3.7354578971862793, 4.626721382141113, 5.517984867095947, 6.409248352050781, 7.300511837005615, 8.19177532196045, 9.083038330078125, 9.974302291870117, 10.86556625366211, 11.756829261779785, 12.648092269897461, 13.539356231689453, 14.430620193481445, 15.321883201599121, 16.213146209716797, 17.10441017150879, 17.99567413330078, 18.88693618774414, 19.778200149536133, 20.669464111328125, 21.560728073120117, 22.45199203491211, 23.34325408935547, 24.23451805114746, 25.125782012939453, 26.017044067382812, 26.908308029174805, 27.799571990966797, 28.69083595275879, 29.58209991455078, 30.47336196899414, 31.364625930786133, 32.255889892578125, 33.147151947021484, 34.03841781616211, 34.92967987060547]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 7.0, 8.0, 9.0, 11.0, 15.0, 16.0, 17.0, 21.0, 22.0, 29.0, 27.0, 30.0, 29.0, 39.0, 32.0, 36.0, 36.0, 45.0, 52.0, 41.0, 52.0, 31.0, 35.0, 47.0, 39.0, 25.0, 26.0, 26.0, 35.0, 22.0, 23.0, 25.0, 18.0, 13.0, 5.0, 14.0, 6.0, 13.0, 5.0, 7.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.935546875, -3.810150146484375, -3.68475341796875, -3.559356689453125, -3.4339599609375, -3.308563232421875, -3.18316650390625, -3.057769775390625, -2.932373046875, -2.806976318359375, -2.68157958984375, -2.556182861328125, -2.4307861328125, -2.305389404296875, -2.17999267578125, -2.054595947265625, -1.92919921875, -1.803802490234375, -1.67840576171875, -1.553009033203125, -1.4276123046875, -1.302215576171875, -1.17681884765625, -1.051422119140625, -0.926025390625, -0.800628662109375, -0.67523193359375, -0.549835205078125, -0.4244384765625, -0.299041748046875, -0.17364501953125, -0.048248291015625, 0.0771484375, 0.202545166015625, 0.32794189453125, 0.453338623046875, 0.5787353515625, 0.704132080078125, 0.82952880859375, 0.954925537109375, 1.080322265625, 1.205718994140625, 1.33111572265625, 1.456512451171875, 1.5819091796875, 1.707305908203125, 1.83270263671875, 1.958099365234375, 2.08349609375, 2.208892822265625, 2.33428955078125, 2.459686279296875, 2.5850830078125, 2.710479736328125, 2.83587646484375, 2.961273193359375, 3.086669921875, 3.212066650390625, 3.33746337890625, 3.462860107421875, 3.5882568359375, 3.713653564453125, 3.83905029296875, 3.964447021484375, 4.08984375]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 7.0, 4.0, 4.0, 3.0, 7.0, 7.0, 9.0, 14.0, 10.0, 19.0, 24.0, 28.0, 25.0, 34.0, 36.0, 61.0, 75.0, 100.0, 129.0, 179.0, 236.0, 258.0, 340.0, 599.0, 25928.0, 4161698.0, 2541.0, 438.0, 319.0, 251.0, 214.0, 152.0, 101.0, 92.0, 58.0, 52.0, 51.0, 30.0, 31.0, 25.0, 21.0, 13.0, 13.0, 8.0, 10.0, 11.0, 6.0, 6.0, 5.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0], "bins": [-40.53125, -39.150390625, -37.76953125, -36.388671875, -35.0078125, -33.626953125, -32.24609375, -30.865234375, -29.484375, -28.103515625, -26.72265625, -25.341796875, -23.9609375, -22.580078125, -21.19921875, -19.818359375, -18.4375, -17.056640625, -15.67578125, -14.294921875, -12.9140625, -11.533203125, -10.15234375, -8.771484375, -7.390625, -6.009765625, -4.62890625, -3.248046875, -1.8671875, -0.486328125, 0.89453125, 2.275390625, 3.65625, 5.037109375, 6.41796875, 7.798828125, 9.1796875, 10.560546875, 11.94140625, 13.322265625, 14.703125, 16.083984375, 17.46484375, 18.845703125, 20.2265625, 21.607421875, 22.98828125, 24.369140625, 25.75, 27.130859375, 28.51171875, 29.892578125, 31.2734375, 32.654296875, 34.03515625, 35.416015625, 36.796875, 38.177734375, 39.55859375, 40.939453125, 42.3203125, 43.701171875, 45.08203125, 46.462890625, 47.84375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 3.0, 4.0, 3.0, 10.0, 12.0, 9.0, 22.0, 28.0, 40.0, 62.0, 85.0, 134.0, 164.0, 241.0, 374.0, 496.0, 593.0, 565.0, 371.0, 242.0, 162.0, 122.0, 100.0, 48.0, 47.0, 39.0, 18.0, 26.0, 9.0, 13.0, 7.0, 6.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.61328125, -5.4095458984375, -5.205810546875, -5.0020751953125, -4.79833984375, -4.5946044921875, -4.390869140625, -4.1871337890625, -3.9833984375, -3.7796630859375, -3.575927734375, -3.3721923828125, -3.16845703125, -2.9647216796875, -2.760986328125, -2.5572509765625, -2.353515625, -2.1497802734375, -1.946044921875, -1.7423095703125, -1.53857421875, -1.3348388671875, -1.131103515625, -0.9273681640625, -0.7236328125, -0.5198974609375, -0.316162109375, -0.1124267578125, 0.09130859375, 0.2950439453125, 0.498779296875, 0.7025146484375, 0.90625, 1.1099853515625, 1.313720703125, 1.5174560546875, 1.72119140625, 1.9249267578125, 2.128662109375, 2.3323974609375, 2.5361328125, 2.7398681640625, 2.943603515625, 3.1473388671875, 3.35107421875, 3.5548095703125, 3.758544921875, 3.9622802734375, 4.166015625, 4.3697509765625, 4.573486328125, 4.7772216796875, 4.98095703125, 5.1846923828125, 5.388427734375, 5.5921630859375, 5.7958984375, 5.9996337890625, 6.203369140625, 6.4071044921875, 6.61083984375, 6.8145751953125, 7.018310546875, 7.2220458984375, 7.42578125]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 7.0, 8.0, 3.0, 15.0, 17.0, 10.0, 17.0, 35.0, 46.0, 53.0, 77.0, 104.0, 224.0, 789.0, 27606.0, 4117399.0, 46294.0, 955.0, 222.0, 95.0, 63.0, 69.0, 43.0, 29.0, 22.0, 18.0, 15.0, 9.0, 11.0, 9.0, 5.0, 5.0, 2.0, 1.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-39.5, -38.44775390625, -37.3955078125, -36.34326171875, -35.291015625, -34.23876953125, -33.1865234375, -32.13427734375, -31.08203125, -30.02978515625, -28.9775390625, -27.92529296875, -26.873046875, -25.82080078125, -24.7685546875, -23.71630859375, -22.6640625, -21.61181640625, -20.5595703125, -19.50732421875, -18.455078125, -17.40283203125, -16.3505859375, -15.29833984375, -14.24609375, -13.19384765625, -12.1416015625, -11.08935546875, -10.037109375, -8.98486328125, -7.9326171875, -6.88037109375, -5.828125, -4.77587890625, -3.7236328125, -2.67138671875, -1.619140625, -0.56689453125, 0.4853515625, 1.53759765625, 2.58984375, 3.64208984375, 4.6943359375, 5.74658203125, 6.798828125, 7.85107421875, 8.9033203125, 9.95556640625, 11.0078125, 12.06005859375, 13.1123046875, 14.16455078125, 15.216796875, 16.26904296875, 17.3212890625, 18.37353515625, 19.42578125, 20.47802734375, 21.5302734375, 22.58251953125, 23.634765625, 24.68701171875, 25.7392578125, 26.79150390625, 27.84375]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 8.0, 142.0, 685.0, 175.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-213.35162353515625, -209.44268798828125, -205.53375244140625, -201.6248016357422, -197.7158660888672, -193.8069305419922, -189.89797973632812, -185.98904418945312, -182.08010864257812, -178.17117309570312, -174.26223754882812, -170.35328674316406, -166.44435119628906, -162.53541564941406, -158.62646484375, -154.717529296875, -150.80859375, -146.899658203125, -142.99072265625, -139.08177185058594, -135.17283630371094, -131.26390075683594, -127.3549575805664, -123.44601440429688, -119.53707885742188, -115.62814331054688, -111.71920013427734, -107.81025695800781, -103.90132141113281, -99.99238586425781, -96.08344268798828, -92.17449951171875, -88.26556396484375, -84.35662841796875, -80.44768524169922, -76.53874206542969, -72.62980651855469, -68.72087097167969, -64.81192779541016, -60.90298843383789, -56.994049072265625, -53.08510971069336, -49.176170349121094, -45.26723098754883, -41.35829162597656, -37.4493522644043, -33.54041290283203, -29.631473541259766, -25.7225341796875, -21.813594818115234, -17.90465545654297, -13.995716094970703, -10.086776733398438, -6.177837371826172, -2.2688980102539062, 1.6400413513183594, 5.548980712890625, 9.45792007446289, 13.366859436035156, 17.275798797607422, 21.184738159179688, 25.093677520751953, 29.00261688232422, 32.911556243896484, 36.82049560546875]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 4.0, 3.0, 5.0, 7.0, 3.0, 11.0, 11.0, 14.0, 12.0, 11.0, 16.0, 22.0, 27.0, 26.0, 32.0, 38.0, 45.0, 32.0, 36.0, 52.0, 56.0, 42.0, 41.0, 44.0, 47.0, 44.0, 40.0, 45.0, 21.0, 27.0, 29.0, 27.0, 24.0, 23.0, 15.0, 18.0, 10.0, 10.0, 8.0, 10.0, 8.0, 3.0, 3.0, 2.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.761035919189453, -19.073503494262695, -18.385971069335938, -17.69843864440918, -17.010906219482422, -16.323373794555664, -15.635842323303223, -14.948309898376465, -14.260777473449707, -13.57324504852295, -12.885712623596191, -12.19818115234375, -11.510648727416992, -10.823116302490234, -10.135583877563477, -9.448051452636719, -8.760519027709961, -8.072986602783203, -7.385454177856445, -6.697922229766846, -6.010389804840088, -5.32285737991333, -4.6353254318237305, -3.9477930068969727, -3.260260581970215, -2.572728157043457, -1.8851959705352783, -1.1976637840270996, -0.5101313591003418, 0.17740106582641602, 0.8649330139160156, 1.5524654388427734, 2.2399978637695312, 2.927530288696289, 3.6150624752044678, 4.3025946617126465, 4.990127086639404, 5.677659511566162, 6.365191459655762, 7.0527238845825195, 7.740256309509277, 8.427788734436035, 9.115321159362793, 9.802852630615234, 10.490385055541992, 11.17791748046875, 11.865449905395508, 12.552982330322266, 13.240514755249023, 13.928047180175781, 14.615579605102539, 15.303112030029297, 15.990644454956055, 16.678176879882812, 17.365707397460938, 18.053241729736328, 18.740772247314453, 19.42830467224121, 20.11583709716797, 20.803369522094727, 21.490901947021484, 22.178434371948242, 22.865966796875, 23.553497314453125, 24.241031646728516]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 6.0, 8.0, 3.0, 6.0, 8.0, 19.0, 11.0, 14.0, 15.0, 25.0, 26.0, 22.0, 26.0, 30.0, 29.0, 33.0, 47.0, 41.0, 39.0, 60.0, 47.0, 40.0, 48.0, 39.0, 52.0, 31.0, 40.0, 35.0, 33.0, 33.0, 24.0, 23.0, 21.0, 14.0, 10.0, 9.0, 5.0, 8.0, 4.0, 5.0, 5.0, 4.0, 1.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.22265625, -3.0982666015625, -2.973876953125, -2.8494873046875, -2.72509765625, -2.6007080078125, -2.476318359375, -2.3519287109375, -2.2275390625, -2.1031494140625, -1.978759765625, -1.8543701171875, -1.72998046875, -1.6055908203125, -1.481201171875, -1.3568115234375, -1.232421875, -1.1080322265625, -0.983642578125, -0.8592529296875, -0.73486328125, -0.6104736328125, -0.486083984375, -0.3616943359375, -0.2373046875, -0.1129150390625, 0.011474609375, 0.1358642578125, 0.26025390625, 0.3846435546875, 0.509033203125, 0.6334228515625, 0.7578125, 0.8822021484375, 1.006591796875, 1.1309814453125, 1.25537109375, 1.3797607421875, 1.504150390625, 1.6285400390625, 1.7529296875, 1.8773193359375, 2.001708984375, 2.1260986328125, 2.25048828125, 2.3748779296875, 2.499267578125, 2.6236572265625, 2.748046875, 2.8724365234375, 2.996826171875, 3.1212158203125, 3.24560546875, 3.3699951171875, 3.494384765625, 3.6187744140625, 3.7431640625, 3.8675537109375, 3.991943359375, 4.1163330078125, 4.24072265625, 4.3651123046875, 4.489501953125, 4.6138916015625, 4.73828125]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 6.0, 11.0, 15.0, 22.0, 22.0, 45.0, 55.0, 101.0, 138.0, 199.0, 344.0, 491.0, 831.0, 1196.0, 1979.0, 3070.0, 5110.0, 8209.0, 13514.0, 22336.0, 39223.0, 73963.0, 152494.0, 319746.0, 197485.0, 92267.0, 47844.0, 26828.0, 15707.0, 9450.0, 5811.0, 3616.0, 2281.0, 1464.0, 959.0, 646.0, 402.0, 245.0, 127.0, 112.0, 69.0, 54.0, 16.0, 20.0, 14.0, 13.0, 7.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.796875, -0.7724761962890625, -0.748077392578125, -0.7236785888671875, -0.69927978515625, -0.6748809814453125, -0.650482177734375, -0.6260833740234375, -0.6016845703125, -0.5772857666015625, -0.552886962890625, -0.5284881591796875, -0.50408935546875, -0.4796905517578125, -0.455291748046875, -0.4308929443359375, -0.406494140625, -0.3820953369140625, -0.357696533203125, -0.3332977294921875, -0.30889892578125, -0.2845001220703125, -0.260101318359375, -0.2357025146484375, -0.2113037109375, -0.1869049072265625, -0.162506103515625, -0.1381072998046875, -0.11370849609375, -0.0893096923828125, -0.064910888671875, -0.0405120849609375, -0.01611328125, 0.0082855224609375, 0.032684326171875, 0.0570831298828125, 0.08148193359375, 0.1058807373046875, 0.130279541015625, 0.1546783447265625, 0.1790771484375, 0.2034759521484375, 0.227874755859375, 0.2522735595703125, 0.27667236328125, 0.3010711669921875, 0.325469970703125, 0.3498687744140625, 0.374267578125, 0.3986663818359375, 0.423065185546875, 0.4474639892578125, 0.47186279296875, 0.4962615966796875, 0.520660400390625, 0.5450592041015625, 0.5694580078125, 0.5938568115234375, 0.618255615234375, 0.6426544189453125, 0.66705322265625, 0.6914520263671875, 0.715850830078125, 0.7402496337890625, 0.7646484375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 6.0, 7.0, 8.0, 9.0, 11.0, 11.0, 13.0, 14.0, 23.0, 16.0, 18.0, 24.0, 21.0, 32.0, 25.0, 27.0, 44.0, 35.0, 38.0, 40.0, 50.0, 1067.0, 61.0, 38.0, 39.0, 41.0, 35.0, 36.0, 37.0, 23.0, 18.0, 21.0, 23.0, 23.0, 20.0, 12.0, 14.0, 6.0, 10.0, 7.0, 8.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.3203125, -2.2471923828125, -2.174072265625, -2.1009521484375, -2.02783203125, -1.9547119140625, -1.881591796875, -1.8084716796875, -1.7353515625, -1.6622314453125, -1.589111328125, -1.5159912109375, -1.44287109375, -1.3697509765625, -1.296630859375, -1.2235107421875, -1.150390625, -1.0772705078125, -1.004150390625, -0.9310302734375, -0.85791015625, -0.7847900390625, -0.711669921875, -0.6385498046875, -0.5654296875, -0.4923095703125, -0.419189453125, -0.3460693359375, -0.27294921875, -0.1998291015625, -0.126708984375, -0.0535888671875, 0.01953125, 0.0926513671875, 0.165771484375, 0.2388916015625, 0.31201171875, 0.3851318359375, 0.458251953125, 0.5313720703125, 0.6044921875, 0.6776123046875, 0.750732421875, 0.8238525390625, 0.89697265625, 0.9700927734375, 1.043212890625, 1.1163330078125, 1.189453125, 1.2625732421875, 1.335693359375, 1.4088134765625, 1.48193359375, 1.5550537109375, 1.628173828125, 1.7012939453125, 1.7744140625, 1.8475341796875, 1.920654296875, 1.9937744140625, 2.06689453125, 2.1400146484375, 2.213134765625, 2.2862548828125, 2.359375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 7.0, 9.0, 14.0, 32.0, 42.0, 59.0, 84.0, 136.0, 218.0, 319.0, 469.0, 659.0, 1035.0, 1457.0, 2113.0, 3105.0, 4614.0, 7044.0, 10474.0, 16266.0, 25365.0, 41641.0, 72567.0, 143572.0, 1354955.0, 187743.0, 88379.0, 49409.0, 29877.0, 18768.0, 12129.0, 8035.0, 5419.0, 3652.0, 2514.0, 1667.0, 1079.0, 747.0, 473.0, 333.0, 224.0, 136.0, 92.0, 64.0, 54.0, 27.0, 20.0, 20.0, 9.0, 3.0, 2.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.63671875, -0.616607666015625, -0.59649658203125, -0.576385498046875, -0.5562744140625, -0.536163330078125, -0.51605224609375, -0.495941162109375, -0.475830078125, -0.455718994140625, -0.43560791015625, -0.415496826171875, -0.3953857421875, -0.375274658203125, -0.35516357421875, -0.335052490234375, -0.31494140625, -0.294830322265625, -0.27471923828125, -0.254608154296875, -0.2344970703125, -0.214385986328125, -0.19427490234375, -0.174163818359375, -0.154052734375, -0.133941650390625, -0.11383056640625, -0.093719482421875, -0.0736083984375, -0.053497314453125, -0.03338623046875, -0.013275146484375, 0.0068359375, 0.026947021484375, 0.04705810546875, 0.067169189453125, 0.0872802734375, 0.107391357421875, 0.12750244140625, 0.147613525390625, 0.167724609375, 0.187835693359375, 0.20794677734375, 0.228057861328125, 0.2481689453125, 0.268280029296875, 0.28839111328125, 0.308502197265625, 0.32861328125, 0.348724365234375, 0.36883544921875, 0.388946533203125, 0.4090576171875, 0.429168701171875, 0.44927978515625, 0.469390869140625, 0.489501953125, 0.509613037109375, 0.52972412109375, 0.549835205078125, 0.5699462890625, 0.590057373046875, 0.61016845703125, 0.630279541015625, 0.650390625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 4.0, 2.0, 3.0, 1.0, 6.0, 8.0, 8.0, 12.0, 7.0, 16.0, 20.0, 24.0, 29.0, 35.0, 37.0, 37.0, 44.0, 50.0, 78.0, 67.0, 68.0, 69.0, 56.0, 48.0, 34.0, 36.0, 37.0, 35.0, 29.0, 20.0, 24.0, 14.0, 8.0, 12.0, 8.0, 4.0, 6.0, 4.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.00043845176696777344, -0.0004248395562171936, -0.00041122734546661377, -0.00039761513471603394, -0.0003840029239654541, -0.00037039071321487427, -0.00035677850246429443, -0.0003431662917137146, -0.00032955408096313477, -0.00031594187021255493, -0.0003023296594619751, -0.00028871744871139526, -0.00027510523796081543, -0.0002614930272102356, -0.00024788081645965576, -0.00023426860570907593, -0.0002206563949584961, -0.00020704418420791626, -0.00019343197345733643, -0.0001798197627067566, -0.00016620755195617676, -0.00015259534120559692, -0.0001389831304550171, -0.00012537091970443726, -0.00011175870895385742, -9.814649820327759e-05, -8.453428745269775e-05, -7.092207670211792e-05, -5.7309865951538086e-05, -4.369765520095825e-05, -3.0085444450378418e-05, -1.6473233699798584e-05, -2.86102294921875e-06, 1.0751187801361084e-05, 2.4363398551940918e-05, 3.797560930252075e-05, 5.1587820053100586e-05, 6.520003080368042e-05, 7.881224155426025e-05, 9.242445230484009e-05, 0.00010603666305541992, 0.00011964887380599976, 0.0001332610845565796, 0.00014687329530715942, 0.00016048550605773926, 0.0001740977168083191, 0.00018770992755889893, 0.00020132213830947876, 0.0002149343490600586, 0.00022854655981063843, 0.00024215877056121826, 0.0002557709813117981, 0.00026938319206237793, 0.00028299540281295776, 0.0002966076135635376, 0.00031021982431411743, 0.00032383203506469727, 0.0003374442458152771, 0.00035105645656585693, 0.00036466866731643677, 0.0003782808780670166, 0.00039189308881759644, 0.00040550529956817627, 0.0004191175103187561, 0.00043272972106933594]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 2.0, 8.0, 5.0, 11.0, 12.0, 9.0, 14.0, 28.0, 31.0, 33.0, 56.0, 67.0, 74.0, 83.0, 124.0, 181.0, 329.0, 524.0, 875.0, 3530.0, 1000709.0, 38818.0, 1150.0, 639.0, 365.0, 235.0, 161.0, 106.0, 91.0, 49.0, 52.0, 52.0, 21.0, 16.0, 23.0, 14.0, 12.0, 7.0, 5.0, 3.0, 5.0, 7.0, 9.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00760650634765625, -0.007373809814453125, -0.00714111328125, -0.006908416748046875, -0.00667572021484375, -0.006443023681640625, -0.0062103271484375, -0.005977630615234375, -0.00574493408203125, -0.005512237548828125, -0.005279541015625, -0.005046844482421875, -0.00481414794921875, -0.004581451416015625, -0.0043487548828125, -0.004116058349609375, -0.00388336181640625, -0.003650665283203125, -0.00341796875, -0.003185272216796875, -0.00295257568359375, -0.002719879150390625, -0.0024871826171875, -0.002254486083984375, -0.00202178955078125, -0.001789093017578125, -0.001556396484375, -0.001323699951171875, -0.00109100341796875, -0.000858306884765625, -0.0006256103515625, -0.000392913818359375, -0.00016021728515625, 7.2479248046875e-05, 0.00030517578125, 0.000537872314453125, 0.00077056884765625, 0.001003265380859375, 0.0012359619140625, 0.001468658447265625, 0.00170135498046875, 0.001934051513671875, 0.002166748046875, 0.002399444580078125, 0.00263214111328125, 0.002864837646484375, 0.0030975341796875, 0.003330230712890625, 0.00356292724609375, 0.003795623779296875, 0.0040283203125, 0.004261016845703125, 0.00449371337890625, 0.004726409912109375, 0.0049591064453125, 0.005191802978515625, 0.00542449951171875, 0.005657196044921875, 0.005889892578125, 0.006122589111328125, 0.00635528564453125, 0.006587982177734375, 0.0068206787109375, 0.007053375244140625, 0.00728607177734375]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 14.0, 372.0, 565.0, 60.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002532385056838393, -0.0024828817695379257, -0.0024333782494068146, -0.002383874962106347, -0.002334371441975236, -0.0022848681546747684, -0.0022353646345436573, -0.00218586134724319, -0.0021363578271120787, -0.002086854539811611, -0.0020373510196805, -0.0019878477323800325, -0.0019383442122489214, -0.001888840808533132, -0.0018393374048173428, -0.0017898340011015534, -0.0017403305973857641, -0.0016908271936699748, -0.0016413237899541855, -0.0015918203862383962, -0.0015423169825226068, -0.0014928135788068175, -0.0014433101750910282, -0.001393806771375239, -0.0013443034840747714, -0.001294800080358982, -0.0012452966766431928, -0.0011957932729274035, -0.0011462898692116141, -0.0010967864654958248, -0.0010472830617800355, -0.0009977796580642462, -0.0009482763125561178, -0.0008987729088403285, -0.0008492695051245391, -0.0007997661014087498, -0.0007502626976929605, -0.0007007593521848321, -0.0006512559484690428, -0.0006017525447532535, -0.0005522491410374641, -0.0005027457373216748, -0.0004532423336058855, -0.0004037389298900962, -0.00035423552617430687, -0.000304732151562348, -0.0002552287478465587, -0.00020572534413076937, -0.0001562219113111496, -0.00010671850759536028, -5.7215111155528575e-05, -7.711714715696871e-06, 4.179168900009245e-05, 9.129507816396654e-05, 0.00014079848187975585, 0.00019030188559554517, 0.0002398052893113345, 0.0002893086930271238, 0.0003388120967429131, 0.000388315471354872, 0.0004378188750706613, 0.0004873222787864506, 0.0005368256825022399, 0.0005863290862180293, 0.0006358324899338186]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 2.0, 9.0, 10.0, 8.0, 7.0, 12.0, 18.0, 13.0, 16.0, 26.0, 18.0, 41.0, 32.0, 35.0, 34.0, 43.0, 40.0, 46.0, 43.0, 41.0, 43.0, 40.0, 44.0, 46.0, 37.0, 50.0, 36.0, 44.0, 31.0, 19.0, 28.0, 9.0, 11.0, 12.0, 12.0, 11.0, 7.0, 8.0, 5.0, 6.0, 1.0, 4.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022596120834350586, -0.00021848827600479126, -0.00021101534366607666, -0.00020354241132736206, -0.00019606947898864746, -0.00018859654664993286, -0.00018112361431121826, -0.00017365068197250366, -0.00016617774963378906, -0.00015870481729507446, -0.00015123188495635986, -0.00014375895261764526, -0.00013628602027893066, -0.00012881308794021606, -0.00012134015560150146, -0.00011386722326278687, -0.00010639429092407227, -9.892135858535767e-05, -9.144842624664307e-05, -8.397549390792847e-05, -7.650256156921387e-05, -6.902962923049927e-05, -6.155669689178467e-05, -5.408376455307007e-05, -4.661083221435547e-05, -3.913789987564087e-05, -3.166496753692627e-05, -2.419203519821167e-05, -1.671910285949707e-05, -9.24617052078247e-06, -1.773238182067871e-06, 5.6996941566467285e-06, 1.3172626495361328e-05, 2.0645558834075928e-05, 2.8118491172790527e-05, 3.559142351150513e-05, 4.3064355850219727e-05, 5.0537288188934326e-05, 5.8010220527648926e-05, 6.548315286636353e-05, 7.295608520507812e-05, 8.042901754379272e-05, 8.790194988250732e-05, 9.537488222122192e-05, 0.00010284781455993652, 0.00011032074689865112, 0.00011779367923736572, 0.00012526661157608032, 0.00013273954391479492, 0.00014021247625350952, 0.00014768540859222412, 0.00015515834093093872, 0.00016263127326965332, 0.00017010420560836792, 0.00017757713794708252, 0.00018505007028579712, 0.00019252300262451172, 0.00019999593496322632, 0.00020746886730194092, 0.00021494179964065552, 0.00022241473197937012, 0.00022988766431808472, 0.00023736059665679932, 0.0002448335289955139, 0.0002523064613342285]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 6.0, 8.0, 3.0, 6.0, 8.0, 19.0, 11.0, 14.0, 15.0, 25.0, 26.0, 22.0, 26.0, 30.0, 29.0, 33.0, 47.0, 41.0, 39.0, 60.0, 47.0, 40.0, 48.0, 39.0, 52.0, 31.0, 40.0, 35.0, 33.0, 33.0, 24.0, 23.0, 21.0, 14.0, 10.0, 9.0, 5.0, 8.0, 4.0, 5.0, 5.0, 4.0, 1.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.22265625, -3.0982666015625, -2.973876953125, -2.8494873046875, -2.72509765625, -2.6007080078125, -2.476318359375, -2.3519287109375, -2.2275390625, -2.1031494140625, -1.978759765625, -1.8543701171875, -1.72998046875, -1.6055908203125, -1.481201171875, -1.3568115234375, -1.232421875, -1.1080322265625, -0.983642578125, -0.8592529296875, -0.73486328125, -0.6104736328125, -0.486083984375, -0.3616943359375, -0.2373046875, -0.1129150390625, 0.011474609375, 0.1358642578125, 0.26025390625, 0.3846435546875, 0.509033203125, 0.6334228515625, 0.7578125, 0.8822021484375, 1.006591796875, 1.1309814453125, 1.25537109375, 1.3797607421875, 1.504150390625, 1.6285400390625, 1.7529296875, 1.8773193359375, 2.001708984375, 2.1260986328125, 2.25048828125, 2.3748779296875, 2.499267578125, 2.6236572265625, 2.748046875, 2.8724365234375, 2.996826171875, 3.1212158203125, 3.24560546875, 3.3699951171875, 3.494384765625, 3.6187744140625, 3.7431640625, 3.8675537109375, 3.991943359375, 4.1163330078125, 4.24072265625, 4.3651123046875, 4.489501953125, 4.6138916015625, 4.73828125]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 9.0, 8.0, 7.0, 9.0, 15.0, 26.0, 32.0, 48.0, 70.0, 95.0, 123.0, 167.0, 237.0, 338.0, 496.0, 739.0, 1094.0, 1665.0, 3382.0, 19995.0, 203257.0, 643476.0, 151008.0, 14445.0, 2866.0, 1548.0, 1069.0, 666.0, 514.0, 339.0, 224.0, 163.0, 140.0, 83.0, 64.0, 41.0, 28.0, 18.0, 14.0, 11.0, 7.0, 8.0, 5.0, 6.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.0546875, -8.7666015625, -8.478515625, -8.1904296875, -7.90234375, -7.6142578125, -7.326171875, -7.0380859375, -6.75, -6.4619140625, -6.173828125, -5.8857421875, -5.59765625, -5.3095703125, -5.021484375, -4.7333984375, -4.4453125, -4.1572265625, -3.869140625, -3.5810546875, -3.29296875, -3.0048828125, -2.716796875, -2.4287109375, -2.140625, -1.8525390625, -1.564453125, -1.2763671875, -0.98828125, -0.7001953125, -0.412109375, -0.1240234375, 0.1640625, 0.4521484375, 0.740234375, 1.0283203125, 1.31640625, 1.6044921875, 1.892578125, 2.1806640625, 2.46875, 2.7568359375, 3.044921875, 3.3330078125, 3.62109375, 3.9091796875, 4.197265625, 4.4853515625, 4.7734375, 5.0615234375, 5.349609375, 5.6376953125, 5.92578125, 6.2138671875, 6.501953125, 6.7900390625, 7.078125, 7.3662109375, 7.654296875, 7.9423828125, 8.23046875, 8.5185546875, 8.806640625, 9.0947265625, 9.3828125]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 6.0, 7.0, 6.0, 3.0, 14.0, 13.0, 25.0, 22.0, 25.0, 31.0, 35.0, 35.0, 49.0, 41.0, 56.0, 99.0, 187.0, 1383.0, 357.0, 166.0, 74.0, 54.0, 45.0, 43.0, 43.0, 33.0, 33.0, 33.0, 18.0, 20.0, 24.0, 16.0, 11.0, 13.0, 6.0, 6.0, 4.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.2421875, -8.93359375, -8.625, -8.31640625, -8.0078125, -7.69921875, -7.390625, -7.08203125, -6.7734375, -6.46484375, -6.15625, -5.84765625, -5.5390625, -5.23046875, -4.921875, -4.61328125, -4.3046875, -3.99609375, -3.6875, -3.37890625, -3.0703125, -2.76171875, -2.453125, -2.14453125, -1.8359375, -1.52734375, -1.21875, -0.91015625, -0.6015625, -0.29296875, 0.015625, 0.32421875, 0.6328125, 0.94140625, 1.25, 1.55859375, 1.8671875, 2.17578125, 2.484375, 2.79296875, 3.1015625, 3.41015625, 3.71875, 4.02734375, 4.3359375, 4.64453125, 4.953125, 5.26171875, 5.5703125, 5.87890625, 6.1875, 6.49609375, 6.8046875, 7.11328125, 7.421875, 7.73046875, 8.0390625, 8.34765625, 8.65625, 8.96484375, 9.2734375, 9.58203125, 9.890625, 10.19921875, 10.5078125]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 1.0, 6.0, 5.0, 6.0, 13.0, 15.0, 12.0, 13.0, 28.0, 48.0, 39.0, 73.0, 85.0, 124.0, 212.0, 326.0, 503.0, 983.0, 2631.0, 3111534.0, 25656.0, 1534.0, 678.0, 390.0, 252.0, 161.0, 114.0, 70.0, 45.0, 33.0, 31.0, 26.0, 17.0, 12.0, 11.0, 4.0, 5.0, 6.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.375, -41.86669921875, -40.3583984375, -38.85009765625, -37.341796875, -35.83349609375, -34.3251953125, -32.81689453125, -31.30859375, -29.80029296875, -28.2919921875, -26.78369140625, -25.275390625, -23.76708984375, -22.2587890625, -20.75048828125, -19.2421875, -17.73388671875, -16.2255859375, -14.71728515625, -13.208984375, -11.70068359375, -10.1923828125, -8.68408203125, -7.17578125, -5.66748046875, -4.1591796875, -2.65087890625, -1.142578125, 0.36572265625, 1.8740234375, 3.38232421875, 4.890625, 6.39892578125, 7.9072265625, 9.41552734375, 10.923828125, 12.43212890625, 13.9404296875, 15.44873046875, 16.95703125, 18.46533203125, 19.9736328125, 21.48193359375, 22.990234375, 24.49853515625, 26.0068359375, 27.51513671875, 29.0234375, 30.53173828125, 32.0400390625, 33.54833984375, 35.056640625, 36.56494140625, 38.0732421875, 39.58154296875, 41.08984375, 42.59814453125, 44.1064453125, 45.61474609375, 47.123046875, 48.63134765625, 50.1396484375, 51.64794921875, 53.15625]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 96.0, 623.0, 277.0, 16.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-95.67234802246094, -92.65572357177734, -89.63909912109375, -86.62247467041016, -83.60585021972656, -80.58922576904297, -77.57260131835938, -74.55597686767578, -71.53935241699219, -68.5227279663086, -65.506103515625, -62.489479064941406, -59.47285461425781, -56.45623016357422, -53.439605712890625, -50.42298126220703, -47.40635681152344, -44.389732360839844, -41.37310791015625, -38.356483459472656, -35.33985900878906, -32.32323455810547, -29.306610107421875, -26.28998565673828, -23.273361206054688, -20.256736755371094, -17.2401123046875, -14.223487854003906, -11.206863403320312, -8.190238952636719, -5.173614501953125, -2.1569900512695312, 0.8596343994140625, 3.8762588500976562, 6.89288330078125, 9.909507751464844, 12.926132202148438, 15.942756652832031, 18.959381103515625, 21.97600555419922, 24.992630004882812, 28.009254455566406, 31.02587890625, 34.042503356933594, 37.05912780761719, 40.07575225830078, 43.092376708984375, 46.10900115966797, 49.12562561035156, 52.142250061035156, 55.15887451171875, 58.175498962402344, 61.19212341308594, 64.20874786376953, 67.22537231445312, 70.24199676513672, 73.25862121582031, 76.2752456665039, 79.2918701171875, 82.3084945678711, 85.32511901855469, 88.34174346923828, 91.35836791992188, 94.37499237060547, 97.39161682128906]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 3.0, 5.0, 4.0, 11.0, 7.0, 8.0, 12.0, 6.0, 13.0, 14.0, 12.0, 15.0, 20.0, 15.0, 22.0, 20.0, 31.0, 34.0, 27.0, 33.0, 38.0, 33.0, 40.0, 38.0, 32.0, 48.0, 37.0, 33.0, 36.0, 32.0, 39.0, 24.0, 28.0, 20.0, 19.0, 20.0, 26.0, 14.0, 20.0, 13.0, 22.0, 15.0, 14.0, 9.0, 13.0, 10.0, 5.0, 5.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-19.73282241821289, -19.054611206054688, -18.376399993896484, -17.69818878173828, -17.01997947692871, -16.341768264770508, -15.663557052612305, -14.985345840454102, -14.307135581970215, -13.628924369812012, -12.950714111328125, -12.272502899169922, -11.594291687011719, -10.916081428527832, -10.237870216369629, -9.559659957885742, -8.881448745727539, -8.203237533569336, -7.525027275085449, -6.846816062927246, -6.168605327606201, -5.490394592285156, -4.812183380126953, -4.133972644805908, -3.4557619094848633, -2.7775511741638184, -2.0993402004241943, -1.4211292266845703, -0.7429184913635254, -0.06470775604248047, 0.6135034561157227, 1.2917141914367676, 1.9699249267578125, 2.6481356620788574, 3.3263466358184814, 4.0045576095581055, 4.68276834487915, 5.360979080200195, 6.039190292358398, 6.717401027679443, 7.395611763000488, 8.073822975158691, 8.752033233642578, 9.430244445800781, 10.108455657958984, 10.786665916442871, 11.464877128601074, 12.143087387084961, 12.821298599243164, 13.499509811401367, 14.177720069885254, 14.855931282043457, 15.534141540527344, 16.212352752685547, 16.89056396484375, 17.568775177001953, 18.246986389160156, 18.92519760131836, 19.603408813476562, 20.281620025634766, 20.959829330444336, 21.63804054260254, 22.316251754760742, 22.994462966918945, 23.672672271728516]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 5.0, 3.0, 3.0, 6.0, 10.0, 8.0, 12.0, 10.0, 14.0, 15.0, 26.0, 23.0, 20.0, 16.0, 29.0, 31.0, 44.0, 35.0, 30.0, 37.0, 41.0, 32.0, 41.0, 37.0, 38.0, 61.0, 24.0, 36.0, 37.0, 31.0, 34.0, 35.0, 23.0, 25.0, 20.0, 22.0, 19.0, 8.0, 9.0, 7.0, 6.0, 5.0, 3.0, 8.0, 2.0, 6.0, 6.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.482421875, -3.370849609375, -3.25927734375, -3.147705078125, -3.0361328125, -2.924560546875, -2.81298828125, -2.701416015625, -2.58984375, -2.478271484375, -2.36669921875, -2.255126953125, -2.1435546875, -2.031982421875, -1.92041015625, -1.808837890625, -1.697265625, -1.585693359375, -1.47412109375, -1.362548828125, -1.2509765625, -1.139404296875, -1.02783203125, -0.916259765625, -0.8046875, -0.693115234375, -0.58154296875, -0.469970703125, -0.3583984375, -0.246826171875, -0.13525390625, -0.023681640625, 0.087890625, 0.199462890625, 0.31103515625, 0.422607421875, 0.5341796875, 0.645751953125, 0.75732421875, 0.868896484375, 0.98046875, 1.092041015625, 1.20361328125, 1.315185546875, 1.4267578125, 1.538330078125, 1.64990234375, 1.761474609375, 1.873046875, 1.984619140625, 2.09619140625, 2.207763671875, 2.3193359375, 2.430908203125, 2.54248046875, 2.654052734375, 2.765625, 2.877197265625, 2.98876953125, 3.100341796875, 3.2119140625, 3.323486328125, 3.43505859375, 3.546630859375, 3.658203125]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 6.0, 2.0, 6.0, 8.0, 8.0, 14.0, 21.0, 23.0, 36.0, 40.0, 63.0, 70.0, 96.0, 138.0, 218.0, 345.0, 708.0, 1697.0, 4722.0, 20872.0, 132152.0, 822998.0, 2181145.0, 864629.0, 134618.0, 21203.0, 5083.0, 1576.0, 680.0, 356.0, 226.0, 128.0, 99.0, 61.0, 67.0, 33.0, 32.0, 25.0, 25.0, 14.0, 20.0, 10.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.40625, -5.20233154296875, -4.9984130859375, -4.79449462890625, -4.590576171875, -4.38665771484375, -4.1827392578125, -3.97882080078125, -3.77490234375, -3.57098388671875, -3.3670654296875, -3.16314697265625, -2.959228515625, -2.75531005859375, -2.5513916015625, -2.34747314453125, -2.1435546875, -1.93963623046875, -1.7357177734375, -1.53179931640625, -1.327880859375, -1.12396240234375, -0.9200439453125, -0.71612548828125, -0.51220703125, -0.30828857421875, -0.1043701171875, 0.09954833984375, 0.303466796875, 0.50738525390625, 0.7113037109375, 0.91522216796875, 1.119140625, 1.32305908203125, 1.5269775390625, 1.73089599609375, 1.934814453125, 2.13873291015625, 2.3426513671875, 2.54656982421875, 2.75048828125, 2.95440673828125, 3.1583251953125, 3.36224365234375, 3.566162109375, 3.77008056640625, 3.9739990234375, 4.17791748046875, 4.3818359375, 4.58575439453125, 4.7896728515625, 4.99359130859375, 5.197509765625, 5.40142822265625, 5.6053466796875, 5.80926513671875, 6.01318359375, 6.21710205078125, 6.4210205078125, 6.62493896484375, 6.828857421875, 7.03277587890625, 7.2366943359375, 7.44061279296875, 7.64453125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 2.0, 9.0, 6.0, 6.0, 8.0, 15.0, 17.0, 28.0, 26.0, 42.0, 60.0, 74.0, 102.0, 139.0, 170.0, 209.0, 304.0, 411.0, 483.0, 467.0, 379.0, 258.0, 201.0, 120.0, 112.0, 104.0, 69.0, 43.0, 37.0, 41.0, 37.0, 25.0, 26.0, 10.0, 8.0, 5.0, 8.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3828125, -5.18121337890625, -4.9796142578125, -4.77801513671875, -4.576416015625, -4.37481689453125, -4.1732177734375, -3.97161865234375, -3.77001953125, -3.56842041015625, -3.3668212890625, -3.16522216796875, -2.963623046875, -2.76202392578125, -2.5604248046875, -2.35882568359375, -2.1572265625, -1.95562744140625, -1.7540283203125, -1.55242919921875, -1.350830078125, -1.14923095703125, -0.9476318359375, -0.74603271484375, -0.54443359375, -0.34283447265625, -0.1412353515625, 0.06036376953125, 0.261962890625, 0.46356201171875, 0.6651611328125, 0.86676025390625, 1.068359375, 1.26995849609375, 1.4715576171875, 1.67315673828125, 1.874755859375, 2.07635498046875, 2.2779541015625, 2.47955322265625, 2.68115234375, 2.88275146484375, 3.0843505859375, 3.28594970703125, 3.487548828125, 3.68914794921875, 3.8907470703125, 4.09234619140625, 4.2939453125, 4.49554443359375, 4.6971435546875, 4.89874267578125, 5.100341796875, 5.30194091796875, 5.5035400390625, 5.70513916015625, 5.90673828125, 6.10833740234375, 6.3099365234375, 6.51153564453125, 6.713134765625, 6.91473388671875, 7.1163330078125, 7.31793212890625, 7.51953125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 10.0, 17.0, 29.0, 68.0, 130.0, 218.0, 453.0, 1042.0, 3322.0, 77903.0, 3900632.0, 203974.0, 4366.0, 1177.0, 467.0, 227.0, 114.0, 54.0, 33.0, 15.0, 8.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.28125, -26.609130859375, -25.93701171875, -25.264892578125, -24.5927734375, -23.920654296875, -23.24853515625, -22.576416015625, -21.904296875, -21.232177734375, -20.56005859375, -19.887939453125, -19.2158203125, -18.543701171875, -17.87158203125, -17.199462890625, -16.52734375, -15.855224609375, -15.18310546875, -14.510986328125, -13.8388671875, -13.166748046875, -12.49462890625, -11.822509765625, -11.150390625, -10.478271484375, -9.80615234375, -9.134033203125, -8.4619140625, -7.789794921875, -7.11767578125, -6.445556640625, -5.7734375, -5.101318359375, -4.42919921875, -3.757080078125, -3.0849609375, -2.412841796875, -1.74072265625, -1.068603515625, -0.396484375, 0.275634765625, 0.94775390625, 1.619873046875, 2.2919921875, 2.964111328125, 3.63623046875, 4.308349609375, 4.98046875, 5.652587890625, 6.32470703125, 6.996826171875, 7.6689453125, 8.341064453125, 9.01318359375, 9.685302734375, 10.357421875, 11.029541015625, 11.70166015625, 12.373779296875, 13.0458984375, 13.718017578125, 14.39013671875, 15.062255859375, 15.734375]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 21.0, 670.0, 321.0, 4.0, 1.0, 1.0, 1.0], "bins": [-442.0586853027344, -434.54180908203125, -427.0249328613281, -419.5080871582031, -411.9912109375, -404.4743347167969, -396.95745849609375, -389.44061279296875, -381.9237365722656, -374.4068603515625, -366.8899841308594, -359.3731384277344, -351.85626220703125, -344.3393859863281, -336.822509765625, -329.3056640625, -321.78875732421875, -314.2718811035156, -306.7550048828125, -299.2381591796875, -291.7212829589844, -284.20440673828125, -276.6875305175781, -269.170654296875, -261.65380859375, -254.13693237304688, -246.6200714111328, -239.1031951904297, -231.58633422851562, -224.0694580078125, -216.55258178710938, -209.0357208251953, -201.5188446044922, -194.00196838378906, -186.485107421875, -178.96823120117188, -171.4513702392578, -163.9344940185547, -156.41763305664062, -148.9007568359375, -141.38389587402344, -133.8670196533203, -126.35015869140625, -118.83328247070312, -111.31642150878906, -103.79954528808594, -96.28267669677734, -88.76580810546875, -81.24893188476562, -73.73206329345703, -66.21519470214844, -58.69832229614258, -51.181453704833984, -43.66458511352539, -36.14771270751953, -28.630844116210938, -21.11397933959961, -13.5971097946167, -6.080240249633789, 1.4366302490234375, 8.953498840332031, 16.470367431640625, 23.987239837646484, 31.504108428955078, 39.02097702026367]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 6.0, 3.0, 4.0, 8.0, 4.0, 8.0, 8.0, 17.0, 12.0, 20.0, 27.0, 18.0, 34.0, 28.0, 19.0, 32.0, 38.0, 36.0, 46.0, 41.0, 40.0, 40.0, 42.0, 45.0, 36.0, 53.0, 36.0, 30.0, 38.0, 33.0, 31.0, 30.0, 25.0, 20.0, 22.0, 9.0, 16.0, 8.0, 12.0, 7.0, 10.0, 7.0, 5.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.018861770629883, -22.141508102416992, -21.264156341552734, -20.386802673339844, -19.509449005126953, -18.632095336914062, -17.754741668701172, -16.877389907836914, -16.000036239624023, -15.122682571411133, -14.245329856872559, -13.367977142333984, -12.490623474121094, -11.613269805908203, -10.735917091369629, -9.858564376831055, -8.981210708618164, -8.103857040405273, -7.226504325866699, -6.349151134490967, -5.471797943115234, -4.594444751739502, -3.7170915603637695, -2.839738368988037, -1.9623851776123047, -1.0850319862365723, -0.20767879486083984, 0.6696743965148926, 1.547027587890625, 2.4243807792663574, 3.30173397064209, 4.179087162017822, 5.056438446044922, 5.933791637420654, 6.811144828796387, 7.688498020172119, 8.565851211547852, 9.443204879760742, 10.320557594299316, 11.19791030883789, 12.075263977050781, 12.952617645263672, 13.829970359802246, 14.70732307434082, 15.584676742553711, 16.4620304107666, 17.33938217163086, 18.21673583984375, 19.09408950805664, 19.97144317626953, 20.848796844482422, 21.72614860534668, 22.60350227355957, 23.48085594177246, 24.35820770263672, 25.23556137084961, 26.1129150390625, 26.99026870727539, 27.86762237548828, 28.74497413635254, 29.62232780456543, 30.49968147277832, 31.377033233642578, 32.25438690185547, 33.13174057006836]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 10.0, 7.0, 8.0, 7.0, 22.0, 19.0, 16.0, 17.0, 33.0, 28.0, 44.0, 35.0, 43.0, 44.0, 35.0, 47.0, 37.0, 39.0, 43.0, 46.0, 47.0, 48.0, 41.0, 37.0, 36.0, 31.0, 30.0, 28.0, 24.0, 19.0, 22.0, 9.0, 17.0, 18.0, 3.0, 7.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.224609375, -3.120361328125, -3.01611328125, -2.911865234375, -2.8076171875, -2.703369140625, -2.59912109375, -2.494873046875, -2.390625, -2.286376953125, -2.18212890625, -2.077880859375, -1.9736328125, -1.869384765625, -1.76513671875, -1.660888671875, -1.556640625, -1.452392578125, -1.34814453125, -1.243896484375, -1.1396484375, -1.035400390625, -0.93115234375, -0.826904296875, -0.72265625, -0.618408203125, -0.51416015625, -0.409912109375, -0.3056640625, -0.201416015625, -0.09716796875, 0.007080078125, 0.111328125, 0.215576171875, 0.31982421875, 0.424072265625, 0.5283203125, 0.632568359375, 0.73681640625, 0.841064453125, 0.9453125, 1.049560546875, 1.15380859375, 1.258056640625, 1.3623046875, 1.466552734375, 1.57080078125, 1.675048828125, 1.779296875, 1.883544921875, 1.98779296875, 2.092041015625, 2.1962890625, 2.300537109375, 2.40478515625, 2.509033203125, 2.61328125, 2.717529296875, 2.82177734375, 2.926025390625, 3.0302734375, 3.134521484375, 3.23876953125, 3.343017578125, 3.447265625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 9.0, 22.0, 22.0, 36.0, 56.0, 81.0, 116.0, 189.0, 295.0, 469.0, 914.0, 1626.0, 2999.0, 5347.0, 10448.0, 20379.0, 39735.0, 81972.0, 197362.0, 377599.0, 164137.0, 71598.0, 34877.0, 17890.0, 9360.0, 4921.0, 2665.0, 1437.0, 830.0, 441.0, 259.0, 153.0, 103.0, 74.0, 43.0, 24.0, 18.0, 18.0, 8.0, 6.0, 6.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.7568359375, -0.7334823608398438, -0.7101287841796875, -0.6867752075195312, -0.663421630859375, -0.6400680541992188, -0.6167144775390625, -0.5933609008789062, -0.57000732421875, -0.5466537475585938, -0.5233001708984375, -0.49994659423828125, -0.476593017578125, -0.45323944091796875, -0.4298858642578125, -0.40653228759765625, -0.3831787109375, -0.35982513427734375, -0.3364715576171875, -0.31311798095703125, -0.289764404296875, -0.26641082763671875, -0.2430572509765625, -0.21970367431640625, -0.19635009765625, -0.17299652099609375, -0.1496429443359375, -0.12628936767578125, -0.102935791015625, -0.07958221435546875, -0.0562286376953125, -0.03287506103515625, -0.009521484375, 0.01383209228515625, 0.0371856689453125, 0.06053924560546875, 0.083892822265625, 0.10724639892578125, 0.1305999755859375, 0.15395355224609375, 0.17730712890625, 0.20066070556640625, 0.2240142822265625, 0.24736785888671875, 0.270721435546875, 0.29407501220703125, 0.3174285888671875, 0.34078216552734375, 0.3641357421875, 0.38748931884765625, 0.4108428955078125, 0.43419647216796875, 0.457550048828125, 0.48090362548828125, 0.5042572021484375, 0.5276107788085938, 0.55096435546875, 0.5743179321289062, 0.5976715087890625, 0.6210250854492188, 0.644378662109375, 0.6677322387695312, 0.6910858154296875, 0.7144393920898438, 0.73779296875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 5.0, 4.0, 3.0, 10.0, 9.0, 4.0, 8.0, 13.0, 12.0, 15.0, 9.0, 23.0, 20.0, 24.0, 28.0, 31.0, 29.0, 27.0, 37.0, 33.0, 34.0, 33.0, 30.0, 43.0, 1061.0, 37.0, 36.0, 39.0, 41.0, 28.0, 30.0, 42.0, 23.0, 31.0, 22.0, 21.0, 20.0, 17.0, 15.0, 24.0, 13.0, 9.0, 8.0, 4.0, 9.0, 5.0, 3.0, 5.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0], "bins": [-1.8125, -1.7574005126953125, -1.702301025390625, -1.6472015380859375, -1.59210205078125, -1.5370025634765625, -1.481903076171875, -1.4268035888671875, -1.3717041015625, -1.3166046142578125, -1.261505126953125, -1.2064056396484375, -1.15130615234375, -1.0962066650390625, -1.041107177734375, -0.9860076904296875, -0.930908203125, -0.8758087158203125, -0.820709228515625, -0.7656097412109375, -0.71051025390625, -0.6554107666015625, -0.600311279296875, -0.5452117919921875, -0.4901123046875, -0.4350128173828125, -0.379913330078125, -0.3248138427734375, -0.26971435546875, -0.2146148681640625, -0.159515380859375, -0.1044158935546875, -0.04931640625, 0.0057830810546875, 0.060882568359375, 0.1159820556640625, 0.17108154296875, 0.2261810302734375, 0.281280517578125, 0.3363800048828125, 0.3914794921875, 0.4465789794921875, 0.501678466796875, 0.5567779541015625, 0.61187744140625, 0.6669769287109375, 0.722076416015625, 0.7771759033203125, 0.832275390625, 0.8873748779296875, 0.942474365234375, 0.9975738525390625, 1.05267333984375, 1.1077728271484375, 1.162872314453125, 1.2179718017578125, 1.2730712890625, 1.3281707763671875, 1.383270263671875, 1.4383697509765625, 1.49346923828125, 1.5485687255859375, 1.603668212890625, 1.6587677001953125, 1.7138671875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 5.0, 7.0, 7.0, 11.0, 18.0, 28.0, 49.0, 65.0, 78.0, 138.0, 161.0, 286.0, 336.0, 520.0, 763.0, 1093.0, 1615.0, 2277.0, 3334.0, 4879.0, 7418.0, 10953.0, 17045.0, 26284.0, 42322.0, 69424.0, 124134.0, 1310190.0, 207712.0, 101709.0, 59334.0, 36393.0, 23016.0, 15004.0, 9754.0, 6582.0, 4515.0, 3013.0, 2109.0, 1421.0, 969.0, 687.0, 488.0, 319.0, 218.0, 157.0, 109.0, 59.0, 42.0, 32.0, 27.0, 13.0, 7.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.499755859375, -0.4845390319824219, -0.46932220458984375, -0.4541053771972656, -0.4388885498046875, -0.4236717224121094, -0.40845489501953125, -0.3932380676269531, -0.378021240234375, -0.3628044128417969, -0.34758758544921875, -0.3323707580566406, -0.3171539306640625, -0.3019371032714844, -0.28672027587890625, -0.2715034484863281, -0.25628662109375, -0.24106979370117188, -0.22585296630859375, -0.21063613891601562, -0.1954193115234375, -0.18020248413085938, -0.16498565673828125, -0.14976882934570312, -0.134552001953125, -0.11933517456054688, -0.10411834716796875, -0.08890151977539062, -0.0736846923828125, -0.058467864990234375, -0.04325103759765625, -0.028034210205078125, -0.0128173828125, 0.002399444580078125, 0.01761627197265625, 0.032833099365234375, 0.0480499267578125, 0.06326675415039062, 0.07848358154296875, 0.09370040893554688, 0.108917236328125, 0.12413406372070312, 0.13935089111328125, 0.15456771850585938, 0.1697845458984375, 0.18500137329101562, 0.20021820068359375, 0.21543502807617188, 0.23065185546875, 0.24586868286132812, 0.26108551025390625, 0.2763023376464844, 0.2915191650390625, 0.3067359924316406, 0.32195281982421875, 0.3371696472167969, 0.352386474609375, 0.3676033020019531, 0.38282012939453125, 0.3980369567871094, 0.4132537841796875, 0.4284706115722656, 0.44368743896484375, 0.4589042663574219, 0.47412109375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 3.0, 4.0, 2.0, 6.0, 4.0, 9.0, 11.0, 12.0, 14.0, 11.0, 14.0, 23.0, 27.0, 22.0, 36.0, 42.0, 41.0, 45.0, 51.0, 37.0, 57.0, 57.0, 65.0, 46.0, 57.0, 49.0, 34.0, 35.0, 34.0, 25.0, 23.0, 11.0, 17.0, 14.0, 16.0, 11.0, 9.0, 7.0, 10.0, 2.0, 2.0, 3.0, 7.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003428459167480469, -0.00033260881900787354, -0.0003223717212677002, -0.00031213462352752686, -0.0003018975257873535, -0.0002916604280471802, -0.00028142333030700684, -0.0002711862325668335, -0.00026094913482666016, -0.0002507120370864868, -0.00024047493934631348, -0.00023023784160614014, -0.0002200007438659668, -0.00020976364612579346, -0.00019952654838562012, -0.00018928945064544678, -0.00017905235290527344, -0.0001688152551651001, -0.00015857815742492676, -0.00014834105968475342, -0.00013810396194458008, -0.00012786686420440674, -0.0001176297664642334, -0.00010739266872406006, -9.715557098388672e-05, -8.691847324371338e-05, -7.668137550354004e-05, -6.64442777633667e-05, -5.620718002319336e-05, -4.597008228302002e-05, -3.573298454284668e-05, -2.549588680267334e-05, -1.52587890625e-05, -5.02169132232666e-06, 5.21540641784668e-06, 1.545250415802002e-05, 2.568960189819336e-05, 3.59266996383667e-05, 4.616379737854004e-05, 5.640089511871338e-05, 6.663799285888672e-05, 7.687509059906006e-05, 8.71121883392334e-05, 9.734928607940674e-05, 0.00010758638381958008, 0.00011782348155975342, 0.00012806057929992676, 0.0001382976770401001, 0.00014853477478027344, 0.00015877187252044678, 0.00016900897026062012, 0.00017924606800079346, 0.0001894831657409668, 0.00019972026348114014, 0.00020995736122131348, 0.00022019445896148682, 0.00023043155670166016, 0.0002406686544418335, 0.00025090575218200684, 0.0002611428499221802, 0.0002713799476623535, 0.00028161704540252686, 0.0002918541431427002, 0.00030209124088287354, 0.0003123283386230469]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 5.0, 2.0, 12.0, 11.0, 8.0, 29.0, 32.0, 30.0, 45.0, 53.0, 53.0, 50.0, 128.0, 155.0, 233.0, 327.0, 545.0, 931.0, 8711.0, 1024078.0, 10307.0, 972.0, 542.0, 363.0, 242.0, 175.0, 121.0, 78.0, 62.0, 39.0, 39.0, 26.0, 38.0, 26.0, 11.0, 18.0, 9.0, 11.0, 7.0, 5.0, 9.0, 7.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.006000518798828125, -0.005810141563415527, -0.00561976432800293, -0.005429387092590332, -0.005239009857177734, -0.005048632621765137, -0.004858255386352539, -0.004667878150939941, -0.004477500915527344, -0.004287123680114746, -0.0040967464447021484, -0.003906369209289551, -0.003715991973876953, -0.0035256147384643555, -0.003335237503051758, -0.00314486026763916, -0.0029544830322265625, -0.002764105796813965, -0.002573728561401367, -0.0023833513259887695, -0.002192974090576172, -0.0020025968551635742, -0.0018122196197509766, -0.001621842384338379, -0.0014314651489257812, -0.0012410879135131836, -0.001050710678100586, -0.0008603334426879883, -0.0006699562072753906, -0.00047957897186279297, -0.0002892017364501953, -9.882450103759766e-05, 9.1552734375e-05, 0.00028192996978759766, 0.0004723072052001953, 0.000662684440612793, 0.0008530616760253906, 0.0010434389114379883, 0.001233816146850586, 0.0014241933822631836, 0.0016145706176757812, 0.001804947853088379, 0.0019953250885009766, 0.0021857023239135742, 0.002376079559326172, 0.0025664567947387695, 0.002756834030151367, 0.002947211265563965, 0.0031375885009765625, 0.00332796573638916, 0.003518342971801758, 0.0037087202072143555, 0.003899097442626953, 0.004089474678039551, 0.0042798519134521484, 0.004470229148864746, 0.004660606384277344, 0.004850983619689941, 0.005041360855102539, 0.005231738090515137, 0.005422115325927734, 0.005612492561340332, 0.00580286979675293, 0.005993247032165527, 0.006183624267578125]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 22.0, 178.0, 537.0, 247.0, 28.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0006031366647221148, -0.0005752437864430249, -0.0005473509663715959, -0.0005194580880925059, -0.0004915652680210769, -0.000463672389741987, -0.0004357795405667275, -0.00040788669139146805, -0.0003799938422162086, -0.0003521009930409491, -0.00032420814386568964, -0.00029631529469043016, -0.00026842241641134024, -0.000240529581787996, -0.0002126367180608213, -0.00018474386888556182, -0.00015685101971030235, -0.00012895817053504288, -0.0001010653140838258, -7.317245763260871e-05, -4.527960845734924e-05, -1.738675928208977e-05, 1.050610444508493e-05, 3.83989536203444e-05, 6.629180279560387e-05, 9.418465197086334e-05, 0.0001220775011461228, 0.0001499703648732975, 0.00017786321404855698, 0.00020575606322381645, 0.00023364892695099115, 0.0002615417761262506, 0.000289434683509171, 0.0003173275326844305, 0.00034522038185968995, 0.0003731132601387799, 0.0004010060802102089, 0.0004288989584892988, 0.0004567918076645583, 0.00048468465683981776, 0.0005125774769112468, 0.0005404703551903367, 0.0005683631752617657, 0.0005962560535408556, 0.0006241488736122847, 0.0006520417518913746, 0.0006799346301704645, 0.0007078274502418935, 0.0007357203285209835, 0.0007636132068000734, 0.0007915060268715024, 0.0008193989051505923, 0.0008472917252220213, 0.0008751846035011113, 0.0009030774235725403, 0.0009309703018516302, 0.0009588631801307201, 0.00098675605840981, 0.0010146489366889, 0.001042541698552668, 0.001070434576831758, 0.001098327455110848, 0.0011262203333899379, 0.001154113095253706, 0.001182005973532796]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 7.0, 8.0, 10.0, 5.0, 10.0, 11.0, 8.0, 12.0, 12.0, 24.0, 20.0, 32.0, 20.0, 29.0, 30.0, 28.0, 44.0, 31.0, 32.0, 41.0, 38.0, 44.0, 36.0, 40.0, 34.0, 37.0, 40.0, 48.0, 29.0, 29.0, 37.0, 26.0, 23.0, 21.0, 21.0, 12.0, 8.0, 14.0, 13.0, 14.0, 7.0, 9.0, 6.0, 7.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00020492076873779297, -0.0001990925520658493, -0.00019326433539390564, -0.00018743611872196198, -0.0001816079020500183, -0.00017577968537807465, -0.00016995146870613098, -0.00016412325203418732, -0.00015829503536224365, -0.0001524668186903, -0.00014663860201835632, -0.00014081038534641266, -0.000134982168674469, -0.00012915395200252533, -0.00012332573533058167, -0.000117497518658638, -0.00011166930198669434, -0.00010584108531475067, -0.00010001286864280701, -9.418465197086334e-05, -8.835643529891968e-05, -8.252821862697601e-05, -7.670000195503235e-05, -7.087178528308868e-05, -6.504356861114502e-05, -5.9215351939201355e-05, -5.338713526725769e-05, -4.7558918595314026e-05, -4.173070192337036e-05, -3.59024852514267e-05, -3.0074268579483032e-05, -2.4246051907539368e-05, -1.8417835235595703e-05, -1.2589618563652039e-05, -6.761401891708374e-06, -9.331852197647095e-07, 4.895031452178955e-06, 1.072324812412262e-05, 1.6551464796066284e-05, 2.237968146800995e-05, 2.8207898139953613e-05, 3.403611481189728e-05, 3.986433148384094e-05, 4.569254815578461e-05, 5.152076482772827e-05, 5.7348981499671936e-05, 6.31771981716156e-05, 6.900541484355927e-05, 7.483363151550293e-05, 8.06618481874466e-05, 8.649006485939026e-05, 9.231828153133392e-05, 9.814649820327759e-05, 0.00010397471487522125, 0.00010980293154716492, 0.00011563114821910858, 0.00012145936489105225, 0.0001272875815629959, 0.00013311579823493958, 0.00013894401490688324, 0.0001447722315788269, 0.00015060044825077057, 0.00015642866492271423, 0.0001622568815946579, 0.00016808509826660156]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 10.0, 7.0, 8.0, 7.0, 22.0, 19.0, 16.0, 17.0, 33.0, 28.0, 44.0, 35.0, 43.0, 44.0, 35.0, 47.0, 37.0, 39.0, 43.0, 46.0, 47.0, 48.0, 41.0, 37.0, 36.0, 31.0, 30.0, 28.0, 24.0, 19.0, 22.0, 9.0, 17.0, 18.0, 3.0, 7.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.224609375, -3.120361328125, -3.01611328125, -2.911865234375, -2.8076171875, -2.703369140625, -2.59912109375, -2.494873046875, -2.390625, -2.286376953125, -2.18212890625, -2.077880859375, -1.9736328125, -1.869384765625, -1.76513671875, -1.660888671875, -1.556640625, -1.452392578125, -1.34814453125, -1.243896484375, -1.1396484375, -1.035400390625, -0.93115234375, -0.826904296875, -0.72265625, -0.618408203125, -0.51416015625, -0.409912109375, -0.3056640625, -0.201416015625, -0.09716796875, 0.007080078125, 0.111328125, 0.215576171875, 0.31982421875, 0.424072265625, 0.5283203125, 0.632568359375, 0.73681640625, 0.841064453125, 0.9453125, 1.049560546875, 1.15380859375, 1.258056640625, 1.3623046875, 1.466552734375, 1.57080078125, 1.675048828125, 1.779296875, 1.883544921875, 1.98779296875, 2.092041015625, 2.1962890625, 2.300537109375, 2.40478515625, 2.509033203125, 2.61328125, 2.717529296875, 2.82177734375, 2.926025390625, 3.0302734375, 3.134521484375, 3.23876953125, 3.343017578125, 3.447265625]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 5.0, 4.0, 10.0, 17.0, 18.0, 29.0, 45.0, 63.0, 97.0, 143.0, 173.0, 244.0, 349.0, 455.0, 707.0, 893.0, 1383.0, 2008.0, 3137.0, 5821.0, 27725.0, 362120.0, 577609.0, 47385.0, 7361.0, 3504.0, 2227.0, 1514.0, 993.0, 747.0, 506.0, 356.0, 276.0, 184.0, 154.0, 82.0, 72.0, 42.0, 34.0, 24.0, 15.0, 11.0, 0.0, 6.0, 6.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-8.75, -8.4857177734375, -8.221435546875, -7.9571533203125, -7.69287109375, -7.4285888671875, -7.164306640625, -6.9000244140625, -6.6357421875, -6.3714599609375, -6.107177734375, -5.8428955078125, -5.57861328125, -5.3143310546875, -5.050048828125, -4.7857666015625, -4.521484375, -4.2572021484375, -3.992919921875, -3.7286376953125, -3.46435546875, -3.2000732421875, -2.935791015625, -2.6715087890625, -2.4072265625, -2.1429443359375, -1.878662109375, -1.6143798828125, -1.35009765625, -1.0858154296875, -0.821533203125, -0.5572509765625, -0.29296875, -0.0286865234375, 0.235595703125, 0.4998779296875, 0.76416015625, 1.0284423828125, 1.292724609375, 1.5570068359375, 1.8212890625, 2.0855712890625, 2.349853515625, 2.6141357421875, 2.87841796875, 3.1427001953125, 3.406982421875, 3.6712646484375, 3.935546875, 4.1998291015625, 4.464111328125, 4.7283935546875, 4.99267578125, 5.2569580078125, 5.521240234375, 5.7855224609375, 6.0498046875, 6.3140869140625, 6.578369140625, 6.8426513671875, 7.10693359375, 7.3712158203125, 7.635498046875, 7.8997802734375, 8.1640625]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 8.0, 7.0, 6.0, 9.0, 18.0, 16.0, 16.0, 31.0, 39.0, 30.0, 40.0, 56.0, 59.0, 73.0, 151.0, 1556.0, 408.0, 143.0, 59.0, 51.0, 51.0, 35.0, 34.0, 32.0, 21.0, 22.0, 17.0, 12.0, 8.0, 7.0, 7.0, 7.0, 8.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.125, -9.8170166015625, -9.509033203125, -9.2010498046875, -8.89306640625, -8.5850830078125, -8.277099609375, -7.9691162109375, -7.6611328125, -7.3531494140625, -7.045166015625, -6.7371826171875, -6.42919921875, -6.1212158203125, -5.813232421875, -5.5052490234375, -5.197265625, -4.8892822265625, -4.581298828125, -4.2733154296875, -3.96533203125, -3.6573486328125, -3.349365234375, -3.0413818359375, -2.7333984375, -2.4254150390625, -2.117431640625, -1.8094482421875, -1.50146484375, -1.1934814453125, -0.885498046875, -0.5775146484375, -0.26953125, 0.0384521484375, 0.346435546875, 0.6544189453125, 0.96240234375, 1.2703857421875, 1.578369140625, 1.8863525390625, 2.1943359375, 2.5023193359375, 2.810302734375, 3.1182861328125, 3.42626953125, 3.7342529296875, 4.042236328125, 4.3502197265625, 4.658203125, 4.9661865234375, 5.274169921875, 5.5821533203125, 5.89013671875, 6.1981201171875, 6.506103515625, 6.8140869140625, 7.1220703125, 7.4300537109375, 7.738037109375, 8.0460205078125, 8.35400390625, 8.6619873046875, 8.969970703125, 9.2779541015625, 9.5859375]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 2.0, 4.0, 8.0, 3.0, 10.0, 16.0, 11.0, 29.0, 24.0, 51.0, 97.0, 129.0, 211.0, 361.0, 746.0, 2077.0, 2858284.0, 280134.0, 1874.0, 700.0, 345.0, 222.0, 108.0, 90.0, 42.0, 39.0, 26.0, 22.0, 11.0, 8.0, 4.0, 2.0, 1.0, 6.0, 2.0, 7.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.0625, -41.6708984375, -40.279296875, -38.8876953125, -37.49609375, -36.1044921875, -34.712890625, -33.3212890625, -31.9296875, -30.5380859375, -29.146484375, -27.7548828125, -26.36328125, -24.9716796875, -23.580078125, -22.1884765625, -20.796875, -19.4052734375, -18.013671875, -16.6220703125, -15.23046875, -13.8388671875, -12.447265625, -11.0556640625, -9.6640625, -8.2724609375, -6.880859375, -5.4892578125, -4.09765625, -2.7060546875, -1.314453125, 0.0771484375, 1.46875, 2.8603515625, 4.251953125, 5.6435546875, 7.03515625, 8.4267578125, 9.818359375, 11.2099609375, 12.6015625, 13.9931640625, 15.384765625, 16.7763671875, 18.16796875, 19.5595703125, 20.951171875, 22.3427734375, 23.734375, 25.1259765625, 26.517578125, 27.9091796875, 29.30078125, 30.6923828125, 32.083984375, 33.4755859375, 34.8671875, 36.2587890625, 37.650390625, 39.0419921875, 40.43359375, 41.8251953125, 43.216796875, 44.6083984375, 46.0]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 18.0, 181.0, 554.0, 224.0, 31.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-143.19784545898438, -140.66525268554688, -138.13265991210938, -135.6000518798828, -133.0674591064453, -130.5348663330078, -128.00225830078125, -125.46966552734375, -122.93707275390625, -120.40447998046875, -117.87187957763672, -115.33927917480469, -112.80668640136719, -110.27409362792969, -107.74149322509766, -105.20889282226562, -102.67630004882812, -100.14370727539062, -97.6111068725586, -95.07850646972656, -92.54591369628906, -90.01332092285156, -87.48072052001953, -84.9481201171875, -82.41552734375, -79.8829345703125, -77.35033416748047, -74.81773376464844, -72.28514099121094, -69.75254821777344, -67.2199478149414, -64.68734741210938, -62.15475082397461, -59.622154235839844, -57.08955764770508, -54.55696105957031, -52.02436447143555, -49.49176788330078, -46.959171295166016, -44.42657470703125, -41.893978118896484, -39.36138153076172, -36.82878494262695, -34.29618835449219, -31.763591766357422, -29.230995178222656, -26.69839859008789, -24.165802001953125, -21.63320541381836, -19.100608825683594, -16.568012237548828, -14.035415649414062, -11.502819061279297, -8.970222473144531, -6.437625885009766, -3.905029296875, -1.3724327087402344, 1.1601638793945312, 3.692760467529297, 6.2253570556640625, 8.757953643798828, 11.290550231933594, 13.82314682006836, 16.355743408203125, 18.88833999633789]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 4.0, 8.0, 2.0, 7.0, 8.0, 12.0, 11.0, 19.0, 18.0, 19.0, 21.0, 27.0, 31.0, 28.0, 35.0, 28.0, 36.0, 33.0, 41.0, 37.0, 39.0, 48.0, 48.0, 48.0, 51.0, 42.0, 33.0, 36.0, 40.0, 25.0, 27.0, 27.0, 16.0, 12.0, 21.0, 18.0, 8.0, 14.0, 7.0, 6.0, 3.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-30.263473510742188, -29.354202270507812, -28.444929122924805, -27.53565788269043, -26.626384735107422, -25.717113494873047, -24.807842254638672, -23.898571014404297, -22.98929786682129, -22.080026626586914, -21.170753479003906, -20.26148223876953, -19.352210998535156, -18.44293785095215, -17.533666610717773, -16.624393463134766, -15.71512222290039, -14.8058500289917, -13.896577835083008, -12.987306594848633, -12.078034400939941, -11.16876220703125, -10.259490966796875, -9.350218772888184, -8.440946578979492, -7.531674385070801, -6.622402667999268, -5.713130950927734, -4.803858757019043, -3.8945865631103516, -2.9853148460388184, -2.076043128967285, -1.166769027709961, -0.25749707221984863, 0.6517748832702637, 1.561046838760376, 2.4703187942504883, 3.3795909881591797, 4.288862705230713, 5.198134422302246, 6.1074066162109375, 7.016678810119629, 7.925950527191162, 8.835222244262695, 9.744494438171387, 10.653766632080078, 11.563037872314453, 12.472310066223145, 13.381582260131836, 14.290854454040527, 15.200126647949219, 16.109397888183594, 17.01866912841797, 17.927942276000977, 18.83721351623535, 19.74648666381836, 20.655757904052734, 21.56502914428711, 22.474302291870117, 23.383573532104492, 24.2928466796875, 25.202117919921875, 26.11138916015625, 27.020660400390625, 27.929933547973633]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 3.0, 5.0, 4.0, 2.0, 6.0, 7.0, 13.0, 13.0, 13.0, 20.0, 25.0, 17.0, 20.0, 31.0, 28.0, 26.0, 36.0, 32.0, 43.0, 35.0, 37.0, 34.0, 42.0, 45.0, 29.0, 39.0, 24.0, 46.0, 40.0, 38.0, 28.0, 41.0, 29.0, 31.0, 21.0, 18.0, 17.0, 12.0, 20.0, 7.0, 4.0, 6.0, 8.0, 1.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.373046875, -3.27398681640625, -3.1749267578125, -3.07586669921875, -2.976806640625, -2.87774658203125, -2.7786865234375, -2.67962646484375, -2.58056640625, -2.48150634765625, -2.3824462890625, -2.28338623046875, -2.184326171875, -2.08526611328125, -1.9862060546875, -1.88714599609375, -1.7880859375, -1.68902587890625, -1.5899658203125, -1.49090576171875, -1.391845703125, -1.29278564453125, -1.1937255859375, -1.09466552734375, -0.99560546875, -0.89654541015625, -0.7974853515625, -0.69842529296875, -0.599365234375, -0.50030517578125, -0.4012451171875, -0.30218505859375, -0.203125, -0.10406494140625, -0.0050048828125, 0.09405517578125, 0.193115234375, 0.29217529296875, 0.3912353515625, 0.49029541015625, 0.58935546875, 0.68841552734375, 0.7874755859375, 0.88653564453125, 0.985595703125, 1.08465576171875, 1.1837158203125, 1.28277587890625, 1.3818359375, 1.48089599609375, 1.5799560546875, 1.67901611328125, 1.778076171875, 1.87713623046875, 1.9761962890625, 2.07525634765625, 2.17431640625, 2.27337646484375, 2.3724365234375, 2.47149658203125, 2.570556640625, 2.66961669921875, 2.7686767578125, 2.86773681640625, 2.966796875]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 3.0, 5.0, 7.0, 5.0, 13.0, 11.0, 26.0, 17.0, 34.0, 37.0, 31.0, 60.0, 84.0, 130.0, 227.0, 407.0, 961.0, 2310.0, 7732.0, 36116.0, 321894.0, 2139542.0, 1480306.0, 172600.0, 22670.0, 5502.0, 1816.0, 723.0, 380.0, 201.0, 113.0, 78.0, 57.0, 39.0, 30.0, 22.0, 23.0, 19.0, 13.0, 10.0, 7.0, 8.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.5, -7.2908935546875, -7.081787109375, -6.8726806640625, -6.66357421875, -6.4544677734375, -6.245361328125, -6.0362548828125, -5.8271484375, -5.6180419921875, -5.408935546875, -5.1998291015625, -4.99072265625, -4.7816162109375, -4.572509765625, -4.3634033203125, -4.154296875, -3.9451904296875, -3.736083984375, -3.5269775390625, -3.31787109375, -3.1087646484375, -2.899658203125, -2.6905517578125, -2.4814453125, -2.2723388671875, -2.063232421875, -1.8541259765625, -1.64501953125, -1.4359130859375, -1.226806640625, -1.0177001953125, -0.80859375, -0.5994873046875, -0.390380859375, -0.1812744140625, 0.02783203125, 0.2369384765625, 0.446044921875, 0.6551513671875, 0.8642578125, 1.0733642578125, 1.282470703125, 1.4915771484375, 1.70068359375, 1.9097900390625, 2.118896484375, 2.3280029296875, 2.537109375, 2.7462158203125, 2.955322265625, 3.1644287109375, 3.37353515625, 3.5826416015625, 3.791748046875, 4.0008544921875, 4.2099609375, 4.4190673828125, 4.628173828125, 4.8372802734375, 5.04638671875, 5.2554931640625, 5.464599609375, 5.6737060546875, 5.8828125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 29.0, 72.0, 248.0, 897.0, 1815.0, 740.0, 199.0, 55.0, 16.0, 7.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.171875, -25.4130859375, -24.654296875, -23.8955078125, -23.13671875, -22.3779296875, -21.619140625, -20.8603515625, -20.1015625, -19.3427734375, -18.583984375, -17.8251953125, -17.06640625, -16.3076171875, -15.548828125, -14.7900390625, -14.03125, -13.2724609375, -12.513671875, -11.7548828125, -10.99609375, -10.2373046875, -9.478515625, -8.7197265625, -7.9609375, -7.2021484375, -6.443359375, -5.6845703125, -4.92578125, -4.1669921875, -3.408203125, -2.6494140625, -1.890625, -1.1318359375, -0.373046875, 0.3857421875, 1.14453125, 1.9033203125, 2.662109375, 3.4208984375, 4.1796875, 4.9384765625, 5.697265625, 6.4560546875, 7.21484375, 7.9736328125, 8.732421875, 9.4912109375, 10.25, 11.0087890625, 11.767578125, 12.5263671875, 13.28515625, 14.0439453125, 14.802734375, 15.5615234375, 16.3203125, 17.0791015625, 17.837890625, 18.5966796875, 19.35546875, 20.1142578125, 20.873046875, 21.6318359375, 22.390625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 2.0, 3.0, 7.0, 11.0, 29.0, 52.0, 249.0, 1423.0, 499517.0, 3690395.0, 2057.0, 400.0, 93.0, 25.0, 12.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.46875, -47.82373046875, -46.1787109375, -44.53369140625, -42.888671875, -41.24365234375, -39.5986328125, -37.95361328125, -36.30859375, -34.66357421875, -33.0185546875, -31.37353515625, -29.728515625, -28.08349609375, -26.4384765625, -24.79345703125, -23.1484375, -21.50341796875, -19.8583984375, -18.21337890625, -16.568359375, -14.92333984375, -13.2783203125, -11.63330078125, -9.98828125, -8.34326171875, -6.6982421875, -5.05322265625, -3.408203125, -1.76318359375, -0.1181640625, 1.52685546875, 3.171875, 4.81689453125, 6.4619140625, 8.10693359375, 9.751953125, 11.39697265625, 13.0419921875, 14.68701171875, 16.33203125, 17.97705078125, 19.6220703125, 21.26708984375, 22.912109375, 24.55712890625, 26.2021484375, 27.84716796875, 29.4921875, 31.13720703125, 32.7822265625, 34.42724609375, 36.072265625, 37.71728515625, 39.3623046875, 41.00732421875, 42.65234375, 44.29736328125, 45.9423828125, 47.58740234375, 49.232421875, 50.87744140625, 52.5224609375, 54.16748046875, 55.8125]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 31.0, 164.0, 473.0, 279.0, 51.0, 8.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.59152221679688, -101.88837432861328, -99.18522644042969, -96.4820785522461, -93.7789306640625, -91.0757827758789, -88.37263488769531, -85.66949462890625, -82.96633911132812, -80.26319122314453, -77.56004333496094, -74.85689544677734, -72.15374755859375, -69.45059967041016, -66.74745178222656, -64.0443115234375, -61.341163635253906, -58.63801574707031, -55.93486785888672, -53.231719970703125, -50.52857208251953, -47.82542419433594, -45.12228012084961, -42.419132232666016, -39.71598434448242, -37.01283645629883, -34.309688568115234, -31.606542587280273, -28.90339469909668, -26.200246810913086, -23.497100830078125, -20.79395294189453, -18.090805053710938, -15.387657165527344, -12.684510231018066, -9.981363296508789, -7.278215408325195, -4.575067520141602, -1.8719215393066406, 0.8312263488769531, 3.534374237060547, 6.237521648406982, 8.940669059753418, 11.643815994262695, 14.346963882446289, 17.050111770629883, 19.753257751464844, 22.456405639648438, 25.15955352783203, 27.862701416015625, 30.56584930419922, 33.26899719238281, 35.972145080566406, 38.67529296875, 41.37843704223633, 44.08158493041992, 46.784732818603516, 49.48788070678711, 52.1910285949707, 54.89417266845703, 57.597320556640625, 60.30046844482422, 63.00361633300781, 65.7067642211914, 68.409912109375]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 6.0, 4.0, 17.0, 10.0, 8.0, 10.0, 14.0, 17.0, 22.0, 14.0, 27.0, 19.0, 29.0, 29.0, 43.0, 37.0, 32.0, 47.0, 40.0, 45.0, 27.0, 49.0, 25.0, 33.0, 38.0, 33.0, 42.0, 28.0, 29.0, 32.0, 22.0, 24.0, 25.0, 25.0, 21.0, 19.0, 11.0, 14.0, 6.0, 7.0, 2.0, 4.0, 7.0, 7.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.871299743652344, -25.081384658813477, -24.291467666625977, -23.50155258178711, -22.711637496948242, -21.921722412109375, -21.131805419921875, -20.341890335083008, -19.55197525024414, -18.762060165405273, -17.972143173217773, -17.182228088378906, -16.39231300354004, -15.602396965026855, -14.812480926513672, -14.022565841674805, -13.232648849487305, -12.442732810974121, -11.652817726135254, -10.86290168762207, -10.072986602783203, -9.28307056427002, -8.493154525756836, -7.7032389640808105, -6.913323402404785, -6.12340784072876, -5.333492279052734, -4.543576240539551, -3.7536606788635254, -2.9637451171875, -2.1738290786743164, -1.383913516998291, -0.5939960479736328, 0.19591963291168213, 0.9858353137969971, 1.7757511138916016, 2.565666675567627, 3.3555822372436523, 4.145498275756836, 4.935413837432861, 5.725329399108887, 6.515244960784912, 7.3051605224609375, 8.095076560974121, 8.884992599487305, 9.674907684326172, 10.464823722839355, 11.254739761352539, 12.044654846191406, 12.83457088470459, 13.624485969543457, 14.41440200805664, 15.204317092895508, 15.994233131408691, 16.784149169921875, 17.574064254760742, 18.36397933959961, 19.153894424438477, 19.943811416625977, 20.733726501464844, 21.52364158630371, 22.313556671142578, 23.103473663330078, 23.893388748168945, 24.683305740356445]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 3.0, 8.0, 5.0, 8.0, 7.0, 7.0, 10.0, 11.0, 15.0, 18.0, 21.0, 17.0, 15.0, 20.0, 23.0, 21.0, 26.0, 26.0, 38.0, 30.0, 23.0, 40.0, 30.0, 31.0, 36.0, 45.0, 39.0, 38.0, 41.0, 42.0, 27.0, 40.0, 33.0, 28.0, 29.0, 24.0, 21.0, 18.0, 14.0, 23.0, 10.0, 10.0, 7.0, 4.0, 7.0, 4.0, 6.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9619140625, -1.8910675048828125, -1.820220947265625, -1.7493743896484375, -1.67852783203125, -1.6076812744140625, -1.536834716796875, -1.4659881591796875, -1.3951416015625, -1.3242950439453125, -1.253448486328125, -1.1826019287109375, -1.11175537109375, -1.0409088134765625, -0.970062255859375, -0.8992156982421875, -0.828369140625, -0.7575225830078125, -0.686676025390625, -0.6158294677734375, -0.54498291015625, -0.4741363525390625, -0.403289794921875, -0.3324432373046875, -0.2615966796875, -0.1907501220703125, -0.119903564453125, -0.0490570068359375, 0.02178955078125, 0.0926361083984375, 0.163482666015625, 0.2343292236328125, 0.30517578125, 0.3760223388671875, 0.446868896484375, 0.5177154541015625, 0.58856201171875, 0.6594085693359375, 0.730255126953125, 0.8011016845703125, 0.8719482421875, 0.9427947998046875, 1.013641357421875, 1.0844879150390625, 1.15533447265625, 1.2261810302734375, 1.297027587890625, 1.3678741455078125, 1.438720703125, 1.5095672607421875, 1.580413818359375, 1.6512603759765625, 1.72210693359375, 1.7929534912109375, 1.863800048828125, 1.9346466064453125, 2.0054931640625, 2.0763397216796875, 2.147186279296875, 2.2180328369140625, 2.28887939453125, 2.3597259521484375, 2.430572509765625, 2.5014190673828125, 2.572265625]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 5.0, 5.0, 8.0, 15.0, 18.0, 21.0, 33.0, 42.0, 58.0, 104.0, 181.0, 254.0, 387.0, 573.0, 906.0, 1395.0, 2247.0, 3391.0, 5445.0, 8370.0, 13051.0, 20726.0, 33074.0, 56067.0, 100223.0, 200746.0, 279901.0, 136057.0, 72586.0, 42062.0, 25483.0, 16397.0, 10226.0, 6570.0, 4330.0, 2733.0, 1741.0, 1100.0, 726.0, 462.0, 288.0, 195.0, 114.0, 80.0, 50.0, 42.0, 31.0, 20.0, 7.0, 6.0, 6.0, 1.0, 1.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.401611328125, -0.3873863220214844, -0.37316131591796875, -0.3589363098144531, -0.3447113037109375, -0.3304862976074219, -0.31626129150390625, -0.3020362854003906, -0.287811279296875, -0.2735862731933594, -0.25936126708984375, -0.24513626098632812, -0.2309112548828125, -0.21668624877929688, -0.20246124267578125, -0.18823623657226562, -0.17401123046875, -0.15978622436523438, -0.14556121826171875, -0.13133621215820312, -0.1171112060546875, -0.10288619995117188, -0.08866119384765625, -0.07443618774414062, -0.060211181640625, -0.045986175537109375, -0.03176116943359375, -0.017536163330078125, -0.0033111572265625, 0.010913848876953125, 0.02513885498046875, 0.039363861083984375, 0.0535888671875, 0.06781387329101562, 0.08203887939453125, 0.09626388549804688, 0.1104888916015625, 0.12471389770507812, 0.13893890380859375, 0.15316390991210938, 0.167388916015625, 0.18161392211914062, 0.19583892822265625, 0.21006393432617188, 0.2242889404296875, 0.23851394653320312, 0.25273895263671875, 0.2669639587402344, 0.28118896484375, 0.2954139709472656, 0.30963897705078125, 0.3238639831542969, 0.3380889892578125, 0.3523139953613281, 0.36653900146484375, 0.3807640075683594, 0.394989013671875, 0.4092140197753906, 0.42343902587890625, 0.4376640319824219, 0.4518890380859375, 0.4661140441894531, 0.48033905029296875, 0.4945640563964844, 0.5087890625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 7.0, 2.0, 2.0, 3.0, 9.0, 7.0, 10.0, 12.0, 15.0, 21.0, 12.0, 13.0, 31.0, 19.0, 22.0, 30.0, 29.0, 41.0, 38.0, 41.0, 48.0, 38.0, 35.0, 1066.0, 40.0, 33.0, 36.0, 47.0, 37.0, 34.0, 32.0, 30.0, 47.0, 13.0, 27.0, 21.0, 20.0, 14.0, 17.0, 8.0, 8.0, 6.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7099609375, -1.65826416015625, -1.6065673828125, -1.55487060546875, -1.503173828125, -1.45147705078125, -1.3997802734375, -1.34808349609375, -1.29638671875, -1.24468994140625, -1.1929931640625, -1.14129638671875, -1.089599609375, -1.03790283203125, -0.9862060546875, -0.93450927734375, -0.8828125, -0.83111572265625, -0.7794189453125, -0.72772216796875, -0.676025390625, -0.62432861328125, -0.5726318359375, -0.52093505859375, -0.46923828125, -0.41754150390625, -0.3658447265625, -0.31414794921875, -0.262451171875, -0.21075439453125, -0.1590576171875, -0.10736083984375, -0.0556640625, -0.00396728515625, 0.0477294921875, 0.09942626953125, 0.151123046875, 0.20281982421875, 0.2545166015625, 0.30621337890625, 0.35791015625, 0.40960693359375, 0.4613037109375, 0.51300048828125, 0.564697265625, 0.61639404296875, 0.6680908203125, 0.71978759765625, 0.771484375, 0.82318115234375, 0.8748779296875, 0.92657470703125, 0.978271484375, 1.02996826171875, 1.0816650390625, 1.13336181640625, 1.18505859375, 1.23675537109375, 1.2884521484375, 1.34014892578125, 1.391845703125, 1.44354248046875, 1.4952392578125, 1.54693603515625, 1.5986328125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 13.0, 14.0, 17.0, 27.0, 50.0, 74.0, 102.0, 170.0, 233.0, 377.0, 555.0, 820.0, 1297.0, 1940.0, 2870.0, 4491.0, 6925.0, 10835.0, 17182.0, 27605.0, 45995.0, 79319.0, 152250.0, 1350179.0, 174465.0, 87663.0, 49990.0, 29728.0, 18411.0, 11704.0, 7560.0, 4975.0, 3144.0, 2189.0, 1325.0, 908.0, 598.0, 387.0, 243.0, 177.0, 108.0, 91.0, 41.0, 27.0, 25.0, 14.0, 10.0, 6.0, 2.0, 3.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.453857421875, -0.4399299621582031, -0.42600250244140625, -0.4120750427246094, -0.3981475830078125, -0.3842201232910156, -0.37029266357421875, -0.3563652038574219, -0.342437744140625, -0.3285102844238281, -0.31458282470703125, -0.3006553649902344, -0.2867279052734375, -0.2728004455566406, -0.25887298583984375, -0.24494552612304688, -0.23101806640625, -0.21709060668945312, -0.20316314697265625, -0.18923568725585938, -0.1753082275390625, -0.16138076782226562, -0.14745330810546875, -0.13352584838867188, -0.119598388671875, -0.10567092895507812, -0.09174346923828125, -0.07781600952148438, -0.0638885498046875, -0.049961090087890625, -0.03603363037109375, -0.022106170654296875, -0.0081787109375, 0.005748748779296875, 0.01967620849609375, 0.033603668212890625, 0.0475311279296875, 0.061458587646484375, 0.07538604736328125, 0.08931350708007812, 0.103240966796875, 0.11716842651367188, 0.13109588623046875, 0.14502334594726562, 0.1589508056640625, 0.17287826538085938, 0.18680572509765625, 0.20073318481445312, 0.21466064453125, 0.22858810424804688, 0.24251556396484375, 0.2564430236816406, 0.2703704833984375, 0.2842979431152344, 0.29822540283203125, 0.3121528625488281, 0.326080322265625, 0.3400077819824219, 0.35393524169921875, 0.3678627014160156, 0.3817901611328125, 0.3957176208496094, 0.40964508056640625, 0.4235725402832031, 0.4375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 3.0, 6.0, 4.0, 12.0, 12.0, 14.0, 12.0, 15.0, 19.0, 24.0, 25.0, 34.0, 38.0, 48.0, 46.0, 52.0, 47.0, 62.0, 59.0, 50.0, 52.0, 48.0, 54.0, 37.0, 32.0, 33.0, 28.0, 20.0, 19.0, 23.0, 13.0, 15.0, 5.0, 7.0, 2.0, 2.0, 7.0, 6.0, 4.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00034356117248535156, -0.00033297762274742126, -0.00032239407300949097, -0.00031181052327156067, -0.00030122697353363037, -0.0002906434237957001, -0.0002800598740577698, -0.0002694763243198395, -0.0002588927745819092, -0.0002483092248439789, -0.00023772567510604858, -0.00022714212536811829, -0.000216558575630188, -0.0002059750258922577, -0.0001953914761543274, -0.0001848079264163971, -0.0001742243766784668, -0.0001636408269405365, -0.0001530572772026062, -0.0001424737274646759, -0.0001318901777267456, -0.00012130662798881531, -0.00011072307825088501, -0.00010013952851295471, -8.955597877502441e-05, -7.897242903709412e-05, -6.838887929916382e-05, -5.780532956123352e-05, -4.722177982330322e-05, -3.6638230085372925e-05, -2.6054680347442627e-05, -1.547113060951233e-05, -4.887580871582031e-06, 5.695968866348267e-06, 1.6279518604278564e-05, 2.6863068342208862e-05, 3.744661808013916e-05, 4.803016781806946e-05, 5.8613717555999756e-05, 6.919726729393005e-05, 7.978081703186035e-05, 9.036436676979065e-05, 0.00010094791650772095, 0.00011153146624565125, 0.00012211501598358154, 0.00013269856572151184, 0.00014328211545944214, 0.00015386566519737244, 0.00016444921493530273, 0.00017503276467323303, 0.00018561631441116333, 0.00019619986414909363, 0.00020678341388702393, 0.00021736696362495422, 0.00022795051336288452, 0.00023853406310081482, 0.0002491176128387451, 0.0002597011625766754, 0.0002702847123146057, 0.000280868262052536, 0.0002914518117904663, 0.0003020353615283966, 0.0003126189112663269, 0.0003232024610042572, 0.0003337860107421875]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 7.0, 10.0, 6.0, 6.0, 12.0, 10.0, 17.0, 30.0, 37.0, 62.0, 76.0, 113.0, 159.0, 254.0, 409.0, 831.0, 2641.0, 1037891.0, 3751.0, 911.0, 461.0, 262.0, 174.0, 119.0, 89.0, 45.0, 50.0, 39.0, 23.0, 15.0, 15.0, 11.0, 5.0, 4.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00811767578125, -0.007868289947509766, -0.007618904113769531, -0.007369518280029297, -0.0071201324462890625, -0.006870746612548828, -0.006621360778808594, -0.006371974945068359, -0.006122589111328125, -0.005873203277587891, -0.005623817443847656, -0.005374431610107422, -0.0051250457763671875, -0.004875659942626953, -0.004626274108886719, -0.004376888275146484, -0.00412750244140625, -0.0038781166076660156, -0.0036287307739257812, -0.003379344940185547, -0.0031299591064453125, -0.002880573272705078, -0.0026311874389648438, -0.0023818016052246094, -0.002132415771484375, -0.0018830299377441406, -0.0016336441040039062, -0.0013842582702636719, -0.0011348724365234375, -0.0008854866027832031, -0.0006361007690429688, -0.0003867149353027344, -0.0001373291015625, 0.00011205673217773438, 0.00036144256591796875, 0.0006108283996582031, 0.0008602142333984375, 0.0011096000671386719, 0.0013589859008789062, 0.0016083717346191406, 0.001857757568359375, 0.0021071434020996094, 0.0023565292358398438, 0.002605915069580078, 0.0028553009033203125, 0.003104686737060547, 0.0033540725708007812, 0.0036034584045410156, 0.00385284423828125, 0.004102230072021484, 0.004351615905761719, 0.004601001739501953, 0.0048503875732421875, 0.005099773406982422, 0.005349159240722656, 0.005598545074462891, 0.005847930908203125, 0.006097316741943359, 0.006346702575683594, 0.006596088409423828, 0.0068454742431640625, 0.007094860076904297, 0.007344245910644531, 0.007593631744384766, 0.007843017578125]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 65.0, 553.0, 364.0, 27.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001295246183872223, -0.0012669855495914817, -0.0012387249153107405, -0.0012104642810299993, -0.001182203646749258, -0.0011539431288838387, -0.0011256824946030974, -0.0010974218603223562, -0.001069161226041615, -0.0010409005917608738, -0.0010126399574801326, -0.0009843793231993914, -0.0009561187471263111, -0.0009278581128455698, -0.0008995975367724895, -0.0008713369024917483, -0.0008430762682110071, -0.0008148156339302659, -0.0007865549996495247, -0.0007582944235764444, -0.0007300337892957032, -0.000701773155014962, -0.0006735125789418817, -0.0006452519446611404, -0.0006169913103803992, -0.000588730676099658, -0.0005604700418189168, -0.0005322094657458365, -0.0005039488314650953, -0.00047568819718435407, -0.0004474275920074433, -0.00041916698683053255, -0.0003909062943421304, -0.0003626456600613892, -0.00033438505488447845, -0.0003061244497075677, -0.0002778638154268265, -0.00024960318114608526, -0.0002213425759691745, -0.00019308195624034852, -0.00016482133651152253, -0.00013656071678269655, -0.00010830009705387056, -8.003947732504457e-05, -5.1778857596218586e-05, -2.35182378673926e-05, 4.742381861433387e-06, 3.300300159025937e-05, 6.126362131908536e-05, 8.952424104791135e-05, 0.00011778486077673733, 0.00014604548050556332, 0.0001743061002343893, 0.0002025667199632153, 0.00023082733969204128, 0.00025908794486895204, 0.00028734857914969325, 0.00031560921343043447, 0.0003438698186073452, 0.000372130423784256, 0.0004003910580649972, 0.0004286516923457384, 0.00045691229752264917, 0.0004851729026995599, 0.0005134335369803011]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 4.0, 4.0, 12.0, 11.0, 16.0, 12.0, 9.0, 13.0, 25.0, 22.0, 18.0, 26.0, 24.0, 27.0, 44.0, 43.0, 44.0, 40.0, 37.0, 37.0, 46.0, 37.0, 43.0, 52.0, 39.0, 43.0, 25.0, 33.0, 31.0, 25.0, 13.0, 20.0, 23.0, 16.0, 15.0, 12.0, 11.0, 15.0, 10.0, 6.0, 2.0, 5.0, 4.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.00020182132720947266, -0.00019604898989200592, -0.00019027665257453918, -0.00018450431525707245, -0.0001787319779396057, -0.00017295964062213898, -0.00016718730330467224, -0.0001614149659872055, -0.00015564262866973877, -0.00014987029135227203, -0.0001440979540348053, -0.00013832561671733856, -0.00013255327939987183, -0.0001267809420824051, -0.00012100860476493835, -0.00011523626744747162, -0.00010946393013000488, -0.00010369159281253815, -9.791925549507141e-05, -9.214691817760468e-05, -8.637458086013794e-05, -8.06022435426712e-05, -7.482990622520447e-05, -6.905756890773773e-05, -6.3285231590271e-05, -5.751289427280426e-05, -5.1740556955337524e-05, -4.596821963787079e-05, -4.019588232040405e-05, -3.442354500293732e-05, -2.865120768547058e-05, -2.2878870368003845e-05, -1.710653305053711e-05, -1.1334195733070374e-05, -5.561858415603638e-06, 2.1047890186309814e-07, 5.982816219329834e-06, 1.175515353679657e-05, 1.7527490854263306e-05, 2.329982817173004e-05, 2.9072165489196777e-05, 3.484450280666351e-05, 4.061684012413025e-05, 4.6389177441596985e-05, 5.216151475906372e-05, 5.7933852076530457e-05, 6.370618939399719e-05, 6.947852671146393e-05, 7.525086402893066e-05, 8.10232013463974e-05, 8.679553866386414e-05, 9.256787598133087e-05, 9.834021329879761e-05, 0.00010411255061626434, 0.00010988488793373108, 0.00011565722525119781, 0.00012142956256866455, 0.0001272018998861313, 0.00013297423720359802, 0.00013874657452106476, 0.0001445189118385315, 0.00015029124915599823, 0.00015606358647346497, 0.0001618359237909317, 0.00016760826110839844]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [5.0, 1.0, 2.0, 3.0, 8.0, 5.0, 8.0, 7.0, 7.0, 10.0, 11.0, 15.0, 18.0, 21.0, 17.0, 15.0, 20.0, 23.0, 21.0, 26.0, 26.0, 38.0, 30.0, 23.0, 40.0, 30.0, 31.0, 36.0, 45.0, 39.0, 38.0, 41.0, 42.0, 27.0, 40.0, 33.0, 28.0, 29.0, 23.0, 22.0, 18.0, 14.0, 23.0, 10.0, 10.0, 7.0, 4.0, 7.0, 4.0, 6.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9619140625, -1.8910675048828125, -1.820220947265625, -1.7493743896484375, -1.67852783203125, -1.6076812744140625, -1.536834716796875, -1.4659881591796875, -1.3951416015625, -1.3242950439453125, -1.253448486328125, -1.1826019287109375, -1.11175537109375, -1.0409088134765625, -0.970062255859375, -0.8992156982421875, -0.828369140625, -0.7575225830078125, -0.686676025390625, -0.6158294677734375, -0.54498291015625, -0.4741363525390625, -0.403289794921875, -0.3324432373046875, -0.2615966796875, -0.1907501220703125, -0.119903564453125, -0.0490570068359375, 0.02178955078125, 0.0926361083984375, 0.163482666015625, 0.2343292236328125, 0.30517578125, 0.3760223388671875, 0.446868896484375, 0.5177154541015625, 0.58856201171875, 0.6594085693359375, 0.730255126953125, 0.8011016845703125, 0.8719482421875, 0.9427947998046875, 1.013641357421875, 1.0844879150390625, 1.15533447265625, 1.2261810302734375, 1.297027587890625, 1.3678741455078125, 1.438720703125, 1.5095672607421875, 1.580413818359375, 1.6512603759765625, 1.72210693359375, 1.7929534912109375, 1.863800048828125, 1.9346466064453125, 2.0054931640625, 2.0763397216796875, 2.147186279296875, 2.2180328369140625, 2.28887939453125, 2.3597259521484375, 2.430572509765625, 2.5014190673828125, 2.572265625]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 12.0, 16.0, 15.0, 27.0, 26.0, 44.0, 44.0, 80.0, 91.0, 127.0, 158.0, 229.0, 329.0, 483.0, 742.0, 1207.0, 2095.0, 4212.0, 10528.0, 39074.0, 257153.0, 594055.0, 103101.0, 20357.0, 6787.0, 3014.0, 1612.0, 933.0, 553.0, 402.0, 271.0, 198.0, 149.0, 130.0, 84.0, 61.0, 46.0, 36.0, 20.0, 17.0, 12.0, 6.0, 5.0, 2.0, 7.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.40625, -4.2557373046875, -4.105224609375, -3.9547119140625, -3.80419921875, -3.6536865234375, -3.503173828125, -3.3526611328125, -3.2021484375, -3.0516357421875, -2.901123046875, -2.7506103515625, -2.60009765625, -2.4495849609375, -2.299072265625, -2.1485595703125, -1.998046875, -1.8475341796875, -1.697021484375, -1.5465087890625, -1.39599609375, -1.2454833984375, -1.094970703125, -0.9444580078125, -0.7939453125, -0.6434326171875, -0.492919921875, -0.3424072265625, -0.19189453125, -0.0413818359375, 0.109130859375, 0.2596435546875, 0.41015625, 0.5606689453125, 0.711181640625, 0.8616943359375, 1.01220703125, 1.1627197265625, 1.313232421875, 1.4637451171875, 1.6142578125, 1.7647705078125, 1.915283203125, 2.0657958984375, 2.21630859375, 2.3668212890625, 2.517333984375, 2.6678466796875, 2.818359375, 2.9688720703125, 3.119384765625, 3.2698974609375, 3.42041015625, 3.5709228515625, 3.721435546875, 3.8719482421875, 4.0224609375, 4.1729736328125, 4.323486328125, 4.4739990234375, 4.62451171875, 4.7750244140625, 4.925537109375, 5.0760498046875, 5.2265625]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 7.0, 4.0, 5.0, 9.0, 5.0, 13.0, 7.0, 13.0, 16.0, 18.0, 19.0, 33.0, 31.0, 36.0, 57.0, 42.0, 85.0, 158.0, 435.0, 1483.0, 155.0, 83.0, 63.0, 42.0, 44.0, 40.0, 31.0, 24.0, 22.0, 18.0, 12.0, 10.0, 8.0, 2.0, 2.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.390625, -9.1064453125, -8.822265625, -8.5380859375, -8.25390625, -7.9697265625, -7.685546875, -7.4013671875, -7.1171875, -6.8330078125, -6.548828125, -6.2646484375, -5.98046875, -5.6962890625, -5.412109375, -5.1279296875, -4.84375, -4.5595703125, -4.275390625, -3.9912109375, -3.70703125, -3.4228515625, -3.138671875, -2.8544921875, -2.5703125, -2.2861328125, -2.001953125, -1.7177734375, -1.43359375, -1.1494140625, -0.865234375, -0.5810546875, -0.296875, -0.0126953125, 0.271484375, 0.5556640625, 0.83984375, 1.1240234375, 1.408203125, 1.6923828125, 1.9765625, 2.2607421875, 2.544921875, 2.8291015625, 3.11328125, 3.3974609375, 3.681640625, 3.9658203125, 4.25, 4.5341796875, 4.818359375, 5.1025390625, 5.38671875, 5.6708984375, 5.955078125, 6.2392578125, 6.5234375, 6.8076171875, 7.091796875, 7.3759765625, 7.66015625, 7.9443359375, 8.228515625, 8.5126953125, 8.796875]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 9.0, 5.0, 7.0, 14.0, 19.0, 23.0, 36.0, 36.0, 72.0, 82.0, 102.0, 169.0, 320.0, 570.0, 1422.0, 24516.0, 3110201.0, 5751.0, 1042.0, 414.0, 244.0, 175.0, 115.0, 91.0, 65.0, 48.0, 47.0, 27.0, 14.0, 13.0, 15.0, 9.0, 6.0, 6.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-19.5625, -18.957763671875, -18.35302734375, -17.748291015625, -17.1435546875, -16.538818359375, -15.93408203125, -15.329345703125, -14.724609375, -14.119873046875, -13.51513671875, -12.910400390625, -12.3056640625, -11.700927734375, -11.09619140625, -10.491455078125, -9.88671875, -9.281982421875, -8.67724609375, -8.072509765625, -7.4677734375, -6.863037109375, -6.25830078125, -5.653564453125, -5.048828125, -4.444091796875, -3.83935546875, -3.234619140625, -2.6298828125, -2.025146484375, -1.42041015625, -0.815673828125, -0.2109375, 0.393798828125, 0.99853515625, 1.603271484375, 2.2080078125, 2.812744140625, 3.41748046875, 4.022216796875, 4.626953125, 5.231689453125, 5.83642578125, 6.441162109375, 7.0458984375, 7.650634765625, 8.25537109375, 8.860107421875, 9.46484375, 10.069580078125, 10.67431640625, 11.279052734375, 11.8837890625, 12.488525390625, 13.09326171875, 13.697998046875, 14.302734375, 14.907470703125, 15.51220703125, 16.116943359375, 16.7216796875, 17.326416015625, 17.93115234375, 18.535888671875, 19.140625]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 47.0, 967.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-314.534912109375, -308.74957275390625, -302.9642333984375, -297.17889404296875, -291.3935546875, -285.60821533203125, -279.8228759765625, -274.0375671386719, -268.2522277832031, -262.4668884277344, -256.6815490722656, -250.89620971679688, -245.1108856201172, -239.32554626464844, -233.5402069091797, -227.75486755371094, -221.9695281982422, -216.18418884277344, -210.3988494873047, -204.613525390625, -198.82818603515625, -193.0428466796875, -187.25750732421875, -181.47216796875, -175.68682861328125, -169.9014892578125, -164.11614990234375, -158.330810546875, -152.5454864501953, -146.76014709472656, -140.9748077392578, -135.18946838378906, -129.40415954589844, -123.61882019042969, -117.83348846435547, -112.04814910888672, -106.2628173828125, -100.47747802734375, -94.692138671875, -88.90679931640625, -83.1214599609375, -77.33612060546875, -71.55078887939453, -65.76544952392578, -59.9801139831543, -54.19477844238281, -48.40943908691406, -42.62410354614258, -36.83877182006836, -31.053436279296875, -25.268098831176758, -19.48276138305664, -13.697425842285156, -7.912090301513672, -2.126750946044922, 3.6585845947265625, 9.443920135498047, 15.229256629943848, 21.01459312438965, 26.799930572509766, 32.58526611328125, 38.370601654052734, 44.155941009521484, 49.94127655029297, 55.72661209106445]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 5.0, 5.0, 4.0, 4.0, 9.0, 4.0, 7.0, 7.0, 7.0, 7.0, 16.0, 13.0, 16.0, 18.0, 15.0, 21.0, 19.0, 30.0, 23.0, 26.0, 24.0, 32.0, 27.0, 42.0, 27.0, 33.0, 34.0, 34.0, 45.0, 36.0, 33.0, 30.0, 28.0, 37.0, 27.0, 27.0, 20.0, 21.0, 26.0, 19.0, 22.0, 13.0, 20.0, 10.0, 15.0, 12.0, 12.0, 10.0, 7.0, 10.0, 10.0, 5.0, 1.0, 6.0, 3.0, 1.0], "bins": [-18.782054901123047, -18.286327362060547, -17.790599822998047, -17.294872283935547, -16.799144744873047, -16.303417205810547, -15.80768871307373, -15.31196117401123, -14.816232681274414, -14.320505142211914, -13.824777603149414, -13.329050064086914, -12.833321571350098, -12.337594032287598, -11.841866493225098, -11.346138954162598, -10.850411415100098, -10.354683876037598, -9.858956336975098, -9.363227844238281, -8.867500305175781, -8.371772766113281, -7.876045227050781, -7.380317687988281, -6.884589672088623, -6.388862133026123, -5.893134117126465, -5.397406578063965, -4.901679039001465, -4.405951023101807, -3.9102234840393066, -3.4144957065582275, -2.918768882751465, -2.4230411052703857, -1.9273134469985962, -1.4315857887268066, -0.9358580112457275, -0.44013023376464844, 0.05559730529785156, 0.5513250827789307, 1.0470528602600098, 1.5427806377410889, 2.038508415222168, 2.534235954284668, 3.029963731765747, 3.525691509246826, 4.021419048309326, 4.517147064208984, 5.012874603271484, 5.508602142333984, 6.004330158233643, 6.500057697296143, 6.995785713195801, 7.491513252258301, 7.987240791320801, 8.4829683303833, 8.978696823120117, 9.474424362182617, 9.970151901245117, 10.465879440307617, 10.961607933044434, 11.457335472106934, 11.953063011169434, 12.448790550231934, 12.944518089294434]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 5.0, 6.0, 3.0, 5.0, 13.0, 11.0, 11.0, 12.0, 13.0, 11.0, 18.0, 21.0, 19.0, 21.0, 19.0, 26.0, 27.0, 34.0, 32.0, 32.0, 40.0, 23.0, 39.0, 39.0, 38.0, 37.0, 33.0, 38.0, 37.0, 43.0, 38.0, 37.0, 27.0, 37.0, 21.0, 11.0, 18.0, 20.0, 15.0, 16.0, 14.0, 9.0, 9.0, 8.0, 5.0, 2.0, 5.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.798828125, -2.714263916015625, -2.62969970703125, -2.545135498046875, -2.4605712890625, -2.376007080078125, -2.29144287109375, -2.206878662109375, -2.122314453125, -2.037750244140625, -1.95318603515625, -1.868621826171875, -1.7840576171875, -1.699493408203125, -1.61492919921875, -1.530364990234375, -1.44580078125, -1.361236572265625, -1.27667236328125, -1.192108154296875, -1.1075439453125, -1.022979736328125, -0.93841552734375, -0.853851318359375, -0.769287109375, -0.684722900390625, -0.60015869140625, -0.515594482421875, -0.4310302734375, -0.346466064453125, -0.26190185546875, -0.177337646484375, -0.0927734375, -0.008209228515625, 0.07635498046875, 0.160919189453125, 0.2454833984375, 0.330047607421875, 0.41461181640625, 0.499176025390625, 0.583740234375, 0.668304443359375, 0.75286865234375, 0.837432861328125, 0.9219970703125, 1.006561279296875, 1.09112548828125, 1.175689697265625, 1.26025390625, 1.344818115234375, 1.42938232421875, 1.513946533203125, 1.5985107421875, 1.683074951171875, 1.76763916015625, 1.852203369140625, 1.936767578125, 2.021331787109375, 2.10589599609375, 2.190460205078125, 2.2750244140625, 2.359588623046875, 2.44415283203125, 2.528717041015625, 2.61328125]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 3.0, 7.0, 4.0, 5.0, 4.0, 7.0, 16.0, 6.0, 13.0, 17.0, 19.0, 37.0, 30.0, 49.0, 49.0, 61.0, 77.0, 108.0, 147.0, 146.0, 250.0, 331.0, 467.0, 706.0, 1121.0, 2488.0, 14065.0, 985587.0, 3105949.0, 73612.0, 4378.0, 1508.0, 869.0, 576.0, 410.0, 275.0, 222.0, 161.0, 111.0, 95.0, 61.0, 44.0, 40.0, 32.0, 19.0, 27.0, 20.0, 23.0, 8.0, 7.0, 11.0, 7.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-13.8671875, -13.436767578125, -13.00634765625, -12.575927734375, -12.1455078125, -11.715087890625, -11.28466796875, -10.854248046875, -10.423828125, -9.993408203125, -9.56298828125, -9.132568359375, -8.7021484375, -8.271728515625, -7.84130859375, -7.410888671875, -6.98046875, -6.550048828125, -6.11962890625, -5.689208984375, -5.2587890625, -4.828369140625, -4.39794921875, -3.967529296875, -3.537109375, -3.106689453125, -2.67626953125, -2.245849609375, -1.8154296875, -1.385009765625, -0.95458984375, -0.524169921875, -0.09375, 0.336669921875, 0.76708984375, 1.197509765625, 1.6279296875, 2.058349609375, 2.48876953125, 2.919189453125, 3.349609375, 3.780029296875, 4.21044921875, 4.640869140625, 5.0712890625, 5.501708984375, 5.93212890625, 6.362548828125, 6.79296875, 7.223388671875, 7.65380859375, 8.084228515625, 8.5146484375, 8.945068359375, 9.37548828125, 9.805908203125, 10.236328125, 10.666748046875, 11.09716796875, 11.527587890625, 11.9580078125, 12.388427734375, 12.81884765625, 13.249267578125, 13.6796875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 8.0, 8.0, 21.0, 12.0, 39.0, 67.0, 114.0, 219.0, 343.0, 519.0, 692.0, 683.0, 498.0, 351.0, 208.0, 119.0, 55.0, 42.0, 33.0, 14.0, 9.0, 2.0, 4.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.48046875, -6.24932861328125, -6.0181884765625, -5.78704833984375, -5.555908203125, -5.32476806640625, -5.0936279296875, -4.86248779296875, -4.63134765625, -4.40020751953125, -4.1690673828125, -3.93792724609375, -3.706787109375, -3.47564697265625, -3.2445068359375, -3.01336669921875, -2.7822265625, -2.55108642578125, -2.3199462890625, -2.08880615234375, -1.857666015625, -1.62652587890625, -1.3953857421875, -1.16424560546875, -0.93310546875, -0.70196533203125, -0.4708251953125, -0.23968505859375, -0.008544921875, 0.22259521484375, 0.4537353515625, 0.68487548828125, 0.916015625, 1.14715576171875, 1.3782958984375, 1.60943603515625, 1.840576171875, 2.07171630859375, 2.3028564453125, 2.53399658203125, 2.76513671875, 2.99627685546875, 3.2274169921875, 3.45855712890625, 3.689697265625, 3.92083740234375, 4.1519775390625, 4.38311767578125, 4.6142578125, 4.84539794921875, 5.0765380859375, 5.30767822265625, 5.538818359375, 5.76995849609375, 6.0010986328125, 6.23223876953125, 6.46337890625, 6.69451904296875, 6.9256591796875, 7.15679931640625, 7.387939453125, 7.61907958984375, 7.8502197265625, 8.08135986328125, 8.3125]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 4.0, 6.0, 6.0, 10.0, 13.0, 33.0, 78.0, 159.0, 337.0, 888.0, 2663.0, 12596.0, 203240.0, 3330440.0, 612939.0, 24824.0, 3969.0, 1261.0, 453.0, 176.0, 90.0, 40.0, 23.0, 14.0, 9.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.7421875, -9.46893310546875, -9.1956787109375, -8.92242431640625, -8.649169921875, -8.37591552734375, -8.1026611328125, -7.82940673828125, -7.55615234375, -7.28289794921875, -7.0096435546875, -6.73638916015625, -6.463134765625, -6.18988037109375, -5.9166259765625, -5.64337158203125, -5.3701171875, -5.09686279296875, -4.8236083984375, -4.55035400390625, -4.277099609375, -4.00384521484375, -3.7305908203125, -3.45733642578125, -3.18408203125, -2.91082763671875, -2.6375732421875, -2.36431884765625, -2.091064453125, -1.81781005859375, -1.5445556640625, -1.27130126953125, -0.998046875, -0.72479248046875, -0.4515380859375, -0.17828369140625, 0.094970703125, 0.36822509765625, 0.6414794921875, 0.91473388671875, 1.18798828125, 1.46124267578125, 1.7344970703125, 2.00775146484375, 2.281005859375, 2.55426025390625, 2.8275146484375, 3.10076904296875, 3.3740234375, 3.64727783203125, 3.9205322265625, 4.19378662109375, 4.467041015625, 4.74029541015625, 5.0135498046875, 5.28680419921875, 5.56005859375, 5.83331298828125, 6.1065673828125, 6.37982177734375, 6.653076171875, 6.92633056640625, 7.1995849609375, 7.47283935546875, 7.74609375]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 4.0, 0.0, 2.0, 1.0, 4.0, 12.0, 17.0, 20.0, 32.0, 39.0, 47.0, 77.0, 93.0, 81.0, 100.0, 99.0, 84.0, 74.0, 61.0, 55.0, 30.0, 27.0, 20.0, 10.0, 7.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.791250228881836, -22.712310791015625, -21.63336944580078, -20.55443000793457, -19.475488662719727, -18.396549224853516, -17.317607879638672, -16.23866844177246, -15.159728050231934, -14.080787658691406, -13.001847267150879, -11.922906875610352, -10.84396743774414, -9.765026092529297, -8.686086654663086, -7.607146263122559, -6.528205871582031, -5.449265480041504, -4.370325088500977, -3.2913851737976074, -2.21244478225708, -1.1335043907165527, -0.054564476013183594, 1.0243759155273438, 2.103316307067871, 3.1822566986083984, 4.261197090148926, 5.340137004852295, 6.419077396392822, 7.49801778793335, 8.576957702636719, 9.655898094177246, 10.73483657836914, 11.813776969909668, 12.892717361450195, 13.971656799316406, 15.05059814453125, 16.12953758239746, 17.208477020263672, 18.287418365478516, 19.36635971069336, 20.44529914855957, 21.524240493774414, 22.603179931640625, 23.68212127685547, 24.76106071472168, 25.84000015258789, 26.918941497802734, 27.997880935668945, 29.076820373535156, 30.15576171875, 31.23470115661621, 32.31364059448242, 33.392581939697266, 34.47152328491211, 35.55046081542969, 36.62940216064453, 37.708343505859375, 38.78728103637695, 39.8662223815918, 40.94516372680664, 42.024105072021484, 43.10304260253906, 44.181983947753906, 45.26092529296875]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 6.0, 3.0, 6.0, 7.0, 3.0, 7.0, 11.0, 14.0, 12.0, 16.0, 11.0, 22.0, 24.0, 24.0, 25.0, 31.0, 34.0, 29.0, 32.0, 42.0, 40.0, 36.0, 33.0, 31.0, 51.0, 31.0, 45.0, 43.0, 29.0, 32.0, 36.0, 32.0, 27.0, 28.0, 19.0, 21.0, 23.0, 14.0, 9.0, 13.0, 12.0, 14.0, 5.0, 4.0, 6.0, 3.0, 5.0, 1.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-17.31160545349121, -16.7670841217041, -16.222562789916992, -15.678041458129883, -15.133520126342773, -14.588998794555664, -14.044477462768555, -13.499956130981445, -12.955434799194336, -12.410913467407227, -11.866392135620117, -11.321870803833008, -10.777349472045898, -10.232828140258789, -9.68830680847168, -9.14378547668457, -8.599264144897461, -8.054742813110352, -7.510221481323242, -6.965700149536133, -6.421178817749023, -5.876657485961914, -5.332136154174805, -4.787614822387695, -4.243093490600586, -3.6985721588134766, -3.154050827026367, -2.609529495239258, -2.0650081634521484, -1.520486831665039, -0.9759654998779297, -0.4314441680908203, 0.11307525634765625, 0.6575965881347656, 1.202117919921875, 1.7466392517089844, 2.2911605834960938, 2.835681915283203, 3.3802032470703125, 3.924724578857422, 4.469245910644531, 5.013767242431641, 5.55828857421875, 6.102809906005859, 6.647331237792969, 7.191852569580078, 7.7363739013671875, 8.280895233154297, 8.825416564941406, 9.369937896728516, 9.914459228515625, 10.458980560302734, 11.003501892089844, 11.548023223876953, 12.092544555664062, 12.637065887451172, 13.181587219238281, 13.72610855102539, 14.2706298828125, 14.81515121459961, 15.359672546386719, 15.904193878173828, 16.448715209960938, 16.993236541748047, 17.537757873535156]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 3.0, 6.0, 2.0, 4.0, 14.0, 11.0, 15.0, 18.0, 17.0, 15.0, 14.0, 29.0, 23.0, 33.0, 22.0, 45.0, 36.0, 29.0, 37.0, 45.0, 40.0, 57.0, 40.0, 31.0, 51.0, 58.0, 23.0, 32.0, 34.0, 30.0, 28.0, 19.0, 21.0, 28.0, 11.0, 13.0, 9.0, 7.0, 16.0, 4.0, 9.0, 6.0, 5.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.921875, -26.943603515625, -25.96533203125, -24.987060546875, -24.0087890625, -23.030517578125, -22.05224609375, -21.073974609375, -20.095703125, -19.117431640625, -18.13916015625, -17.160888671875, -16.1826171875, -15.204345703125, -14.22607421875, -13.247802734375, -12.26953125, -11.291259765625, -10.31298828125, -9.334716796875, -8.3564453125, -7.378173828125, -6.39990234375, -5.421630859375, -4.443359375, -3.465087890625, -2.48681640625, -1.508544921875, -0.5302734375, 0.447998046875, 1.42626953125, 2.404541015625, 3.3828125, 4.361083984375, 5.33935546875, 6.317626953125, 7.2958984375, 8.274169921875, 9.25244140625, 10.230712890625, 11.208984375, 12.187255859375, 13.16552734375, 14.143798828125, 15.1220703125, 16.100341796875, 17.07861328125, 18.056884765625, 19.03515625, 20.013427734375, 20.99169921875, 21.969970703125, 22.9482421875, 23.926513671875, 24.90478515625, 25.883056640625, 26.861328125, 27.839599609375, 28.81787109375, 29.796142578125, 30.7744140625, 31.752685546875, 32.73095703125, 33.709228515625, 34.6875]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 8.0, 14.0, 17.0, 28.0, 48.0, 66.0, 110.0, 165.0, 249.0, 463.0, 669.0, 922.0, 1391.0, 2345.0, 3662.0, 5468.0, 8726.0, 14063.0, 23602.0, 40258.0, 73807.0, 147554.0, 302451.0, 200865.0, 96261.0, 50466.0, 28794.0, 17190.0, 10479.0, 6676.0, 4060.0, 2702.0, 1822.0, 1092.0, 715.0, 499.0, 302.0, 179.0, 118.0, 87.0, 63.0, 28.0, 30.0, 23.0, 10.0, 8.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.87890625, -5.6990966796875, -5.519287109375, -5.3394775390625, -5.15966796875, -4.9798583984375, -4.800048828125, -4.6202392578125, -4.4404296875, -4.2606201171875, -4.080810546875, -3.9010009765625, -3.72119140625, -3.5413818359375, -3.361572265625, -3.1817626953125, -3.001953125, -2.8221435546875, -2.642333984375, -2.4625244140625, -2.28271484375, -2.1029052734375, -1.923095703125, -1.7432861328125, -1.5634765625, -1.3836669921875, -1.203857421875, -1.0240478515625, -0.84423828125, -0.6644287109375, -0.484619140625, -0.3048095703125, -0.125, 0.0548095703125, 0.234619140625, 0.4144287109375, 0.59423828125, 0.7740478515625, 0.953857421875, 1.1336669921875, 1.3134765625, 1.4932861328125, 1.673095703125, 1.8529052734375, 2.03271484375, 2.2125244140625, 2.392333984375, 2.5721435546875, 2.751953125, 2.9317626953125, 3.111572265625, 3.2913818359375, 3.47119140625, 3.6510009765625, 3.830810546875, 4.0106201171875, 4.1904296875, 4.3702392578125, 4.550048828125, 4.7298583984375, 4.90966796875, 5.0894775390625, 5.269287109375, 5.4490966796875, 5.62890625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 3.0, 6.0, 4.0, 11.0, 6.0, 4.0, 12.0, 17.0, 18.0, 21.0, 16.0, 22.0, 29.0, 29.0, 29.0, 34.0, 39.0, 34.0, 46.0, 33.0, 48.0, 1068.0, 49.0, 40.0, 43.0, 36.0, 43.0, 28.0, 34.0, 36.0, 29.0, 19.0, 25.0, 22.0, 17.0, 17.0, 13.0, 9.0, 6.0, 5.0, 7.0, 6.0, 8.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.34375, -20.691650390625, -20.03955078125, -19.387451171875, -18.7353515625, -18.083251953125, -17.43115234375, -16.779052734375, -16.126953125, -15.474853515625, -14.82275390625, -14.170654296875, -13.5185546875, -12.866455078125, -12.21435546875, -11.562255859375, -10.91015625, -10.258056640625, -9.60595703125, -8.953857421875, -8.3017578125, -7.649658203125, -6.99755859375, -6.345458984375, -5.693359375, -5.041259765625, -4.38916015625, -3.737060546875, -3.0849609375, -2.432861328125, -1.78076171875, -1.128662109375, -0.4765625, 0.175537109375, 0.82763671875, 1.479736328125, 2.1318359375, 2.783935546875, 3.43603515625, 4.088134765625, 4.740234375, 5.392333984375, 6.04443359375, 6.696533203125, 7.3486328125, 8.000732421875, 8.65283203125, 9.304931640625, 9.95703125, 10.609130859375, 11.26123046875, 11.913330078125, 12.5654296875, 13.217529296875, 13.86962890625, 14.521728515625, 15.173828125, 15.825927734375, 16.47802734375, 17.130126953125, 17.7822265625, 18.434326171875, 19.08642578125, 19.738525390625, 20.390625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 8.0, 8.0, 16.0, 23.0, 35.0, 49.0, 55.0, 99.0, 162.0, 217.0, 321.0, 508.0, 687.0, 1065.0, 1579.0, 2322.0, 3660.0, 5395.0, 8166.0, 12834.0, 20597.0, 33534.0, 56769.0, 105535.0, 227770.0, 1324464.0, 123657.0, 66084.0, 37531.0, 22742.0, 14414.0, 9000.0, 5921.0, 3851.0, 2562.0, 1796.0, 1213.0, 833.0, 537.0, 368.0, 249.0, 176.0, 112.0, 69.0, 49.0, 29.0, 25.0, 18.0, 5.0, 10.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-5.9609375, -5.78094482421875, -5.6009521484375, -5.42095947265625, -5.240966796875, -5.06097412109375, -4.8809814453125, -4.70098876953125, -4.52099609375, -4.34100341796875, -4.1610107421875, -3.98101806640625, -3.801025390625, -3.62103271484375, -3.4410400390625, -3.26104736328125, -3.0810546875, -2.90106201171875, -2.7210693359375, -2.54107666015625, -2.361083984375, -2.18109130859375, -2.0010986328125, -1.82110595703125, -1.64111328125, -1.46112060546875, -1.2811279296875, -1.10113525390625, -0.921142578125, -0.74114990234375, -0.5611572265625, -0.38116455078125, -0.201171875, -0.02117919921875, 0.1588134765625, 0.33880615234375, 0.518798828125, 0.69879150390625, 0.8787841796875, 1.05877685546875, 1.23876953125, 1.41876220703125, 1.5987548828125, 1.77874755859375, 1.958740234375, 2.13873291015625, 2.3187255859375, 2.49871826171875, 2.6787109375, 2.85870361328125, 3.0386962890625, 3.21868896484375, 3.398681640625, 3.57867431640625, 3.7586669921875, 3.93865966796875, 4.11865234375, 4.29864501953125, 4.4786376953125, 4.65863037109375, 4.838623046875, 5.01861572265625, 5.1986083984375, 5.37860107421875, 5.55859375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 6.0, 12.0, 17.0, 16.0, 26.0, 19.0, 35.0, 36.0, 45.0, 53.0, 52.0, 55.0, 64.0, 79.0, 77.0, 71.0, 51.0, 49.0, 42.0, 42.0, 27.0, 23.0, 21.0, 9.0, 12.0, 16.0, 10.0, 8.0, 6.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00528717041015625, -0.005140960216522217, -0.004994750022888184, -0.00484853982925415, -0.004702329635620117, -0.004556119441986084, -0.004409909248352051, -0.004263699054718018, -0.004117488861083984, -0.003971278667449951, -0.003825068473815918, -0.0036788582801818848, -0.0035326480865478516, -0.0033864378929138184, -0.003240227699279785, -0.003094017505645752, -0.0029478073120117188, -0.0028015971183776855, -0.0026553869247436523, -0.002509176731109619, -0.002362966537475586, -0.0022167563438415527, -0.0020705461502075195, -0.0019243359565734863, -0.0017781257629394531, -0.00163191556930542, -0.0014857053756713867, -0.0013394951820373535, -0.0011932849884033203, -0.0010470747947692871, -0.0009008646011352539, -0.0007546544075012207, -0.0006084442138671875, -0.0004622340202331543, -0.0003160238265991211, -0.0001698136329650879, -2.3603439331054688e-05, 0.00012260675430297852, 0.0002688169479370117, 0.0004150271415710449, 0.0005612373352050781, 0.0007074475288391113, 0.0008536577224731445, 0.0009998679161071777, 0.001146078109741211, 0.0012922883033752441, 0.0014384984970092773, 0.0015847086906433105, 0.0017309188842773438, 0.001877129077911377, 0.00202333927154541, 0.0021695494651794434, 0.0023157596588134766, 0.0024619698524475098, 0.002608180046081543, 0.002754390239715576, 0.0029006004333496094, 0.0030468106269836426, 0.0031930208206176758, 0.003339231014251709, 0.003485441207885742, 0.0036316514015197754, 0.0037778615951538086, 0.003924071788787842, 0.004070281982421875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 6.0, 15.0, 14.0, 16.0, 22.0, 23.0, 31.0, 54.0, 72.0, 91.0, 126.0, 171.0, 321.0, 482.0, 872.0, 1811.0, 4464.0, 14140.0, 55196.0, 235312.0, 466138.0, 201889.0, 47090.0, 12188.0, 4105.0, 1719.0, 794.0, 490.0, 279.0, 197.0, 116.0, 91.0, 60.0, 41.0, 34.0, 18.0, 16.0, 16.0, 6.0, 8.0, 4.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0227508544921875, -0.021978139877319336, -0.021205425262451172, -0.020432710647583008, -0.019659996032714844, -0.01888728141784668, -0.018114566802978516, -0.01734185218811035, -0.016569137573242188, -0.015796422958374023, -0.01502370834350586, -0.014250993728637695, -0.013478279113769531, -0.012705564498901367, -0.011932849884033203, -0.011160135269165039, -0.010387420654296875, -0.009614706039428711, -0.008841991424560547, -0.008069276809692383, -0.007296562194824219, -0.006523847579956055, -0.005751132965087891, -0.0049784183502197266, -0.0042057037353515625, -0.0034329891204833984, -0.0026602745056152344, -0.0018875598907470703, -0.0011148452758789062, -0.0003421306610107422, 0.0004305839538574219, 0.001203298568725586, 0.00197601318359375, 0.002748727798461914, 0.003521442413330078, 0.004294157028198242, 0.005066871643066406, 0.00583958625793457, 0.006612300872802734, 0.0073850154876708984, 0.008157730102539062, 0.008930444717407227, 0.00970315933227539, 0.010475873947143555, 0.011248588562011719, 0.012021303176879883, 0.012794017791748047, 0.013566732406616211, 0.014339447021484375, 0.015112161636352539, 0.015884876251220703, 0.016657590866088867, 0.01743030548095703, 0.018203020095825195, 0.01897573471069336, 0.019748449325561523, 0.020521163940429688, 0.02129387855529785, 0.022066593170166016, 0.02283930778503418, 0.023612022399902344, 0.024384737014770508, 0.025157451629638672, 0.025930166244506836, 0.026702880859375]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 11.0, 11.0, 19.0, 32.0, 48.0, 68.0, 94.0, 100.0, 120.0, 101.0, 109.0, 78.0, 64.0, 34.0, 40.0, 29.0, 21.0, 7.0, 7.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.005841652862727642, -0.00570902181789279, -0.005576390773057938, -0.005443759728223085, -0.005311128683388233, -0.005178498104214668, -0.005045866593718529, -0.004913236014544964, -0.004780604969710112, -0.004647973924875259, -0.004515342880040407, -0.004382711835205555, -0.004250080790370703, -0.0041174497455358505, -0.003984819166362286, -0.0038521878886967897, -0.0037195568438619375, -0.0035869257990270853, -0.003454294754192233, -0.0033216639421880245, -0.0031890328973531723, -0.00305640185251832, -0.002923770807683468, -0.0027911397628486156, -0.0026585087180137634, -0.002525877673178911, -0.002393246628344059, -0.0022606155835092068, -0.002127984771504998, -0.001995353726670146, -0.0018627226818352938, -0.0017300916370004416, -0.0015974610578268766, -0.0014648300129920244, -0.001332199084572494, -0.0011995680397376418, -0.0010669371113181114, -0.0009343060664832592, -0.000801675021648407, -0.0006690440350212157, -0.0005364130483940244, -0.00040378206176683307, -0.0002711510460358113, -0.00013852003030478954, -5.889043677598238e-06, 0.00012674194294959307, 0.0002593729877844453, 0.0003920039744116366, 0.0005246349610388279, 0.0006572659476660192, 0.0007898969342932105, 0.0009225279791280627, 0.0010551589075475931, 0.0011877899523824453, 0.0013204209972172976, 0.0014530520420521498, 0.0015856829704716802, 0.0017183140153065324, 0.0018509449437260628, 0.001983575988560915, 0.002116207033395767, 0.0022488380782306194, 0.0023814691230654716, 0.00251409993506968, 0.0026467309799045324]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 4.0, 6.0, 2.0, 9.0, 6.0, 9.0, 13.0, 16.0, 13.0, 24.0, 21.0, 23.0, 29.0, 29.0, 36.0, 23.0, 42.0, 51.0, 36.0, 40.0, 34.0, 28.0, 28.0, 42.0, 38.0, 40.0, 39.0, 31.0, 31.0, 29.0, 22.0, 36.0, 32.0, 19.0, 23.0, 14.0, 15.0, 14.0, 11.0, 13.0, 9.0, 8.0, 5.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0], "bins": [-0.002259373664855957, -0.002196243032813072, -0.0021331124007701874, -0.0020699817687273026, -0.0020068511366844177, -0.001943720504641533, -0.001880589872598648, -0.0018174592405557632, -0.0017543286085128784, -0.0016911979764699936, -0.0016280673444271088, -0.001564936712384224, -0.0015018060803413391, -0.0014386754482984543, -0.0013755448162555695, -0.0013124141842126846, -0.0012492835521697998, -0.001186152920126915, -0.0011230222880840302, -0.0010598916560411453, -0.0009967610239982605, -0.0009336303919553757, -0.0008704997599124908, -0.000807369127869606, -0.0007442384958267212, -0.0006811078637838364, -0.0006179772317409515, -0.0005548465996980667, -0.0004917159676551819, -0.00042858533561229706, -0.00036545470356941223, -0.0003023240715265274, -0.00023919343948364258, -0.00017606280744075775, -0.00011293217539787292, -4.98015433549881e-05, 1.3329088687896729e-05, 7.645972073078156e-05, 0.00013959035277366638, 0.0002027209848165512, 0.00026585161685943604, 0.00032898224890232086, 0.0003921128809452057, 0.0004552435129880905, 0.0005183741450309753, 0.0005815047770738602, 0.000644635409116745, 0.0007077660411596298, 0.0007708966732025146, 0.0008340273052453995, 0.0008971579372882843, 0.0009602885693311691, 0.001023419201374054, 0.0010865498334169388, 0.0011496804654598236, 0.0012128110975027084, 0.0012759417295455933, 0.001339072361588478, 0.001402202993631363, 0.0014653336256742477, 0.0015284642577171326, 0.0015915948897600174, 0.0016547255218029022, 0.001717856153845787, 0.0017809867858886719]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 3.0, 6.0, 2.0, 4.0, 14.0, 11.0, 15.0, 18.0, 17.0, 15.0, 14.0, 29.0, 23.0, 33.0, 22.0, 45.0, 36.0, 29.0, 36.0, 47.0, 39.0, 56.0, 41.0, 31.0, 52.0, 57.0, 23.0, 32.0, 34.0, 30.0, 28.0, 19.0, 21.0, 28.0, 11.0, 13.0, 9.0, 7.0, 16.0, 4.0, 9.0, 6.0, 5.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.921875, -26.943603515625, -25.96533203125, -24.987060546875, -24.0087890625, -23.030517578125, -22.05224609375, -21.073974609375, -20.095703125, -19.117431640625, -18.13916015625, -17.160888671875, -16.1826171875, -15.204345703125, -14.22607421875, -13.247802734375, -12.26953125, -11.291259765625, -10.31298828125, -9.334716796875, -8.3564453125, -7.378173828125, -6.39990234375, -5.421630859375, -4.443359375, -3.465087890625, -2.48681640625, -1.508544921875, -0.5302734375, 0.447998046875, 1.42626953125, 2.404541015625, 3.3828125, 4.361083984375, 5.33935546875, 6.317626953125, 7.2958984375, 8.274169921875, 9.25244140625, 10.230712890625, 11.208984375, 12.187255859375, 13.16552734375, 14.143798828125, 15.1220703125, 16.100341796875, 17.07861328125, 18.056884765625, 19.03515625, 20.013427734375, 20.99169921875, 21.969970703125, 22.9482421875, 23.926513671875, 24.90478515625, 25.883056640625, 26.861328125, 27.839599609375, 28.81787109375, 29.796142578125, 30.7744140625, 31.752685546875, 32.73095703125, 33.709228515625, 34.6875]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 0.0, 2.0, 2.0, 5.0, 12.0, 14.0, 17.0, 22.0, 24.0, 34.0, 46.0, 76.0, 91.0, 145.0, 192.0, 310.0, 489.0, 731.0, 1219.0, 2363.0, 4613.0, 11635.0, 36784.0, 143490.0, 445502.0, 290560.0, 74457.0, 20669.0, 7377.0, 3242.0, 1744.0, 948.0, 546.0, 352.0, 269.0, 149.0, 113.0, 84.0, 48.0, 35.0, 38.0, 24.0, 12.0, 13.0, 17.0, 14.0, 12.0, 5.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0], "bins": [-5.7578125, -5.5872802734375, -5.416748046875, -5.2462158203125, -5.07568359375, -4.9051513671875, -4.734619140625, -4.5640869140625, -4.3935546875, -4.2230224609375, -4.052490234375, -3.8819580078125, -3.71142578125, -3.5408935546875, -3.370361328125, -3.1998291015625, -3.029296875, -2.8587646484375, -2.688232421875, -2.5177001953125, -2.34716796875, -2.1766357421875, -2.006103515625, -1.8355712890625, -1.6650390625, -1.4945068359375, -1.323974609375, -1.1534423828125, -0.98291015625, -0.8123779296875, -0.641845703125, -0.4713134765625, -0.30078125, -0.1302490234375, 0.040283203125, 0.2108154296875, 0.38134765625, 0.5518798828125, 0.722412109375, 0.8929443359375, 1.0634765625, 1.2340087890625, 1.404541015625, 1.5750732421875, 1.74560546875, 1.9161376953125, 2.086669921875, 2.2572021484375, 2.427734375, 2.5982666015625, 2.768798828125, 2.9393310546875, 3.10986328125, 3.2803955078125, 3.450927734375, 3.6214599609375, 3.7919921875, 3.9625244140625, 4.133056640625, 4.3035888671875, 4.47412109375, 4.6446533203125, 4.815185546875, 4.9857177734375, 5.15625]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 7.0, 6.0, 11.0, 14.0, 8.0, 14.0, 23.0, 29.0, 33.0, 52.0, 59.0, 58.0, 79.0, 83.0, 2109.0, 86.0, 59.0, 57.0, 57.0, 44.0, 35.0, 26.0, 25.0, 25.0, 15.0, 10.0, 9.0, 6.0, 13.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-77.3125, -75.005859375, -72.69921875, -70.392578125, -68.0859375, -65.779296875, -63.47265625, -61.166015625, -58.859375, -56.552734375, -54.24609375, -51.939453125, -49.6328125, -47.326171875, -45.01953125, -42.712890625, -40.40625, -38.099609375, -35.79296875, -33.486328125, -31.1796875, -28.873046875, -26.56640625, -24.259765625, -21.953125, -19.646484375, -17.33984375, -15.033203125, -12.7265625, -10.419921875, -8.11328125, -5.806640625, -3.5, -1.193359375, 1.11328125, 3.419921875, 5.7265625, 8.033203125, 10.33984375, 12.646484375, 14.953125, 17.259765625, 19.56640625, 21.873046875, 24.1796875, 26.486328125, 28.79296875, 31.099609375, 33.40625, 35.712890625, 38.01953125, 40.326171875, 42.6328125, 44.939453125, 47.24609375, 49.552734375, 51.859375, 54.166015625, 56.47265625, 58.779296875, 61.0859375, 63.392578125, 65.69921875, 68.005859375, 70.3125]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 7.0, 8.0, 4.0, 8.0, 10.0, 15.0, 24.0, 28.0, 37.0, 42.0, 70.0, 100.0, 112.0, 213.0, 276.0, 383.0, 690.0, 1203.0, 2927.0, 13283.0, 159533.0, 2840473.0, 110032.0, 10586.0, 2629.0, 1151.0, 610.0, 364.0, 275.0, 155.0, 129.0, 95.0, 66.0, 41.0, 35.0, 25.0, 16.0, 20.0, 7.0, 7.0, 6.0, 1.0, 5.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.015625, -9.6865234375, -9.357421875, -9.0283203125, -8.69921875, -8.3701171875, -8.041015625, -7.7119140625, -7.3828125, -7.0537109375, -6.724609375, -6.3955078125, -6.06640625, -5.7373046875, -5.408203125, -5.0791015625, -4.75, -4.4208984375, -4.091796875, -3.7626953125, -3.43359375, -3.1044921875, -2.775390625, -2.4462890625, -2.1171875, -1.7880859375, -1.458984375, -1.1298828125, -0.80078125, -0.4716796875, -0.142578125, 0.1865234375, 0.515625, 0.8447265625, 1.173828125, 1.5029296875, 1.83203125, 2.1611328125, 2.490234375, 2.8193359375, 3.1484375, 3.4775390625, 3.806640625, 4.1357421875, 4.46484375, 4.7939453125, 5.123046875, 5.4521484375, 5.78125, 6.1103515625, 6.439453125, 6.7685546875, 7.09765625, 7.4267578125, 7.755859375, 8.0849609375, 8.4140625, 8.7431640625, 9.072265625, 9.4013671875, 9.73046875, 10.0595703125, 10.388671875, 10.7177734375, 11.046875]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 4.0, 5.0, 10.0, 14.0, 39.0, 76.0, 174.0, 246.0, 193.0, 118.0, 53.0, 28.0, 10.0, 9.0, 11.0, 4.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-117.93960571289062, -114.4190902709961, -110.89857482910156, -107.37805938720703, -103.8575439453125, -100.33702850341797, -96.81651306152344, -93.2959976196289, -89.77548217773438, -86.25496673583984, -82.73445129394531, -79.21393585205078, -75.69342041015625, -72.17290496826172, -68.65238952636719, -65.13187408447266, -61.611358642578125, -58.090843200683594, -54.57032775878906, -51.04981231689453, -47.529296875, -44.00878143310547, -40.48826599121094, -36.967750549316406, -33.447235107421875, -29.926719665527344, -26.406204223632812, -22.88568878173828, -19.36517333984375, -15.844657897949219, -12.324142456054688, -8.803627014160156, -5.283103942871094, -1.7625885009765625, 1.7579269409179688, 5.2784423828125, 8.798957824707031, 12.319473266601562, 15.839988708496094, 19.360504150390625, 22.881019592285156, 26.401535034179688, 29.92205047607422, 33.44256591796875, 36.96308135986328, 40.48359680175781, 44.004112243652344, 47.524627685546875, 51.045143127441406, 54.56565856933594, 58.08617401123047, 61.606689453125, 65.12720489501953, 68.64772033691406, 72.1682357788086, 75.68875122070312, 79.20926666259766, 82.72978210449219, 86.25029754638672, 89.77081298828125, 93.29132843017578, 96.81184387207031, 100.33235931396484, 103.85287475585938, 107.3733901977539]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 2.0, 6.0, 4.0, 12.0, 7.0, 12.0, 21.0, 14.0, 18.0, 30.0, 34.0, 32.0, 23.0, 50.0, 39.0, 38.0, 48.0, 49.0, 59.0, 40.0, 48.0, 55.0, 44.0, 45.0, 41.0, 33.0, 37.0, 36.0, 22.0, 25.0, 21.0, 10.0, 12.0, 6.0, 6.0, 9.0, 6.0, 7.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.462646484375, -57.190391540527344, -54.91813659667969, -52.6458854675293, -50.37363052368164, -48.101375579833984, -45.829124450683594, -43.55686950683594, -41.28461456298828, -39.012359619140625, -36.74010467529297, -34.46785354614258, -32.19559860229492, -29.923343658447266, -27.651090621948242, -25.37883758544922, -23.106582641601562, -20.834327697753906, -18.562074661254883, -16.28982162475586, -14.017566680908203, -11.745312690734863, -9.473058700561523, -7.200804710388184, -4.928550720214844, -2.656296730041504, -0.38404273986816406, 1.8882112503051758, 4.160465240478516, 6.4327192306518555, 8.704973220825195, 10.977227210998535, 13.249481201171875, 15.521735191345215, 17.793989181518555, 20.066242218017578, 22.338497161865234, 24.61075210571289, 26.883005142211914, 29.155258178710938, 31.427513122558594, 33.69976806640625, 35.972023010253906, 38.2442741394043, 40.51652908325195, 42.78878402709961, 45.06103515625, 47.333290100097656, 49.60554504394531, 51.87779998779297, 54.150054931640625, 56.422306060791016, 58.69456100463867, 60.96681594848633, 63.23906707763672, 65.51132202148438, 67.78357696533203, 70.05583190917969, 72.32808685302734, 74.600341796875, 76.87258911132812, 79.14484405517578, 81.41709899902344, 83.6893539428711, 85.96160888671875]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 11.0, 9.0, 16.0, 17.0, 18.0, 22.0, 40.0, 60.0, 81.0, 132.0, 166.0, 237.0, 369.0, 577.0, 812.0, 1174.0, 1797.0, 2694.0, 3717.0, 5189.0, 1006721.0, 7955.0, 5121.0, 3672.0, 2548.0, 1716.0, 1237.0, 764.0, 517.0, 348.0, 219.0, 173.0, 105.0, 90.0, 51.0, 48.0, 39.0, 21.0, 24.0, 11.0, 4.0, 7.0, 6.0, 8.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0], "bins": [-11.675667762756348, -11.31039047241211, -10.945112228393555, -10.579834938049316, -10.214557647705078, -9.849279403686523, -9.484002113342285, -9.118724822998047, -8.753446578979492, -8.388169288635254, -8.0228910446167, -7.657613754272461, -7.2923359870910645, -6.927058219909668, -6.56178092956543, -6.196503162384033, -5.831225395202637, -5.46594762802124, -5.100669860839844, -4.7353925704956055, -4.370114803314209, -4.0048370361328125, -3.639559507369995, -3.2742819786071777, -2.9090042114257812, -2.5437264442443848, -2.1784489154815674, -1.8131712675094604, -1.4478936195373535, -1.0826159715652466, -0.7173383235931396, -0.35206079483032227, 0.013217926025390625, 0.37849557399749756, 0.7437732219696045, 1.1090508699417114, 1.4743285179138184, 1.8396061658859253, 2.2048838138580322, 2.5701613426208496, 2.935439109802246, 3.3007168769836426, 3.66599440574646, 4.031271934509277, 4.396549701690674, 4.76182746887207, 5.127104759216309, 5.492382526397705, 5.857660293579102, 6.222938060760498, 6.5882158279418945, 6.953493118286133, 7.318770885467529, 7.684048652648926, 8.049325942993164, 8.414604187011719, 8.779881477355957, 9.145158767700195, 9.51043701171875, 9.875714302062988, 10.240991592407227, 10.606269836425781, 10.97154712677002, 11.336824417114258, 11.702102661132812]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 10.0, 12.0, 27.0, 52.0, 124.0, 158.0, 10998.0, 51452148.0, 182.0, 66.0, 58.0, 57.0, 31.0, 26.0, 11.0, 7.0, 5.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5163.12060546875, -5030.8798828125, -4898.63916015625, -4766.39794921875, -4634.1572265625, -4501.91650390625, -4369.67578125, -4237.4345703125, -4105.19384765625, -3972.953125, -3840.712158203125, -3708.471435546875, -3576.23046875, -3443.98974609375, -3311.7490234375, -3179.508056640625, -3047.267333984375, -2915.026611328125, -2782.78564453125, -2650.544921875, -2518.303955078125, -2386.063232421875, -2253.822265625, -2121.58154296875, -1989.3406982421875, -1857.099853515625, -1724.8590087890625, -1592.6181640625, -1460.37744140625, -1328.136474609375, -1195.895751953125, -1063.6549072265625, -931.414306640625, -799.1734619140625, -666.9326171875, -534.6918334960938, -402.45098876953125, -270.21014404296875, -137.9693603515625, -5.728515625, 126.5123291015625, 258.753173828125, 390.9939880371094, 523.2348022460938, 655.4756469726562, 787.7164916992188, 919.957275390625, 1052.1981201171875, 1184.43896484375, 1316.6798095703125, 1448.920654296875, 1581.161376953125, 1713.40234375, 1845.64306640625, 1977.8839111328125, 2110.124755859375, 2242.36572265625, 2374.6064453125, 2506.847412109375, 2639.088134765625, 2771.3291015625, 2903.56982421875, 3035.810546875, 3168.051513671875, 3300.292236328125]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [8.0, 4.0, 10.0, 15.0, 5.0, 21.0, 39.0, 59.0, 57.0, 110.0, 148.0, 231.0, 354.0, 476.0, 572.0, 768.0, 1119.0, 1700.0, 2510.0, 3661.0, 5277.0, 7544.0, 11175.0, 16182.0, 24880.0, 37421.0, 58824.0, 92086.0, 151729.0, 264004.0, 613418.0, 3900479.0, 481774.0, 233173.0, 137599.0, 84448.0, 54087.0, 34462.0, 22789.0, 14861.0, 10542.0, 6893.0, 4675.0, 3500.0, 2409.0, 1515.0, 1135.0, 811.0, 574.0, 405.0, 303.0, 198.0, 134.0, 80.0, 61.0, 33.0, 29.0, 28.0, 20.0, 11.0, 12.0, 3.0, 1.0, 5.0], "bins": [-2.548828125, -2.4676513671875, -2.386474609375, -2.3052978515625, -2.22412109375, -2.1429443359375, -2.061767578125, -1.9805908203125, -1.8994140625, -1.8182373046875, -1.737060546875, -1.6558837890625, -1.57470703125, -1.4935302734375, -1.412353515625, -1.3311767578125, -1.25, -1.1688232421875, -1.087646484375, -1.0064697265625, -0.92529296875, -0.8441162109375, -0.762939453125, -0.6817626953125, -0.6005859375, -0.5194091796875, -0.438232421875, -0.3570556640625, -0.27587890625, -0.1947021484375, -0.113525390625, -0.0323486328125, 0.048828125, 0.1300048828125, 0.211181640625, 0.2923583984375, 0.37353515625, 0.4547119140625, 0.535888671875, 0.6170654296875, 0.6982421875, 0.7794189453125, 0.860595703125, 0.9417724609375, 1.02294921875, 1.1041259765625, 1.185302734375, 1.2664794921875, 1.34765625, 1.4288330078125, 1.510009765625, 1.5911865234375, 1.67236328125, 1.7535400390625, 1.834716796875, 1.9158935546875, 1.9970703125, 2.0782470703125, 2.159423828125, 2.2406005859375, 2.32177734375, 2.4029541015625, 2.484130859375, 2.5653076171875, 2.646484375]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 2.0, 8.0, 7.0, 3.0, 9.0, 9.0, 7.0, 14.0, 14.0, 20.0, 26.0, 29.0, 34.0, 37.0, 34.0, 35.0, 43.0, 40.0, 42.0, 81.0, 366.0, 580.0, 124.0, 53.0, 54.0, 43.0, 38.0, 26.0, 32.0, 34.0, 21.0, 27.0, 29.0, 13.0, 15.0, 18.0, 12.0, 5.0, 7.0, 8.0, 7.0, 8.0, 7.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.88671875, -6.66534423828125, -6.4439697265625, -6.22259521484375, -6.001220703125, -5.77984619140625, -5.5584716796875, -5.33709716796875, -5.11572265625, -4.89434814453125, -4.6729736328125, -4.45159912109375, -4.230224609375, -4.00885009765625, -3.7874755859375, -3.56610107421875, -3.3447265625, -3.12335205078125, -2.9019775390625, -2.68060302734375, -2.459228515625, -2.23785400390625, -2.0164794921875, -1.79510498046875, -1.57373046875, -1.35235595703125, -1.1309814453125, -0.90960693359375, -0.688232421875, -0.46685791015625, -0.2454833984375, -0.02410888671875, 0.197265625, 0.41864013671875, 0.6400146484375, 0.86138916015625, 1.082763671875, 1.30413818359375, 1.5255126953125, 1.74688720703125, 1.96826171875, 2.18963623046875, 2.4110107421875, 2.63238525390625, 2.853759765625, 3.07513427734375, 3.2965087890625, 3.51788330078125, 3.7392578125, 3.96063232421875, 4.1820068359375, 4.40338134765625, 4.624755859375, 4.84613037109375, 5.0675048828125, 5.28887939453125, 5.51025390625, 5.73162841796875, 5.9530029296875, 6.17437744140625, 6.395751953125, 6.61712646484375, 6.8385009765625, 7.05987548828125, 7.28125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [9.0, 0.0, 0.0, 12.0, 19.0, 14.0, 27.0, 19.0, 33.0, 62.0, 32.0, 71.0, 159.0, 175.0, 219.0, 311.0, 532.0, 678.0, 1058.0, 1566.0, 2353.0, 3170.0, 4743.0, 7200.0, 11652.0, 18402.0, 29579.0, 47705.0, 78133.0, 135718.0, 252716.0, 667276.0, 3942583.0, 540929.0, 228047.0, 123315.0, 72449.0, 44030.0, 27363.0, 16878.0, 10908.0, 6918.0, 4638.0, 3016.0, 2103.0, 1391.0, 976.0, 658.0, 474.0, 339.0, 214.0, 152.0, 103.0, 90.0, 67.0, 49.0, 51.0, 24.0, 0.0, 22.0, 4.0, 4.0, 5.0, 13.0], "bins": [-3.228515625, -3.128936767578125, -3.02935791015625, -2.929779052734375, -2.8302001953125, -2.730621337890625, -2.63104248046875, -2.531463623046875, -2.431884765625, -2.332305908203125, -2.23272705078125, -2.133148193359375, -2.0335693359375, -1.933990478515625, -1.83441162109375, -1.734832763671875, -1.63525390625, -1.535675048828125, -1.43609619140625, -1.336517333984375, -1.2369384765625, -1.137359619140625, -1.03778076171875, -0.938201904296875, -0.838623046875, -0.739044189453125, -0.63946533203125, -0.539886474609375, -0.4403076171875, -0.340728759765625, -0.24114990234375, -0.141571044921875, -0.0419921875, 0.057586669921875, 0.15716552734375, 0.256744384765625, 0.3563232421875, 0.455902099609375, 0.55548095703125, 0.655059814453125, 0.754638671875, 0.854217529296875, 0.95379638671875, 1.053375244140625, 1.1529541015625, 1.252532958984375, 1.35211181640625, 1.451690673828125, 1.55126953125, 1.650848388671875, 1.75042724609375, 1.850006103515625, 1.9495849609375, 2.049163818359375, 2.14874267578125, 2.248321533203125, 2.347900390625, 2.447479248046875, 2.54705810546875, 2.646636962890625, 2.7462158203125, 2.845794677734375, 2.94537353515625, 3.044952392578125, 3.14453125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 3.0, 5.0, 4.0, 11.0, 5.0, 6.0, 22.0, 13.0, 19.0, 15.0, 27.0, 40.0, 26.0, 30.0, 37.0, 46.0, 46.0, 52.0, 104.0, 354.0, 530.0, 162.0, 70.0, 54.0, 52.0, 44.0, 39.0, 33.0, 23.0, 22.0, 20.0, 28.0, 16.0, 18.0, 12.0, 16.0, 6.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.6171875, -5.44232177734375, -5.2674560546875, -5.09259033203125, -4.917724609375, -4.74285888671875, -4.5679931640625, -4.39312744140625, -4.21826171875, -4.04339599609375, -3.8685302734375, -3.69366455078125, -3.518798828125, -3.34393310546875, -3.1690673828125, -2.99420166015625, -2.8193359375, -2.64447021484375, -2.4696044921875, -2.29473876953125, -2.119873046875, -1.94500732421875, -1.7701416015625, -1.59527587890625, -1.42041015625, -1.24554443359375, -1.0706787109375, -0.89581298828125, -0.720947265625, -0.54608154296875, -0.3712158203125, -0.19635009765625, -0.021484375, 0.15338134765625, 0.3282470703125, 0.50311279296875, 0.677978515625, 0.85284423828125, 1.0277099609375, 1.20257568359375, 1.37744140625, 1.55230712890625, 1.7271728515625, 1.90203857421875, 2.076904296875, 2.25177001953125, 2.4266357421875, 2.60150146484375, 2.7763671875, 2.95123291015625, 3.1260986328125, 3.30096435546875, 3.475830078125, 3.65069580078125, 3.8255615234375, 4.00042724609375, 4.17529296875, 4.35015869140625, 4.5250244140625, 4.69989013671875, 4.874755859375, 5.04962158203125, 5.2244873046875, 5.39935302734375, 5.57421875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 12.0, 6.0, 5.0, 14.0, 27.0, 37.0, 22.0, 33.0, 53.0, 57.0, 55.0, 97.0, 132.0, 117.0, 186.0, 255.0, 349.0, 499.0, 636.0, 806.0, 1258.0, 1856.0, 2673.0, 4456.0, 7543.0, 15317.0, 36407.0, 146945.0, 5910017.0, 99779.0, 29770.0, 12836.0, 6789.0, 3880.0, 2571.0, 1683.0, 1107.0, 821.0, 580.0, 396.0, 344.0, 252.0, 187.0, 131.0, 76.0, 77.0, 59.0, 45.0, 54.0, 46.0, 31.0, 18.0, 10.0, 9.0, 5.0, 8.0, 2.0, 9.0, 0.0, 6.0], "bins": [-9.296875, -9.0098876953125, -8.722900390625, -8.4359130859375, -8.14892578125, -7.8619384765625, -7.574951171875, -7.2879638671875, -7.0009765625, -6.7139892578125, -6.427001953125, -6.1400146484375, -5.85302734375, -5.5660400390625, -5.279052734375, -4.9920654296875, -4.705078125, -4.4180908203125, -4.131103515625, -3.8441162109375, -3.55712890625, -3.2701416015625, -2.983154296875, -2.6961669921875, -2.4091796875, -2.1221923828125, -1.835205078125, -1.5482177734375, -1.26123046875, -0.9742431640625, -0.687255859375, -0.4002685546875, -0.11328125, 0.1737060546875, 0.460693359375, 0.7476806640625, 1.03466796875, 1.3216552734375, 1.608642578125, 1.8956298828125, 2.1826171875, 2.4696044921875, 2.756591796875, 3.0435791015625, 3.33056640625, 3.6175537109375, 3.904541015625, 4.1915283203125, 4.478515625, 4.7655029296875, 5.052490234375, 5.3394775390625, 5.62646484375, 5.9134521484375, 6.200439453125, 6.4874267578125, 6.7744140625, 7.0614013671875, 7.348388671875, 7.6353759765625, 7.92236328125, 8.2093505859375, 8.496337890625, 8.7833251953125, 9.0703125]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 4.0, 5.0, 5.0, 2.0, 7.0, 9.0, 7.0, 11.0, 12.0, 10.0, 16.0, 15.0, 25.0, 20.0, 28.0, 34.0, 44.0, 41.0, 35.0, 49.0, 68.0, 133.0, 340.0, 415.0, 163.0, 85.0, 69.0, 44.0, 48.0, 36.0, 32.0, 29.0, 41.0, 24.0, 25.0, 13.0, 14.0, 10.0, 11.0, 6.0, 10.0, 8.0, 6.0, 7.0, 3.0, 5.0, 3.0, 2.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.416015625, -3.30609130859375, -3.1961669921875, -3.08624267578125, -2.976318359375, -2.86639404296875, -2.7564697265625, -2.64654541015625, -2.53662109375, -2.42669677734375, -2.3167724609375, -2.20684814453125, -2.096923828125, -1.98699951171875, -1.8770751953125, -1.76715087890625, -1.6572265625, -1.54730224609375, -1.4373779296875, -1.32745361328125, -1.217529296875, -1.10760498046875, -0.9976806640625, -0.88775634765625, -0.77783203125, -0.66790771484375, -0.5579833984375, -0.44805908203125, -0.338134765625, -0.22821044921875, -0.1182861328125, -0.00836181640625, 0.1015625, 0.21148681640625, 0.3214111328125, 0.43133544921875, 0.541259765625, 0.65118408203125, 0.7611083984375, 0.87103271484375, 0.98095703125, 1.09088134765625, 1.2008056640625, 1.31072998046875, 1.420654296875, 1.53057861328125, 1.6405029296875, 1.75042724609375, 1.8603515625, 1.97027587890625, 2.0802001953125, 2.19012451171875, 2.300048828125, 2.40997314453125, 2.5198974609375, 2.62982177734375, 2.73974609375, 2.84967041015625, 2.9595947265625, 3.06951904296875, 3.179443359375, 3.28936767578125, 3.3992919921875, 3.50921630859375, 3.619140625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 38.0, 75.0, 362.0, 398.0, 77.0, 30.0, 5.0, 7.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.866183280944824, -13.000533103942871, -12.134882926940918, -11.269231796264648, -10.403581619262695, -9.537931442260742, -8.672281265258789, -7.806630611419678, -6.940980434417725, -6.0753302574157715, -5.20967960357666, -4.344029426574707, -3.478379011154175, -2.6127285957336426, -1.7470784187316895, -0.8814277648925781, -0.015777587890625, 0.8498727679252625, 1.71552312374115, 2.5811734199523926, 3.446823835372925, 4.312474250793457, 5.17812442779541, 6.0437750816345215, 6.909425258636475, 7.775075435638428, 8.640726089477539, 9.506376266479492, 10.372026443481445, 11.237676620483398, 12.103326797485352, 12.968977928161621, 13.834627151489258, 14.700277328491211, 15.565927505493164, 16.431577682495117, 17.29722785949707, 18.162879943847656, 19.02853012084961, 19.894180297851562, 20.759830474853516, 21.62548065185547, 22.491130828857422, 23.356781005859375, 24.222431182861328, 25.08808135986328, 25.953731536865234, 26.81938362121582, 27.68503189086914, 28.550682067871094, 29.416332244873047, 30.281982421875, 31.147632598876953, 32.013282775878906, 32.87893295288086, 33.74458312988281, 34.61023712158203, 35.475887298583984, 36.34153747558594, 37.20718765258789, 38.072837829589844, 38.9384880065918, 39.80413818359375, 40.6697883605957, 41.535438537597656]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 2.0, 6.0, 9.0, 5.0, 9.0, 17.0, 12.0, 18.0, 16.0, 25.0, 14.0, 30.0, 39.0, 24.0, 28.0, 43.0, 33.0, 45.0, 22.0, 39.0, 44.0, 47.0, 42.0, 43.0, 35.0, 36.0, 34.0, 32.0, 37.0, 27.0, 28.0, 18.0, 21.0, 24.0, 14.0, 19.0, 11.0, 17.0, 13.0, 6.0, 8.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.966644763946533, -4.810634613037109, -4.6546244621276855, -4.498614311218262, -4.342604637145996, -4.186594486236572, -4.030584335327148, -3.8745741844177246, -3.718564033508301, -3.562553882598877, -3.406543731689453, -3.2505338191986084, -3.0945236682891846, -2.9385135173797607, -2.782503604888916, -2.626493453979492, -2.4704833030700684, -2.3144731521606445, -2.1584630012512207, -2.002453088760376, -1.8464429378509521, -1.6904327869415283, -1.534422755241394, -1.3784127235412598, -1.222402572631836, -1.066392421722412, -0.9103823900222778, -0.7543722987174988, -0.5983622074127197, -0.4423521161079407, -0.2863420248031616, -0.13033199310302734, 0.02567768096923828, 0.18168777227401733, 0.3376978635787964, 0.49370795488357544, 0.6497180461883545, 0.8057281374931335, 0.9617382287979126, 1.1177482604980469, 1.2737584114074707, 1.4297685623168945, 1.5857785940170288, 1.741788625717163, 1.897798776626587, 2.0538089275360107, 2.2098188400268555, 2.3658289909362793, 2.521839141845703, 2.677849292755127, 2.833859443664551, 2.9898693561553955, 3.1458795070648193, 3.301889657974243, 3.457899570465088, 3.6139097213745117, 3.7699198722839355, 3.9259300231933594, 4.081940174102783, 4.237950325012207, 4.393959999084473, 4.5499701499938965, 4.70598030090332, 4.861990451812744, 5.018000602722168]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 7.0, 3.0, 6.0, 9.0, 9.0, 11.0, 20.0, 32.0, 37.0, 31.0, 66.0, 76.0, 102.0, 129.0, 177.0, 288.0, 472.0, 663.0, 1149.0, 1865.0, 3293.0, 6333.0, 14010.0, 38173.0, 189674.0, 3824287.0, 73063.0, 21455.0, 8882.0, 4212.0, 2208.0, 1276.0, 795.0, 514.0, 321.0, 208.0, 119.0, 87.0, 61.0, 57.0, 45.0, 19.0, 13.0, 11.0, 4.0, 6.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0], "bins": [-0.0255584716796875, -0.0248720645904541, -0.024185657501220703, -0.023499250411987305, -0.022812843322753906, -0.022126436233520508, -0.02144002914428711, -0.02075362205505371, -0.020067214965820312, -0.019380807876586914, -0.018694400787353516, -0.018007993698120117, -0.01732158660888672, -0.01663517951965332, -0.015948772430419922, -0.015262365341186523, -0.014575958251953125, -0.013889551162719727, -0.013203144073486328, -0.01251673698425293, -0.011830329895019531, -0.011143922805786133, -0.010457515716552734, -0.009771108627319336, -0.009084701538085938, -0.008398294448852539, -0.007711887359619141, -0.007025480270385742, -0.006339073181152344, -0.005652666091918945, -0.004966259002685547, -0.0042798519134521484, -0.00359344482421875, -0.0029070377349853516, -0.002220630645751953, -0.0015342235565185547, -0.0008478164672851562, -0.0001614093780517578, 0.0005249977111816406, 0.001211404800415039, 0.0018978118896484375, 0.002584218978881836, 0.0032706260681152344, 0.003957033157348633, 0.004643440246582031, 0.00532984733581543, 0.006016254425048828, 0.0067026615142822266, 0.007389068603515625, 0.008075475692749023, 0.008761882781982422, 0.00944828987121582, 0.010134696960449219, 0.010821104049682617, 0.011507511138916016, 0.012193918228149414, 0.012880325317382812, 0.013566732406616211, 0.01425313949584961, 0.014939546585083008, 0.015625953674316406, 0.016312360763549805, 0.016998767852783203, 0.0176851749420166, 0.01837158203125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 0.0, 2.0, 3.0, 2.0, 8.0, 3.0, 4.0, 8.0, 6.0, 5.0, 10.0, 12.0, 10.0, 11.0, 25.0, 780.0, 16.0, 14.0, 13.0, 9.0, 8.0, 6.0, 8.0, 5.0, 6.0, 8.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004444122314453125, -0.004296720027923584, -0.004149317741394043, -0.004001915454864502, -0.003854513168334961, -0.00370711088180542, -0.003559708595275879, -0.003412306308746338, -0.003264904022216797, -0.003117501735687256, -0.002970099449157715, -0.002822697162628174, -0.002675294876098633, -0.002527892589569092, -0.0023804903030395508, -0.0022330880165100098, -0.0020856857299804688, -0.0019382834434509277, -0.0017908811569213867, -0.0016434788703918457, -0.0014960765838623047, -0.0013486742973327637, -0.0012012720108032227, -0.0010538697242736816, -0.0009064674377441406, -0.0007590651512145996, -0.0006116628646850586, -0.0004642605781555176, -0.00031685829162597656, -0.00016945600509643555, -2.205371856689453e-05, 0.00012534856796264648, 0.0002727508544921875, 0.0004201531410217285, 0.0005675554275512695, 0.0007149577140808105, 0.0008623600006103516, 0.0010097622871398926, 0.0011571645736694336, 0.0013045668601989746, 0.0014519691467285156, 0.0015993714332580566, 0.0017467737197875977, 0.0018941760063171387, 0.0020415782928466797, 0.0021889805793762207, 0.0023363828659057617, 0.0024837851524353027, 0.0026311874389648438, 0.0027785897254943848, 0.0029259920120239258, 0.003073394298553467, 0.003220796585083008, 0.003368198871612549, 0.00351560115814209, 0.003663003444671631, 0.003810405731201172, 0.003957808017730713, 0.004105210304260254, 0.004252612590789795, 0.004400014877319336, 0.004547417163848877, 0.004694819450378418, 0.004842221736907959, 0.0049896240234375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 7.0, 4.0, 4.0, 9.0, 7.0, 5.0, 18.0, 29.0, 49.0, 91.0, 146.0, 302.0, 786.0, 2859.0, 16661.0, 208067.0, 3694681.0, 247930.0, 18163.0, 2937.0, 807.0, 339.0, 143.0, 91.0, 49.0, 25.0, 18.0, 13.0, 14.0, 5.0, 7.0, 6.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.039825439453125, -0.03870439529418945, -0.037583351135253906, -0.03646230697631836, -0.03534126281738281, -0.034220218658447266, -0.03309917449951172, -0.03197813034057617, -0.030857086181640625, -0.029736042022705078, -0.02861499786376953, -0.027493953704833984, -0.026372909545898438, -0.02525186538696289, -0.024130821228027344, -0.023009777069091797, -0.02188873291015625, -0.020767688751220703, -0.019646644592285156, -0.01852560043334961, -0.017404556274414062, -0.016283512115478516, -0.015162467956542969, -0.014041423797607422, -0.012920379638671875, -0.011799335479736328, -0.010678291320800781, -0.009557247161865234, -0.008436203002929688, -0.007315158843994141, -0.006194114685058594, -0.005073070526123047, -0.0039520263671875, -0.002830982208251953, -0.0017099380493164062, -0.0005888938903808594, 0.0005321502685546875, 0.0016531944274902344, 0.0027742385864257812, 0.003895282745361328, 0.005016326904296875, 0.006137371063232422, 0.007258415222167969, 0.008379459381103516, 0.009500503540039062, 0.01062154769897461, 0.011742591857910156, 0.012863636016845703, 0.01398468017578125, 0.015105724334716797, 0.016226768493652344, 0.01734781265258789, 0.018468856811523438, 0.019589900970458984, 0.02071094512939453, 0.021831989288330078, 0.022953033447265625, 0.024074077606201172, 0.02519512176513672, 0.026316165924072266, 0.027437210083007812, 0.02855825424194336, 0.029679298400878906, 0.030800342559814453, 0.03192138671875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 6.0, 8.0, 3.0, 12.0, 10.0, 16.0, 22.0, 23.0, 35.0, 62.0, 78.0, 117.0, 166.0, 240.0, 431.0, 820.0, 828.0, 407.0, 256.0, 139.0, 114.0, 74.0, 54.0, 43.0, 39.0, 26.0, 12.0, 17.0, 5.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00598907470703125, -0.005775034427642822, -0.0055609941482543945, -0.005346953868865967, -0.005132913589477539, -0.004918873310089111, -0.004704833030700684, -0.004490792751312256, -0.004276752471923828, -0.0040627121925354, -0.0038486719131469727, -0.003634631633758545, -0.003420591354370117, -0.0032065510749816895, -0.0029925107955932617, -0.002778470516204834, -0.0025644302368164062, -0.0023503899574279785, -0.0021363496780395508, -0.001922309398651123, -0.0017082691192626953, -0.0014942288398742676, -0.0012801885604858398, -0.0010661482810974121, -0.0008521080017089844, -0.0006380677223205566, -0.0004240274429321289, -0.00020998716354370117, 4.0531158447265625e-06, 0.0002180933952331543, 0.00043213367462158203, 0.0006461739540100098, 0.0008602142333984375, 0.0010742545127868652, 0.001288294792175293, 0.0015023350715637207, 0.0017163753509521484, 0.0019304156303405762, 0.002144455909729004, 0.0023584961891174316, 0.0025725364685058594, 0.002786576747894287, 0.003000617027282715, 0.0032146573066711426, 0.0034286975860595703, 0.003642737865447998, 0.0038567781448364258, 0.0040708184242248535, 0.004284858703613281, 0.004498898983001709, 0.004712939262390137, 0.0049269795417785645, 0.005141019821166992, 0.00535506010055542, 0.005569100379943848, 0.005783140659332275, 0.005997180938720703, 0.006211221218109131, 0.006425261497497559, 0.006639301776885986, 0.006853342056274414, 0.007067382335662842, 0.0072814226150512695, 0.007495462894439697, 0.007709503173828125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 4.0, 7.0, 15.0, 18.0, 33.0, 60.0, 90.0, 138.0, 154.0, 149.0, 111.0, 96.0, 41.0, 30.0, 22.0, 16.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.032929886132478714, -0.031552888453006744, -0.030175894498825073, -0.028798898681998253, -0.027421902865171432, -0.026044907048344612, -0.024667911231517792, -0.02329091541469097, -0.02191391959786415, -0.02053692378103733, -0.01915992796421051, -0.01778293214738369, -0.01640593633055687, -0.01502894051373005, -0.013651944696903229, -0.012274948880076408, -0.010897953063249588, -0.009520957246422768, -0.008143961429595947, -0.006766965612769127, -0.0053899697959423065, -0.004012973979115486, -0.0026359781622886658, -0.0012589823454618454, 0.00011801347136497498, 0.0014950092881917953, 0.0028720051050186157, 0.004249000921845436, 0.0056259967386722565, 0.007002992555499077, 0.008379988372325897, 0.009756984189152718, 0.011133983731269836, 0.012510979548096657, 0.013887975364923477, 0.015264971181750298, 0.016641966998577118, 0.01801896281540394, 0.01939595863223076, 0.02077295444905758, 0.0221499502658844, 0.02352694608271122, 0.02490394189953804, 0.02628093771636486, 0.02765793353319168, 0.0290349293500185, 0.03041192516684532, 0.03178892284631729, 0.03316591680049896, 0.034542910754680634, 0.0359199084341526, 0.03729690611362457, 0.038673900067806244, 0.040050894021987915, 0.041427891701459885, 0.042804889380931854, 0.044181883335113525, 0.0455588772892952, 0.046935874968767166, 0.048312872648239136, 0.04968986660242081, 0.05106686055660248, 0.05244385823607445, 0.05382085591554642, 0.05519784986972809]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 5.0, 7.0, 9.0, 12.0, 15.0, 24.0, 17.0, 29.0, 22.0, 38.0, 35.0, 43.0, 50.0, 46.0, 48.0, 45.0, 60.0, 47.0, 46.0, 57.0, 45.0, 49.0, 29.0, 43.0, 32.0, 30.0, 24.0, 21.0, 17.0, 12.0, 15.0, 11.0, 6.0, 7.0, 3.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.02670830488204956, -0.02584611438214779, -0.024983923882246017, -0.024121733382344246, -0.023259542882442474, -0.022397352382540703, -0.02153516188263893, -0.02067297138273716, -0.019810780882835388, -0.018948590382933617, -0.018086399883031845, -0.017224209383130074, -0.016362018883228302, -0.01549982838332653, -0.014637637883424759, -0.013775447383522987, -0.012913256883621216, -0.012051066383719444, -0.011188875883817673, -0.010326685383915901, -0.00946449488401413, -0.008602304384112358, -0.0077401138842105865, -0.006877923384308815, -0.0060157328844070435, -0.005153542384505272, -0.0042913518846035, -0.003429161384701729, -0.0025669708847999573, -0.0017047803848981857, -0.0008425898849964142, 1.960061490535736e-05, 0.0008817911148071289, 0.0017439816147089005, 0.002606172114610672, 0.0034683626145124435, 0.004330553114414215, 0.005192743614315987, 0.006054934114217758, 0.00691712461411953, 0.007779315114021301, 0.008641505613923073, 0.009503696113824844, 0.010365886613726616, 0.011228077113628387, 0.012090267613530159, 0.01295245811343193, 0.013814648613333702, 0.014676839113235474, 0.015539029613137245, 0.016401220113039017, 0.01726341061294079, 0.01812560111284256, 0.01898779161274433, 0.019849982112646103, 0.020712172612547874, 0.021574363112449646, 0.022436553612351418, 0.02329874411225319, 0.02416093461215496, 0.025023125112056732, 0.025885315611958504, 0.026747506111860275, 0.027609696611762047, 0.02847188711166382]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 0.0, 5.0, 2.0, 4.0, 5.0, 10.0, 7.0, 10.0, 16.0, 28.0, 25.0, 54.0, 70.0, 90.0, 127.0, 170.0, 230.0, 341.0, 472.0, 662.0, 987.0, 1485.0, 2159.0, 3598.0, 6139.0, 11468.0, 27766.0, 595521.0, 345126.0, 25275.0, 10935.0, 5704.0, 3445.0, 2154.0, 1345.0, 932.0, 599.0, 453.0, 336.0, 194.0, 182.0, 120.0, 82.0, 64.0, 40.0, 36.0, 22.0, 20.0, 10.0, 9.0, 10.0, 4.0, 3.0, 3.0, 6.0, 3.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.034210205078125, -0.033139705657958984, -0.03206920623779297, -0.030998706817626953, -0.029928207397460938, -0.028857707977294922, -0.027787208557128906, -0.02671670913696289, -0.025646209716796875, -0.02457571029663086, -0.023505210876464844, -0.022434711456298828, -0.021364212036132812, -0.020293712615966797, -0.01922321319580078, -0.018152713775634766, -0.01708221435546875, -0.016011714935302734, -0.014941215515136719, -0.013870716094970703, -0.012800216674804688, -0.011729717254638672, -0.010659217834472656, -0.00958871841430664, -0.008518218994140625, -0.007447719573974609, -0.006377220153808594, -0.005306720733642578, -0.0042362213134765625, -0.003165721893310547, -0.0020952224731445312, -0.0010247230529785156, 4.57763671875e-05, 0.0011162757873535156, 0.0021867752075195312, 0.003257274627685547, 0.0043277740478515625, 0.005398273468017578, 0.006468772888183594, 0.007539272308349609, 0.008609771728515625, 0.00968027114868164, 0.010750770568847656, 0.011821269989013672, 0.012891769409179688, 0.013962268829345703, 0.015032768249511719, 0.016103267669677734, 0.01717376708984375, 0.018244266510009766, 0.01931476593017578, 0.020385265350341797, 0.021455764770507812, 0.022526264190673828, 0.023596763610839844, 0.02466726303100586, 0.025737762451171875, 0.02680826187133789, 0.027878761291503906, 0.028949260711669922, 0.030019760131835938, 0.031090259552001953, 0.03216075897216797, 0.033231258392333984, 0.0343017578125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 4.0, 3.0, 3.0, 2.0, 5.0, 3.0, 4.0, 5.0, 8.0, 2.0, 11.0, 9.0, 15.0, 69.0, 235.0, 351.0, 142.0, 40.0, 19.0, 9.0, 8.0, 7.0, 6.0, 7.0, 10.0, 3.0, 4.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.004428863525390625, -0.004282653331756592, -0.004136443138122559, -0.003990232944488525, -0.003844022750854492, -0.003697812557220459, -0.0035516023635864258, -0.0034053921699523926, -0.0032591819763183594, -0.003112971782684326, -0.002966761589050293, -0.0028205513954162598, -0.0026743412017822266, -0.0025281310081481934, -0.00238192081451416, -0.002235710620880127, -0.0020895004272460938, -0.0019432902336120605, -0.0017970800399780273, -0.0016508698463439941, -0.001504659652709961, -0.0013584494590759277, -0.0012122392654418945, -0.0010660290718078613, -0.0009198188781738281, -0.0007736086845397949, -0.0006273984909057617, -0.0004811882972717285, -0.0003349781036376953, -0.0001887679100036621, -4.2557716369628906e-05, 0.0001036524772644043, 0.0002498626708984375, 0.0003960728645324707, 0.0005422830581665039, 0.0006884932518005371, 0.0008347034454345703, 0.0009809136390686035, 0.0011271238327026367, 0.00127333402633667, 0.0014195442199707031, 0.0015657544136047363, 0.0017119646072387695, 0.0018581748008728027, 0.002004384994506836, 0.002150595188140869, 0.0022968053817749023, 0.0024430155754089355, 0.0025892257690429688, 0.002735435962677002, 0.002881646156311035, 0.0030278563499450684, 0.0031740665435791016, 0.0033202767372131348, 0.003466486930847168, 0.003612697124481201, 0.0037589073181152344, 0.0039051175117492676, 0.004051327705383301, 0.004197537899017334, 0.004343748092651367, 0.0044899582862854, 0.004636168479919434, 0.004782378673553467, 0.0049285888671875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 6.0, 11.0, 8.0, 26.0, 30.0, 30.0, 41.0, 71.0, 70.0, 126.0, 197.0, 401.0, 700.0, 1285.0, 3241.0, 10739.0, 166868.0, 831751.0, 24042.0, 4869.0, 1971.0, 823.0, 463.0, 267.0, 140.0, 126.0, 74.0, 50.0, 37.0, 22.0, 11.0, 12.0, 14.0, 8.0, 2.0, 5.0, 1.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0908203125, -0.0882406234741211, -0.08566093444824219, -0.08308124542236328, -0.08050155639648438, -0.07792186737060547, -0.07534217834472656, -0.07276248931884766, -0.07018280029296875, -0.06760311126708984, -0.06502342224121094, -0.06244373321533203, -0.059864044189453125, -0.05728435516357422, -0.05470466613769531, -0.052124977111816406, -0.0495452880859375, -0.046965599060058594, -0.04438591003417969, -0.04180622100830078, -0.039226531982421875, -0.03664684295654297, -0.03406715393066406, -0.031487464904785156, -0.02890777587890625, -0.026328086853027344, -0.023748397827148438, -0.02116870880126953, -0.018589019775390625, -0.01600933074951172, -0.013429641723632812, -0.010849952697753906, -0.008270263671875, -0.005690574645996094, -0.0031108856201171875, -0.0005311965942382812, 0.002048492431640625, 0.004628181457519531, 0.0072078704833984375, 0.009787559509277344, 0.01236724853515625, 0.014946937561035156, 0.017526626586914062, 0.02010631561279297, 0.022686004638671875, 0.02526569366455078, 0.027845382690429688, 0.030425071716308594, 0.0330047607421875, 0.035584449768066406, 0.03816413879394531, 0.04074382781982422, 0.043323516845703125, 0.04590320587158203, 0.04848289489746094, 0.051062583923339844, 0.05364227294921875, 0.056221961975097656, 0.05880165100097656, 0.06138134002685547, 0.06396102905273438, 0.06654071807861328, 0.06912040710449219, 0.0717000961303711, 0.07427978515625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 6.0, 7.0, 7.0, 17.0, 10.0, 15.0, 14.0, 14.0, 15.0, 30.0, 28.0, 29.0, 19.0, 31.0, 38.0, 34.0, 31.0, 43.0, 53.0, 38.0, 35.0, 43.0, 38.0, 41.0, 34.0, 31.0, 23.0, 30.0, 24.0, 29.0, 26.0, 22.0, 17.0, 31.0, 16.0, 24.0, 6.0, 9.0, 10.0, 8.0, 6.0, 7.0, 5.0, 7.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01751708984375, -0.016912221908569336, -0.016307353973388672, -0.015702486038208008, -0.015097618103027344, -0.01449275016784668, -0.013887882232666016, -0.013283014297485352, -0.012678146362304688, -0.012073278427124023, -0.01146841049194336, -0.010863542556762695, -0.010258674621582031, -0.009653806686401367, -0.009048938751220703, -0.008444070816040039, -0.007839202880859375, -0.007234334945678711, -0.006629467010498047, -0.006024599075317383, -0.005419731140136719, -0.004814863204956055, -0.004209995269775391, -0.0036051273345947266, -0.0030002593994140625, -0.0023953914642333984, -0.0017905235290527344, -0.0011856555938720703, -0.0005807876586914062, 2.4080276489257812e-05, 0.0006289482116699219, 0.001233816146850586, 0.00183868408203125, 0.002443552017211914, 0.003048419952392578, 0.003653287887573242, 0.004258155822753906, 0.00486302375793457, 0.005467891693115234, 0.0060727596282958984, 0.0066776275634765625, 0.0072824954986572266, 0.00788736343383789, 0.008492231369018555, 0.009097099304199219, 0.009701967239379883, 0.010306835174560547, 0.010911703109741211, 0.011516571044921875, 0.012121438980102539, 0.012726306915283203, 0.013331174850463867, 0.013936042785644531, 0.014540910720825195, 0.01514577865600586, 0.015750646591186523, 0.016355514526367188, 0.01696038246154785, 0.017565250396728516, 0.01817011833190918, 0.018774986267089844, 0.019379854202270508, 0.019984722137451172, 0.020589590072631836, 0.0211944580078125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 2.0, 5.0, 13.0, 18.0, 26.0, 24.0, 65.0, 120.0, 251.0, 668.0, 2246.0, 17242.0, 988102.0, 35251.0, 3105.0, 792.0, 289.0, 141.0, 87.0, 36.0, 26.0, 16.0, 18.0, 5.0, 2.0, 1.0, 4.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07763671875, -0.07557201385498047, -0.07350730895996094, -0.0714426040649414, -0.06937789916992188, -0.06731319427490234, -0.06524848937988281, -0.06318378448486328, -0.06111907958984375, -0.05905437469482422, -0.05698966979980469, -0.054924964904785156, -0.052860260009765625, -0.050795555114746094, -0.04873085021972656, -0.04666614532470703, -0.0446014404296875, -0.04253673553466797, -0.04047203063964844, -0.038407325744628906, -0.036342620849609375, -0.034277915954589844, -0.03221321105957031, -0.03014850616455078, -0.02808380126953125, -0.02601909637451172, -0.023954391479492188, -0.021889686584472656, -0.019824981689453125, -0.017760276794433594, -0.015695571899414062, -0.013630867004394531, -0.011566162109375, -0.009501457214355469, -0.0074367523193359375, -0.005372047424316406, -0.003307342529296875, -0.0012426376342773438, 0.0008220672607421875, 0.0028867721557617188, 0.00495147705078125, 0.007016181945800781, 0.009080886840820312, 0.011145591735839844, 0.013210296630859375, 0.015275001525878906, 0.017339706420898438, 0.01940441131591797, 0.0214691162109375, 0.02353382110595703, 0.025598526000976562, 0.027663230895996094, 0.029727935791015625, 0.031792640686035156, 0.03385734558105469, 0.03592205047607422, 0.03798675537109375, 0.04005146026611328, 0.04211616516113281, 0.044180870056152344, 0.046245574951171875, 0.048310279846191406, 0.05037498474121094, 0.05243968963623047, 0.05450439453125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 4.0, 2.0, 1.0, 1.0, 5.0, 7.0, 8.0, 9.0, 9.0, 8.0, 9.0, 26.0, 31.0, 29.0, 29.0, 49.0, 64.0, 85.0, 91.0, 114.0, 88.0, 91.0, 41.0, 46.0, 37.0, 26.0, 20.0, 12.0, 6.0, 8.0, 6.0, 8.0, 10.0, 5.0, 3.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.002155303955078125, -0.0020920783281326294, -0.002028852701187134, -0.001965627074241638, -0.0019024014472961426, -0.001839175820350647, -0.0017759501934051514, -0.0017127245664596558, -0.0016494989395141602, -0.0015862733125686646, -0.001523047685623169, -0.0014598220586776733, -0.0013965964317321777, -0.0013333708047866821, -0.0012701451778411865, -0.001206919550895691, -0.0011436939239501953, -0.0010804682970046997, -0.001017242670059204, -0.0009540170431137085, -0.0008907914161682129, -0.0008275657892227173, -0.0007643401622772217, -0.0007011145353317261, -0.0006378889083862305, -0.0005746632814407349, -0.0005114376544952393, -0.00044821202754974365, -0.00038498640060424805, -0.00032176077365875244, -0.00025853514671325684, -0.00019530951976776123, -0.00013208389282226562, -6.885826587677002e-05, -5.632638931274414e-06, 5.759298801422119e-05, 0.0001208186149597168, 0.0001840442419052124, 0.000247269868850708, 0.0003104954957962036, 0.0003737211227416992, 0.0004369467496871948, 0.0005001723766326904, 0.000563398003578186, 0.0006266236305236816, 0.0006898492574691772, 0.0007530748844146729, 0.0008163005113601685, 0.0008795261383056641, 0.0009427517652511597, 0.0010059773921966553, 0.0010692030191421509, 0.0011324286460876465, 0.001195654273033142, 0.0012588798999786377, 0.0013221055269241333, 0.001385331153869629, 0.0014485567808151245, 0.0015117824077606201, 0.0015750080347061157, 0.0016382336616516113, 0.001701459288597107, 0.0017646849155426025, 0.0018279105424880981, 0.0018911361694335938]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 17.0, 16.0, 27.0, 41.0, 69.0, 176.0, 433.0, 1504.0, 6324.0, 51823.0, 892137.0, 84994.0, 8130.0, 1862.0, 574.0, 225.0, 98.0, 48.0, 26.0, 11.0, 8.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.031280517578125, -0.030103683471679688, -0.028926849365234375, -0.027750015258789062, -0.02657318115234375, -0.025396347045898438, -0.024219512939453125, -0.023042678833007812, -0.0218658447265625, -0.020689010620117188, -0.019512176513671875, -0.018335342407226562, -0.01715850830078125, -0.015981674194335938, -0.014804840087890625, -0.013628005981445312, -0.012451171875, -0.011274337768554688, -0.010097503662109375, -0.008920669555664062, -0.00774383544921875, -0.0065670013427734375, -0.005390167236328125, -0.0042133331298828125, -0.0030364990234375, -0.0018596649169921875, -0.000682830810546875, 0.0004940032958984375, 0.00167083740234375, 0.0028476715087890625, 0.004024505615234375, 0.0052013397216796875, 0.006378173828125, 0.0075550079345703125, 0.008731842041015625, 0.009908676147460938, 0.01108551025390625, 0.012262344360351562, 0.013439178466796875, 0.014616012573242188, 0.0157928466796875, 0.016969680786132812, 0.018146514892578125, 0.019323348999023438, 0.02050018310546875, 0.021677017211914062, 0.022853851318359375, 0.024030685424804688, 0.02520751953125, 0.026384353637695312, 0.027561187744140625, 0.028738021850585938, 0.02991485595703125, 0.031091690063476562, 0.032268524169921875, 0.03344535827636719, 0.0346221923828125, 0.03579902648925781, 0.036975860595703125, 0.03815269470214844, 0.03932952880859375, 0.04050636291503906, 0.041683197021484375, 0.04286003112792969, 0.044036865234375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 1.0, 2.0, 2.0, 5.0, 4.0, 5.0, 11.0, 15.0, 11.0, 14.0, 15.0, 30.0, 56.0, 55.0, 66.0, 80.0, 110.0, 104.0, 84.0, 67.0, 65.0, 46.0, 37.0, 28.0, 21.0, 15.0, 14.0, 6.0, 6.0, 7.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01605224609375, -0.01554250717163086, -0.015032768249511719, -0.014523029327392578, -0.014013290405273438, -0.013503551483154297, -0.012993812561035156, -0.012484073638916016, -0.011974334716796875, -0.011464595794677734, -0.010954856872558594, -0.010445117950439453, -0.009935379028320312, -0.009425640106201172, -0.008915901184082031, -0.00840616226196289, -0.00789642333984375, -0.007386684417724609, -0.006876945495605469, -0.006367206573486328, -0.0058574676513671875, -0.005347728729248047, -0.004837989807128906, -0.004328250885009766, -0.003818511962890625, -0.0033087730407714844, -0.0027990341186523438, -0.002289295196533203, -0.0017795562744140625, -0.0012698173522949219, -0.0007600784301757812, -0.0002503395080566406, 0.0002593994140625, 0.0007691383361816406, 0.0012788772583007812, 0.0017886161804199219, 0.0022983551025390625, 0.002808094024658203, 0.0033178329467773438, 0.0038275718688964844, 0.004337310791015625, 0.004847049713134766, 0.005356788635253906, 0.005866527557373047, 0.0063762664794921875, 0.006886005401611328, 0.007395744323730469, 0.00790548324584961, 0.00841522216796875, 0.00892496109008789, 0.009434700012207031, 0.009944438934326172, 0.010454177856445312, 0.010963916778564453, 0.011473655700683594, 0.011983394622802734, 0.012493133544921875, 0.013002872467041016, 0.013512611389160156, 0.014022350311279297, 0.014532089233398438, 0.015041828155517578, 0.015551567077636719, 0.01606130599975586, 0.016571044921875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 6.0, 2.0, 8.0, 28.0, 229.0, 631.0, 59.0, 17.0, 14.0, 5.0, 0.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8714686632156372, -0.8435510993003845, -0.8156334757804871, -0.7877159118652344, -0.7597983479499817, -0.731880784034729, -0.7039631605148315, -0.6760455965995789, -0.6481280326843262, -0.6202104687690735, -0.592292845249176, -0.5643752813339233, -0.5364577174186707, -0.508540153503418, -0.4806225299835205, -0.4527049660682678, -0.42478734254837036, -0.3968697488307953, -0.3689521849155426, -0.34103459119796753, -0.31311702728271484, -0.28519943356513977, -0.2572818398475647, -0.22936426103115082, -0.20144668221473694, -0.17352910339832306, -0.14561152458190918, -0.1176939308643341, -0.08977635204792023, -0.06185877323150635, -0.033941179513931274, -0.006023600697517395, 0.02189391851425171, 0.04981150105595589, 0.07772908359766006, 0.10564666986465454, 0.13356424868106842, 0.1614818274974823, 0.18939942121505737, 0.21731700003147125, 0.24523457884788513, 0.2731521725654602, 0.3010697364807129, 0.32898733019828796, 0.35690492391586304, 0.3848224878311157, 0.4127400815486908, 0.44065767526626587, 0.46857523918151855, 0.49649283289909363, 0.5244104266166687, 0.5523279905319214, 0.5802455544471741, 0.6081631183624268, 0.6360807418823242, 0.6639983057975769, 0.6919158697128296, 0.7198334336280823, 0.7477510571479797, 0.7756686210632324, 0.8035861849784851, 0.8315037488937378, 0.8594213724136353, 0.8873389363288879, 0.9152565598487854]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 6.0, 1.0, 4.0, 4.0, 4.0, 6.0, 2.0, 5.0, 10.0, 15.0, 22.0, 47.0, 79.0, 114.0, 159.0, 152.0, 138.0, 87.0, 46.0, 35.0, 23.0, 12.0, 5.0, 3.0, 4.0, 4.0, 6.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.4582235813140869, -0.4447319805622101, -0.43124035000801086, -0.41774874925613403, -0.4042571485042572, -0.39076554775238037, -0.37727391719818115, -0.3637823164463043, -0.3502907156944275, -0.33679911494255066, -0.32330748438835144, -0.3098158836364746, -0.2963242828845978, -0.28283268213272095, -0.26934105157852173, -0.2558494508266449, -0.24235783517360687, -0.22886621952056885, -0.21537461876869202, -0.201883003115654, -0.18839140236377716, -0.17489978671073914, -0.1614081859588623, -0.14791657030582428, -0.13442495465278625, -0.12093334645032883, -0.1074417382478714, -0.09395012259483337, -0.08045852184295654, -0.06696690618991852, -0.05347529798746109, -0.03998368978500366, -0.02649208903312683, -0.013000479899346828, 0.0004911292344331741, 0.013982739299535751, 0.02747434750199318, 0.040965959429740906, 0.054457567632198334, 0.06794917583465576, 0.08144078403711319, 0.09493239223957062, 0.10842400044202805, 0.12191560864448547, 0.1354072242975235, 0.14889883995056152, 0.16239044070243835, 0.17588204145431519, 0.1893736571073532, 0.20286527276039124, 0.21635687351226807, 0.2298484891653061, 0.24334008991718292, 0.25683170557022095, 0.2703233063220978, 0.2838149070739746, 0.29730653762817383, 0.31079813838005066, 0.3242897689342499, 0.3377813696861267, 0.35127297043800354, 0.36476457118988037, 0.3782562017440796, 0.3917478024959564, 0.40523940324783325]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 4.0, 3.0, 4.0, 10.0, 8.0, 11.0, 16.0, 11.0, 24.0, 26.0, 43.0, 108.0, 729.0, 23959.0, 4166997.0, 2032.0, 108.0, 57.0, 37.0, 21.0, 17.0, 15.0, 10.0, 9.0, 5.0, 3.0, 6.0, 1.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.109375, -2.0543060302734375, -1.999237060546875, -1.9441680908203125, -1.88909912109375, -1.8340301513671875, -1.778961181640625, -1.7238922119140625, -1.6688232421875, -1.6137542724609375, -1.558685302734375, -1.5036163330078125, -1.44854736328125, -1.3934783935546875, -1.338409423828125, -1.2833404541015625, -1.228271484375, -1.1732025146484375, -1.118133544921875, -1.0630645751953125, -1.00799560546875, -0.9529266357421875, -0.897857666015625, -0.8427886962890625, -0.7877197265625, -0.7326507568359375, -0.677581787109375, -0.6225128173828125, -0.56744384765625, -0.5123748779296875, -0.457305908203125, -0.4022369384765625, -0.34716796875, -0.2920989990234375, -0.237030029296875, -0.1819610595703125, -0.12689208984375, -0.0718231201171875, -0.016754150390625, 0.0383148193359375, 0.0933837890625, 0.1484527587890625, 0.203521728515625, 0.2585906982421875, 0.31365966796875, 0.3687286376953125, 0.423797607421875, 0.4788665771484375, 0.533935546875, 0.5890045166015625, 0.644073486328125, 0.6991424560546875, 0.75421142578125, 0.8092803955078125, 0.864349365234375, 0.9194183349609375, 0.9744873046875, 1.0295562744140625, 1.084625244140625, 1.1396942138671875, 1.19476318359375, 1.2498321533203125, 1.304901123046875, 1.3599700927734375, 1.4150390625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 5.0, 2.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 4.0, 11.0, 5.0, 8.0, 10.0, 13.0, 11.0, 27.0, 34.0, 78.0, 107.0, 158.0, 157.0, 97.0, 85.0, 59.0, 30.0, 11.0, 10.0, 11.0, 7.0, 4.0, 7.0, 9.0, 3.0, 3.0, 5.0, 5.0, 4.0, 2.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003025054931640625, -0.0029384493827819824, -0.00285184383392334, -0.0027652382850646973, -0.0026786327362060547, -0.002592027187347412, -0.0025054216384887695, -0.002418816089630127, -0.0023322105407714844, -0.002245604991912842, -0.0021589994430541992, -0.0020723938941955566, -0.001985788345336914, -0.0018991827964782715, -0.001812577247619629, -0.0017259716987609863, -0.0016393661499023438, -0.0015527606010437012, -0.0014661550521850586, -0.001379549503326416, -0.0012929439544677734, -0.0012063384056091309, -0.0011197328567504883, -0.0010331273078918457, -0.0009465217590332031, -0.0008599162101745605, -0.000773310661315918, -0.0006867051124572754, -0.0006000995635986328, -0.0005134940147399902, -0.00042688846588134766, -0.0003402829170227051, -0.0002536773681640625, -0.00016707181930541992, -8.046627044677734e-05, 6.139278411865234e-06, 9.274482727050781e-05, 0.0001793503761291504, 0.00026595592498779297, 0.00035256147384643555, 0.0004391670227050781, 0.0005257725715637207, 0.0006123781204223633, 0.0006989836692810059, 0.0007855892181396484, 0.000872194766998291, 0.0009588003158569336, 0.0010454058647155762, 0.0011320114135742188, 0.0012186169624328613, 0.001305222511291504, 0.0013918280601501465, 0.001478433609008789, 0.0015650391578674316, 0.0016516447067260742, 0.0017382502555847168, 0.0018248558044433594, 0.001911461353302002, 0.0019980669021606445, 0.002084672451019287, 0.0021712779998779297, 0.0022578835487365723, 0.002344489097595215, 0.0024310946464538574, 0.0025177001953125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 2.0, 2.0, 6.0, 10.0, 7.0, 10.0, 13.0, 25.0, 23.0, 29.0, 39.0, 49.0, 64.0, 76.0, 96.0, 142.0, 220.0, 1362.0, 4033475.0, 157222.0, 643.0, 178.0, 141.0, 100.0, 89.0, 49.0, 56.0, 24.0, 34.0, 24.0, 15.0, 24.0, 6.0, 5.0, 3.0, 11.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26953125, -0.2595024108886719, -0.24947357177734375, -0.23944473266601562, -0.2294158935546875, -0.21938705444335938, -0.20935821533203125, -0.19932937622070312, -0.189300537109375, -0.17927169799804688, -0.16924285888671875, -0.15921401977539062, -0.1491851806640625, -0.13915634155273438, -0.12912750244140625, -0.11909866333007812, -0.10906982421875, -0.09904098510742188, -0.08901214599609375, -0.07898330688476562, -0.0689544677734375, -0.058925628662109375, -0.04889678955078125, -0.038867950439453125, -0.028839111328125, -0.018810272216796875, -0.00878143310546875, 0.001247406005859375, 0.0112762451171875, 0.021305084228515625, 0.03133392333984375, 0.041362762451171875, 0.0513916015625, 0.061420440673828125, 0.07144927978515625, 0.08147811889648438, 0.0915069580078125, 0.10153579711914062, 0.11156463623046875, 0.12159347534179688, 0.131622314453125, 0.14165115356445312, 0.15167999267578125, 0.16170883178710938, 0.1717376708984375, 0.18176651000976562, 0.19179534912109375, 0.20182418823242188, 0.21185302734375, 0.22188186645507812, 0.23191070556640625, 0.24193954467773438, 0.2519683837890625, 0.2619972229003906, 0.27202606201171875, 0.2820549011230469, 0.292083740234375, 0.3021125793457031, 0.31214141845703125, 0.3221702575683594, 0.3321990966796875, 0.3422279357910156, 0.35225677490234375, 0.3622856140136719, 0.372314453125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 7.0, 7.0, 7.0, 12.0, 12.0, 14.0, 15.0, 22.0, 31.0, 57.0, 77.0, 101.0, 131.0, 230.0, 325.0, 547.0, 899.0, 505.0, 287.0, 210.0, 186.0, 110.0, 78.0, 55.0, 34.0, 21.0, 26.0, 19.0, 12.0, 7.0, 7.0, 2.0, 7.0, 7.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.004611968994140625, -0.0044699907302856445, -0.004328012466430664, -0.004186034202575684, -0.004044055938720703, -0.0039020776748657227, -0.003760099411010742, -0.0036181211471557617, -0.0034761428833007812, -0.0033341646194458008, -0.0031921863555908203, -0.00305020809173584, -0.0029082298278808594, -0.002766251564025879, -0.0026242733001708984, -0.002482295036315918, -0.0023403167724609375, -0.002198338508605957, -0.0020563602447509766, -0.001914381980895996, -0.0017724037170410156, -0.0016304254531860352, -0.0014884471893310547, -0.0013464689254760742, -0.0012044906616210938, -0.0010625123977661133, -0.0009205341339111328, -0.0007785558700561523, -0.0006365776062011719, -0.0004945993423461914, -0.00035262107849121094, -0.00021064281463623047, -6.866455078125e-05, 7.331371307373047e-05, 0.00021529197692871094, 0.0003572702407836914, 0.0004992485046386719, 0.0006412267684936523, 0.0007832050323486328, 0.0009251832962036133, 0.0010671615600585938, 0.0012091398239135742, 0.0013511180877685547, 0.0014930963516235352, 0.0016350746154785156, 0.001777052879333496, 0.0019190311431884766, 0.002061009407043457, 0.0022029876708984375, 0.002344965934753418, 0.0024869441986083984, 0.002628922462463379, 0.0027709007263183594, 0.00291287899017334, 0.0030548572540283203, 0.0031968355178833008, 0.0033388137817382812, 0.0034807920455932617, 0.003622770309448242, 0.0037647485733032227, 0.003906726837158203, 0.004048705101013184, 0.004190683364868164, 0.0043326616287231445, 0.004474639892578125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 8.0, 159.0, 810.0, 39.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04298434779047966, -0.029278934001922607, -0.015573520213365555, -0.0018681064248085022, 0.01183730736374855, 0.0255427248775959, 0.039248134940862656, 0.05295354500412941, 0.06665895879268646, 0.08036437630653381, 0.09406978636980057, 0.10777519643306732, 0.12148061394691467, 0.13518603146076202, 0.14889144897460938, 0.16259685158729553, 0.17630226910114288, 0.19000768661499023, 0.2037130892276764, 0.21741850674152374, 0.2311239242553711, 0.24482934176921844, 0.2585347592830658, 0.27224016189575195, 0.2859455943107605, 0.29965099692344666, 0.3133564293384552, 0.32706183195114136, 0.3407672643661499, 0.35447266697883606, 0.3681780695915222, 0.38188350200653076, 0.39558887481689453, 0.4092942774295807, 0.42299970984458923, 0.4367051124572754, 0.45041054487228394, 0.4641159474849701, 0.47782135009765625, 0.4915267825126648, 0.5052322149276733, 0.5189376473426819, 0.5326430201530457, 0.5463484525680542, 0.5600538849830627, 0.5737593173980713, 0.5874646902084351, 0.6011701226234436, 0.6148754954338074, 0.6285809278488159, 0.6422863006591797, 0.6559917330741882, 0.6696971654891968, 0.6834025382995605, 0.6971079707145691, 0.7108134031295776, 0.7245187759399414, 0.73822420835495, 0.7519295811653137, 0.7656350135803223, 0.7793404459953308, 0.7930458784103394, 0.8067512512207031, 0.8204566836357117, 0.8341621160507202]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 12.0, 10.0, 21.0, 33.0, 58.0, 88.0, 102.0, 122.0, 120.0, 103.0, 106.0, 79.0, 56.0, 38.0, 24.0, 11.0, 9.0, 4.0, 6.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02246958017349243, -0.02055458351969719, -0.018639585003256798, -0.016724586486816406, -0.014809589833021164, -0.012894592247903347, -0.01097959466278553, -0.009064597077667713, -0.007149599492549896, -0.005234601907432079, -0.0033196043223142624, -0.0014046067371964455, 0.0005103908479213715, 0.0024253884330391884, 0.004340386018157005, 0.006255383603274822, 0.00817038118839264, 0.010085378773510456, 0.012000376358628273, 0.01391537394374609, 0.015830371528863907, 0.01774536818265915, 0.01966036669909954, 0.021575365215539932, 0.023490361869335175, 0.025405358523130417, 0.02732035703957081, 0.0292353555560112, 0.031150352209806442, 0.033065348863601685, 0.034980349242687225, 0.03689534589648247, 0.03881034255027771, 0.04072533920407295, 0.042640335857868195, 0.044555336236953735, 0.04647033289074898, 0.04838532954454422, 0.05030032992362976, 0.052215326577425, 0.054130323231220245, 0.05604531988501549, 0.05796031653881073, 0.05987531691789627, 0.06179031357169151, 0.06370531022548676, 0.0656203106045723, 0.06753530353307724, 0.06945030391216278, 0.07136530429124832, 0.07328029721975327, 0.0751952975988388, 0.07711029052734375, 0.07902529090642929, 0.08094029128551483, 0.08285528421401978, 0.08477028459310532, 0.08668528497219086, 0.0886002779006958, 0.09051527827978134, 0.09243027865886688, 0.09434527158737183, 0.09626027196645737, 0.09817526489496231, 0.10009026527404785]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 9.0, 4.0, 4.0, 8.0, 12.0, 15.0, 23.0, 18.0, 39.0, 25.0, 39.0, 78.0, 225.0, 923.0, 5108.0, 47532.0, 956079.0, 33027.0, 4113.0, 798.0, 206.0, 80.0, 47.0, 30.0, 26.0, 15.0, 9.0, 19.0, 9.0, 10.0, 3.0, 4.0, 5.0, 5.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08380126953125, -0.08104801177978516, -0.07829475402832031, -0.07554149627685547, -0.07278823852539062, -0.07003498077392578, -0.06728172302246094, -0.0645284652709961, -0.06177520751953125, -0.059021949768066406, -0.05626869201660156, -0.05351543426513672, -0.050762176513671875, -0.04800891876220703, -0.04525566101074219, -0.042502403259277344, -0.0397491455078125, -0.036995887756347656, -0.03424263000488281, -0.03148937225341797, -0.028736114501953125, -0.02598285675048828, -0.023229598999023438, -0.020476341247558594, -0.01772308349609375, -0.014969825744628906, -0.012216567993164062, -0.009463310241699219, -0.006710052490234375, -0.003956794738769531, -0.0012035369873046875, 0.0015497207641601562, 0.004302978515625, 0.007056236267089844, 0.009809494018554688, 0.012562751770019531, 0.015316009521484375, 0.01806926727294922, 0.020822525024414062, 0.023575782775878906, 0.02632904052734375, 0.029082298278808594, 0.03183555603027344, 0.03458881378173828, 0.037342071533203125, 0.04009532928466797, 0.04284858703613281, 0.045601844787597656, 0.0483551025390625, 0.051108360290527344, 0.05386161804199219, 0.05661487579345703, 0.059368133544921875, 0.06212139129638672, 0.06487464904785156, 0.0676279067993164, 0.07038116455078125, 0.0731344223022461, 0.07588768005371094, 0.07864093780517578, 0.08139419555664062, 0.08414745330810547, 0.08690071105957031, 0.08965396881103516, 0.0924072265625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 5.0, 4.0, 0.0, 8.0, 9.0, 17.0, 28.0, 84.0, 253.0, 328.0, 162.0, 46.0, 24.0, 13.0, 18.0, 5.0, 8.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00287628173828125, -0.0026438236236572266, -0.002411365509033203, -0.0021789073944091797, -0.0019464492797851562, -0.0017139911651611328, -0.0014815330505371094, -0.001249074935913086, -0.0010166168212890625, -0.0007841587066650391, -0.0005517005920410156, -0.0003192424774169922, -8.678436279296875e-05, 0.0001456737518310547, 0.0003781318664550781, 0.0006105899810791016, 0.000843048095703125, 0.0010755062103271484, 0.0013079643249511719, 0.0015404224395751953, 0.0017728805541992188, 0.002005338668823242, 0.0022377967834472656, 0.002470254898071289, 0.0027027130126953125, 0.002935171127319336, 0.0031676292419433594, 0.003400087356567383, 0.0036325454711914062, 0.0038650035858154297, 0.004097461700439453, 0.0043299198150634766, 0.0045623779296875, 0.0047948360443115234, 0.005027294158935547, 0.00525975227355957, 0.005492210388183594, 0.005724668502807617, 0.005957126617431641, 0.006189584732055664, 0.0064220428466796875, 0.006654500961303711, 0.006886959075927734, 0.007119417190551758, 0.007351875305175781, 0.007584333419799805, 0.007816791534423828, 0.008049249649047852, 0.008281707763671875, 0.008514165878295898, 0.008746623992919922, 0.008979082107543945, 0.009211540222167969, 0.009443998336791992, 0.009676456451416016, 0.009908914566040039, 0.010141372680664062, 0.010373830795288086, 0.01060628890991211, 0.010838747024536133, 0.011071205139160156, 0.01130366325378418, 0.011536121368408203, 0.011768579483032227, 0.01200103759765625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 2.0, 3.0, 7.0, 10.0, 11.0, 16.0, 15.0, 20.0, 27.0, 31.0, 25.0, 55.0, 84.0, 384.0, 3499.0, 357317.0, 680882.0, 5350.0, 477.0, 123.0, 42.0, 23.0, 27.0, 35.0, 12.0, 17.0, 15.0, 3.0, 13.0, 8.0, 5.0, 2.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0821533203125, -0.07922554016113281, -0.07629776000976562, -0.07336997985839844, -0.07044219970703125, -0.06751441955566406, -0.06458663940429688, -0.06165885925292969, -0.0587310791015625, -0.05580329895019531, -0.052875518798828125, -0.04994773864746094, -0.04701995849609375, -0.04409217834472656, -0.041164398193359375, -0.03823661804199219, -0.035308837890625, -0.03238105773925781, -0.029453277587890625, -0.026525497436523438, -0.02359771728515625, -0.020669937133789062, -0.017742156982421875, -0.014814376831054688, -0.0118865966796875, -0.008958816528320312, -0.006031036376953125, -0.0031032562255859375, -0.00017547607421875, 0.0027523040771484375, 0.005680084228515625, 0.008607864379882812, 0.01153564453125, 0.014463424682617188, 0.017391204833984375, 0.020318984985351562, 0.02324676513671875, 0.026174545288085938, 0.029102325439453125, 0.03203010559082031, 0.0349578857421875, 0.03788566589355469, 0.040813446044921875, 0.04374122619628906, 0.04666900634765625, 0.04959678649902344, 0.052524566650390625, 0.05545234680175781, 0.058380126953125, 0.06130790710449219, 0.06423568725585938, 0.06716346740722656, 0.07009124755859375, 0.07301902770996094, 0.07594680786132812, 0.07887458801269531, 0.0818023681640625, 0.08473014831542969, 0.08765792846679688, 0.09058570861816406, 0.09351348876953125, 0.09644126892089844, 0.09936904907226562, 0.10229682922363281, 0.105224609375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 4.0, 4.0, 4.0, 13.0, 11.0, 11.0, 14.0, 16.0, 22.0, 20.0, 22.0, 27.0, 19.0, 37.0, 36.0, 36.0, 46.0, 42.0, 40.0, 51.0, 64.0, 44.0, 42.0, 44.0, 34.0, 27.0, 26.0, 27.0, 29.0, 19.0, 28.0, 32.0, 21.0, 18.0, 10.0, 15.0, 9.0, 12.0, 4.0, 6.0, 6.0, 4.0, 6.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.01145172119140625, -0.01109921932220459, -0.01074671745300293, -0.01039421558380127, -0.01004171371459961, -0.00968921184539795, -0.009336709976196289, -0.008984208106994629, -0.008631706237792969, -0.008279204368591309, -0.007926702499389648, -0.007574200630187988, -0.007221698760986328, -0.006869196891784668, -0.006516695022583008, -0.006164193153381348, -0.0058116912841796875, -0.005459189414978027, -0.005106687545776367, -0.004754185676574707, -0.004401683807373047, -0.004049181938171387, -0.0036966800689697266, -0.0033441781997680664, -0.0029916763305664062, -0.002639174461364746, -0.002286672592163086, -0.0019341707229614258, -0.0015816688537597656, -0.0012291669845581055, -0.0008766651153564453, -0.0005241632461547852, -0.000171661376953125, 0.00018084049224853516, 0.0005333423614501953, 0.0008858442306518555, 0.0012383460998535156, 0.0015908479690551758, 0.001943349838256836, 0.002295851707458496, 0.0026483535766601562, 0.0030008554458618164, 0.0033533573150634766, 0.0037058591842651367, 0.004058361053466797, 0.004410862922668457, 0.004763364791870117, 0.005115866661071777, 0.0054683685302734375, 0.005820870399475098, 0.006173372268676758, 0.006525874137878418, 0.006878376007080078, 0.007230877876281738, 0.0075833797454833984, 0.007935881614685059, 0.008288383483886719, 0.008640885353088379, 0.008993387222290039, 0.0093458890914917, 0.00969839096069336, 0.01005089282989502, 0.01040339469909668, 0.01075589656829834, 0.0111083984375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 10.0, 14.0, 36.0, 89.0, 381.0, 8923.0, 1037235.0, 1554.0, 183.0, 57.0, 22.0, 11.0, 8.0, 5.0, 4.0, 1.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2335205078125, -0.2258167266845703, -0.21811294555664062, -0.21040916442871094, -0.20270538330078125, -0.19500160217285156, -0.18729782104492188, -0.1795940399169922, -0.1718902587890625, -0.1641864776611328, -0.15648269653320312, -0.14877891540527344, -0.14107513427734375, -0.13337135314941406, -0.12566757202148438, -0.11796379089355469, -0.110260009765625, -0.10255622863769531, -0.09485244750976562, -0.08714866638183594, -0.07944488525390625, -0.07174110412597656, -0.06403732299804688, -0.05633354187011719, -0.0486297607421875, -0.04092597961425781, -0.033222198486328125, -0.025518417358398438, -0.01781463623046875, -0.010110855102539062, -0.002407073974609375, 0.0052967071533203125, 0.01300048828125, 0.020704269409179688, 0.028408050537109375, 0.03611183166503906, 0.04381561279296875, 0.05151939392089844, 0.059223175048828125, 0.06692695617675781, 0.0746307373046875, 0.08233451843261719, 0.09003829956054688, 0.09774208068847656, 0.10544586181640625, 0.11314964294433594, 0.12085342407226562, 0.1285572052001953, 0.136260986328125, 0.1439647674560547, 0.15166854858398438, 0.15937232971191406, 0.16707611083984375, 0.17477989196777344, 0.18248367309570312, 0.1901874542236328, 0.1978912353515625, 0.2055950164794922, 0.21329879760742188, 0.22100257873535156, 0.22870635986328125, 0.23641014099121094, 0.24411392211914062, 0.2518177032470703, 0.259521484375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 6.0, 9.0, 6.0, 16.0, 20.0, 41.0, 74.0, 361.0, 295.0, 58.0, 33.0, 14.0, 14.0, 12.0, 12.0, 5.0, 7.0, 3.0, 4.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.0029010772705078125, -0.0028318464756011963, -0.00276261568069458, -0.002693384885787964, -0.0026241540908813477, -0.0025549232959747314, -0.0024856925010681152, -0.002416461706161499, -0.002347230911254883, -0.0022780001163482666, -0.0022087693214416504, -0.002139538526535034, -0.002070307731628418, -0.0020010769367218018, -0.0019318461418151855, -0.0018626153469085693, -0.0017933845520019531, -0.001724153757095337, -0.0016549229621887207, -0.0015856921672821045, -0.0015164613723754883, -0.001447230577468872, -0.0013779997825622559, -0.0013087689876556396, -0.0012395381927490234, -0.0011703073978424072, -0.001101076602935791, -0.0010318458080291748, -0.0009626150131225586, -0.0008933842182159424, -0.0008241534233093262, -0.00075492262840271, -0.0006856918334960938, -0.0006164610385894775, -0.0005472302436828613, -0.0004779994487762451, -0.0004087686538696289, -0.0003395378589630127, -0.0002703070640563965, -0.00020107626914978027, -0.00013184547424316406, -6.261467933654785e-05, 6.616115570068359e-06, 7.584691047668457e-05, 0.00014507770538330078, 0.000214308500289917, 0.0002835392951965332, 0.0003527700901031494, 0.0004220008850097656, 0.0004912316799163818, 0.000560462474822998, 0.0006296932697296143, 0.0006989240646362305, 0.0007681548595428467, 0.0008373856544494629, 0.0009066164493560791, 0.0009758472442626953, 0.0010450780391693115, 0.0011143088340759277, 0.001183539628982544, 0.0012527704238891602, 0.0013220012187957764, 0.0013912320137023926, 0.0014604628086090088, 0.001529693603515625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 12.0, 11.0, 19.0, 30.0, 34.0, 55.0, 85.0, 173.0, 319.0, 714.0, 2163.0, 9456.0, 95604.0, 884027.0, 46422.0, 6376.0, 1694.0, 645.0, 259.0, 178.0, 90.0, 72.0, 30.0, 28.0, 16.0, 14.0, 3.0, 5.0, 5.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.062225341796875, -0.06041574478149414, -0.05860614776611328, -0.05679655075073242, -0.05498695373535156, -0.0531773567199707, -0.051367759704589844, -0.049558162689208984, -0.047748565673828125, -0.045938968658447266, -0.044129371643066406, -0.04231977462768555, -0.04051017761230469, -0.03870058059692383, -0.03689098358154297, -0.03508138656616211, -0.03327178955078125, -0.03146219253540039, -0.02965259552001953, -0.027842998504638672, -0.026033401489257812, -0.024223804473876953, -0.022414207458496094, -0.020604610443115234, -0.018795013427734375, -0.016985416412353516, -0.015175819396972656, -0.013366222381591797, -0.011556625366210938, -0.009747028350830078, -0.007937431335449219, -0.006127834320068359, -0.0043182373046875, -0.0025086402893066406, -0.0006990432739257812, 0.0011105537414550781, 0.0029201507568359375, 0.004729747772216797, 0.006539344787597656, 0.008348941802978516, 0.010158538818359375, 0.011968135833740234, 0.013777732849121094, 0.015587329864501953, 0.017396926879882812, 0.019206523895263672, 0.02101612091064453, 0.02282571792602539, 0.02463531494140625, 0.02644491195678711, 0.02825450897216797, 0.030064105987548828, 0.03187370300292969, 0.03368330001831055, 0.035492897033691406, 0.037302494049072266, 0.039112091064453125, 0.040921688079833984, 0.042731285095214844, 0.0445408821105957, 0.04635047912597656, 0.04816007614135742, 0.04996967315673828, 0.05177927017211914, 0.0535888671875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 7.0, 5.0, 5.0, 4.0, 5.0, 6.0, 13.0, 15.0, 21.0, 21.0, 41.0, 69.0, 95.0, 136.0, 153.0, 139.0, 93.0, 61.0, 38.0, 18.0, 15.0, 14.0, 13.0, 7.0, 5.0, 5.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01352691650390625, -0.012825369834899902, -0.012123823165893555, -0.011422276496887207, -0.01072072982788086, -0.010019183158874512, -0.009317636489868164, -0.008616089820861816, -0.007914543151855469, -0.007212996482849121, -0.0065114498138427734, -0.005809903144836426, -0.005108356475830078, -0.0044068098068237305, -0.003705263137817383, -0.003003716468811035, -0.0023021697998046875, -0.0016006231307983398, -0.0008990764617919922, -0.00019752979278564453, 0.0005040168762207031, 0.0012055635452270508, 0.0019071102142333984, 0.002608656883239746, 0.0033102035522460938, 0.004011750221252441, 0.004713296890258789, 0.005414843559265137, 0.006116390228271484, 0.006817936897277832, 0.00751948356628418, 0.008221030235290527, 0.008922576904296875, 0.009624123573303223, 0.01032567024230957, 0.011027216911315918, 0.011728763580322266, 0.012430310249328613, 0.013131856918334961, 0.013833403587341309, 0.014534950256347656, 0.015236496925354004, 0.01593804359436035, 0.0166395902633667, 0.017341136932373047, 0.018042683601379395, 0.018744230270385742, 0.01944577693939209, 0.020147323608398438, 0.020848870277404785, 0.021550416946411133, 0.02225196361541748, 0.022953510284423828, 0.023655056953430176, 0.024356603622436523, 0.02505815029144287, 0.02575969696044922, 0.026461243629455566, 0.027162790298461914, 0.02786433696746826, 0.02856588363647461, 0.029267430305480957, 0.029968976974487305, 0.030670523643493652, 0.0313720703125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 8.0, 10.0, 16.0, 43.0, 88.0, 184.0, 261.0, 211.0, 98.0, 31.0, 19.0, 11.0, 9.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19143696129322052, -0.1858953833580017, -0.1803537905216217, -0.1748121976852417, -0.1692706197500229, -0.16372904181480408, -0.15818744897842407, -0.15264585614204407, -0.14710427820682526, -0.14156270027160645, -0.13602110743522644, -0.13047951459884644, -0.12493793666362762, -0.11939635127782822, -0.11385476589202881, -0.1083131805062294, -0.10277159512042999, -0.09723000973463058, -0.09168842434883118, -0.08614683896303177, -0.08060525357723236, -0.07506366819143295, -0.06952208280563354, -0.06398049741983414, -0.05843891203403473, -0.05289732664823532, -0.04735574126243591, -0.041814155876636505, -0.0362725704908371, -0.03073098510503769, -0.02518939971923828, -0.019647814333438873, -0.01410624384880066, -0.008564658463001251, -0.0030230730772018433, 0.0025185123085975647, 0.008060097694396973, 0.01360168308019638, 0.01914326846599579, 0.024684853851795197, 0.030226439237594604, 0.03576802462339401, 0.04130961000919342, 0.04685119539499283, 0.052392780780792236, 0.057934366166591644, 0.06347595155239105, 0.06901753693819046, 0.07455912232398987, 0.08010070770978928, 0.08564229309558868, 0.09118387848138809, 0.0967254638671875, 0.10226704925298691, 0.10780863463878632, 0.11335022002458572, 0.11889180541038513, 0.12443339079618454, 0.12997497618198395, 0.13551655411720276, 0.14105814695358276, 0.14659973978996277, 0.15214131772518158, 0.1576828956604004, 0.1632244884967804]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 2.0, 3.0, 7.0, 4.0, 16.0, 19.0, 26.0, 34.0, 55.0, 100.0, 86.0, 130.0, 131.0, 93.0, 87.0, 70.0, 36.0, 38.0, 24.0, 16.0, 7.0, 6.0, 7.0, 4.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22065919637680054, -0.2150178849697113, -0.20937658846378326, -0.20373529195785522, -0.198093980550766, -0.19245266914367676, -0.18681137263774872, -0.18117007613182068, -0.17552876472473145, -0.1698874533176422, -0.16424615681171417, -0.15860486030578613, -0.1529635488986969, -0.14732223749160767, -0.14168094098567963, -0.1360396444797516, -0.13039833307266235, -0.12475702911615372, -0.11911572515964508, -0.11347442120313644, -0.10783311724662781, -0.10219181329011917, -0.09655050933361053, -0.0909092053771019, -0.08526790142059326, -0.07962659746408463, -0.07398529350757599, -0.06834398955106735, -0.06270268559455872, -0.05706138163805008, -0.05142007768154144, -0.045778773725032806, -0.04013746976852417, -0.03449616581201553, -0.028854861855506897, -0.02321355789899826, -0.017572253942489624, -0.011930949985980988, -0.006289646029472351, -0.0006483420729637146, 0.004992961883544922, 0.010634265840053558, 0.016275569796562195, 0.02191687375307083, 0.027558177709579468, 0.033199481666088104, 0.03884078562259674, 0.04448208957910538, 0.050123393535614014, 0.05576469749212265, 0.06140600144863129, 0.06704730540513992, 0.07268860936164856, 0.0783299133181572, 0.08397121727466583, 0.08961252123117447, 0.0952538251876831, 0.10089512914419174, 0.10653643310070038, 0.11217773705720901, 0.11781904101371765, 0.12346034497022629, 0.12910164892673492, 0.13474294543266296, 0.1403842568397522]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 6.0, 0.0, 2.0, 6.0, 0.0, 4.0, 6.0, 6.0, 8.0, 10.0, 6.0, 4.0, 8.0, 6.0, 14.0, 8.0, 16.0, 6.0, 16.0, 23.0, 43.0, 212.0, 26896.0, 4166108.0, 612.0, 70.0, 35.0, 17.0, 26.0, 20.0, 18.0, 11.0, 13.0, 10.0, 8.0, 8.0, 10.0, 6.0, 2.0, 6.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-0.67822265625, -0.6604537963867188, -0.6426849365234375, -0.6249160766601562, -0.607147216796875, -0.5893783569335938, -0.5716094970703125, -0.5538406372070312, -0.53607177734375, -0.5183029174804688, -0.5005340576171875, -0.48276519775390625, -0.464996337890625, -0.44722747802734375, -0.4294586181640625, -0.41168975830078125, -0.3939208984375, -0.37615203857421875, -0.3583831787109375, -0.34061431884765625, -0.322845458984375, -0.30507659912109375, -0.2873077392578125, -0.26953887939453125, -0.25177001953125, -0.23400115966796875, -0.2162322998046875, -0.19846343994140625, -0.180694580078125, -0.16292572021484375, -0.1451568603515625, -0.12738800048828125, -0.109619140625, -0.09185028076171875, -0.0740814208984375, -0.05631256103515625, -0.038543701171875, -0.02077484130859375, -0.0030059814453125, 0.01476287841796875, 0.03253173828125, 0.05030059814453125, 0.0680694580078125, 0.08583831787109375, 0.103607177734375, 0.12137603759765625, 0.1391448974609375, 0.15691375732421875, 0.1746826171875, 0.19245147705078125, 0.2102203369140625, 0.22798919677734375, 0.245758056640625, 0.26352691650390625, 0.2812957763671875, 0.29906463623046875, 0.31683349609375, 0.33460235595703125, 0.3523712158203125, 0.37014007568359375, 0.387908935546875, 0.40567779541015625, 0.4234466552734375, 0.44121551513671875, 0.458984375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 2.0, 5.0, 11.0, 8.0, 10.0, 17.0, 25.0, 57.0, 91.0, 115.0, 142.0, 145.0, 107.0, 77.0, 61.0, 30.0, 26.0, 17.0, 18.0, 15.0, 3.0, 7.0, 3.0, 7.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003326416015625, -0.003219783306121826, -0.0031131505966186523, -0.0030065178871154785, -0.0028998851776123047, -0.002793252468109131, -0.002686619758605957, -0.002579987049102783, -0.0024733543395996094, -0.0023667216300964355, -0.0022600889205932617, -0.002153456211090088, -0.002046823501586914, -0.0019401907920837402, -0.0018335580825805664, -0.0017269253730773926, -0.0016202926635742188, -0.001513659954071045, -0.001407027244567871, -0.0013003945350646973, -0.0011937618255615234, -0.0010871291160583496, -0.0009804964065551758, -0.000873863697052002, -0.0007672309875488281, -0.0006605982780456543, -0.0005539655685424805, -0.00044733285903930664, -0.0003407001495361328, -0.00023406744003295898, -0.00012743473052978516, -2.0802021026611328e-05, 8.58306884765625e-05, 0.00019246339797973633, 0.00029909610748291016, 0.000405728816986084, 0.0005123615264892578, 0.0006189942359924316, 0.0007256269454956055, 0.0008322596549987793, 0.0009388923645019531, 0.001045525074005127, 0.0011521577835083008, 0.0012587904930114746, 0.0013654232025146484, 0.0014720559120178223, 0.001578688621520996, 0.00168532133102417, 0.0017919540405273438, 0.0018985867500305176, 0.0020052194595336914, 0.0021118521690368652, 0.002218484878540039, 0.002325117588043213, 0.0024317502975463867, 0.0025383830070495605, 0.0026450157165527344, 0.002751648426055908, 0.002858281135559082, 0.002964913845062256, 0.0030715465545654297, 0.0031781792640686035, 0.0032848119735717773, 0.003391444683074951, 0.003498077392578125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 9.0, 8.0, 18.0, 9.0, 28.0, 35.0, 61.0, 80.0, 121.0, 188.0, 223.0, 570.0, 3211691.0, 979834.0, 574.0, 215.0, 147.0, 143.0, 118.0, 64.0, 52.0, 45.0, 12.0, 17.0, 7.0, 7.0, 3.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.208740234375, -0.19879150390625, -0.1888427734375, -0.17889404296875, -0.1689453125, -0.15899658203125, -0.1490478515625, -0.13909912109375, -0.129150390625, -0.11920166015625, -0.1092529296875, -0.09930419921875, -0.08935546875, -0.07940673828125, -0.0694580078125, -0.05950927734375, -0.049560546875, -0.03961181640625, -0.0296630859375, -0.01971435546875, -0.009765625, 0.00018310546875, 0.0101318359375, 0.02008056640625, 0.030029296875, 0.03997802734375, 0.0499267578125, 0.05987548828125, 0.06982421875, 0.07977294921875, 0.0897216796875, 0.09967041015625, 0.109619140625, 0.11956787109375, 0.1295166015625, 0.13946533203125, 0.1494140625, 0.15936279296875, 0.1693115234375, 0.17926025390625, 0.189208984375, 0.19915771484375, 0.2091064453125, 0.21905517578125, 0.22900390625, 0.23895263671875, 0.2489013671875, 0.25885009765625, 0.268798828125, 0.27874755859375, 0.2886962890625, 0.29864501953125, 0.30859375, 0.31854248046875, 0.3284912109375, 0.33843994140625, 0.348388671875, 0.35833740234375, 0.3682861328125, 0.37823486328125, 0.38818359375, 0.39813232421875, 0.4080810546875, 0.41802978515625, 0.427978515625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 5.0, 7.0, 33.0, 125.0, 2498.0, 1295.0, 88.0, 32.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.005390167236328125, -0.0044800639152526855, -0.003569960594177246, -0.0026598572731018066, -0.0017497539520263672, -0.0008396506309509277, 7.045269012451172e-05, 0.0009805560111999512, 0.0018906593322753906, 0.00280076265335083, 0.0037108659744262695, 0.004620969295501709, 0.0055310726165771484, 0.006441175937652588, 0.007351279258728027, 0.008261382579803467, 0.009171485900878906, 0.010081589221954346, 0.010991692543029785, 0.011901795864105225, 0.012811899185180664, 0.013722002506256104, 0.014632105827331543, 0.015542209148406982, 0.016452312469482422, 0.01736241579055786, 0.0182725191116333, 0.01918262243270874, 0.02009272575378418, 0.02100282907485962, 0.02191293239593506, 0.022823035717010498, 0.023733139038085938, 0.024643242359161377, 0.025553345680236816, 0.026463449001312256, 0.027373552322387695, 0.028283655643463135, 0.029193758964538574, 0.030103862285614014, 0.031013965606689453, 0.03192406892776489, 0.03283417224884033, 0.03374427556991577, 0.03465437889099121, 0.03556448221206665, 0.03647458553314209, 0.03738468885421753, 0.03829479217529297, 0.03920489549636841, 0.04011499881744385, 0.04102510213851929, 0.04193520545959473, 0.042845308780670166, 0.043755412101745605, 0.044665515422821045, 0.045575618743896484, 0.046485722064971924, 0.04739582538604736, 0.0483059287071228, 0.04921603202819824, 0.05012613534927368, 0.05103623867034912, 0.05194634199142456, 0.0528564453125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 8.0, 26.0, 119.0, 649.0, 176.0, 18.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5053959488868713, -0.48323574662208557, -0.4610755145549774, -0.43891531229019165, -0.4167550802230835, -0.39459487795829773, -0.37243467569351196, -0.3502744436264038, -0.32811424136161804, -0.3059540390968323, -0.2837938070297241, -0.26163360476493835, -0.2394733875989914, -0.21731317043304443, -0.19515296816825867, -0.1729927510023117, -0.15083253383636475, -0.12867231667041779, -0.10651210695505142, -0.08435189723968506, -0.0621916800737381, -0.04003146290779114, -0.01787126064300537, 0.004288956522941589, 0.02644917368888855, 0.04860938712954521, 0.07076960057020187, 0.09292981028556824, 0.1150900274515152, 0.13725024461746216, 0.15941044688224792, 0.18157066404819489, 0.20373082160949707, 0.22589103877544403, 0.248051255941391, 0.27021145820617676, 0.2923716902732849, 0.3145318925380707, 0.33669209480285645, 0.3588523268699646, 0.38101252913475037, 0.40317273139953613, 0.4253329634666443, 0.44749316573143005, 0.4696533679962158, 0.491813600063324, 0.5139738321304321, 0.5361340045928955, 0.5582942366600037, 0.5804544687271118, 0.6026146411895752, 0.6247748732566833, 0.6469351053237915, 0.6690952777862549, 0.691255509853363, 0.7134157419204712, 0.7355759143829346, 0.7577361464500427, 0.7798963189125061, 0.8020565509796143, 0.8242167830467224, 0.8463770151138306, 0.868537187576294, 0.8906974196434021, 0.9128576517105103]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 12.0, 27.0, 89.0, 165.0, 271.0, 231.0, 130.0, 59.0, 23.0, 3.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22550296783447266, -0.20513667166233063, -0.1847703754901886, -0.16440406441688538, -0.14403776824474335, -0.12367147207260132, -0.10330516844987869, -0.08293886482715607, -0.06257256865501404, -0.04220626875758171, -0.021839968860149384, -0.0014736689627170563, 0.01889263093471527, 0.0392589271068573, 0.059625230729579926, 0.07999153435230255, 0.10035783052444458, 0.12072412669658661, 0.14109042286872864, 0.16145673394203186, 0.1818230301141739, 0.20218932628631592, 0.22255563735961914, 0.24292193353176117, 0.2632882297039032, 0.2836545407772064, 0.30402082204818726, 0.3243871331214905, 0.3447534441947937, 0.36511972546577454, 0.38548603653907776, 0.4058523178100586, 0.4262186288833618, 0.44658493995666504, 0.4669512212276459, 0.4873175323009491, 0.5076838135719299, 0.5280501246452332, 0.5484164357185364, 0.5687827467918396, 0.589148998260498, 0.6095153093338013, 0.6298816204071045, 0.6502478718757629, 0.6706141829490662, 0.6909804940223694, 0.7113468050956726, 0.7317131161689758, 0.752079427242279, 0.7724457383155823, 0.7928120493888855, 0.813178300857544, 0.8335446119308472, 0.8539109230041504, 0.8742772340774536, 0.8946435451507568, 0.9150098562240601, 0.9353761672973633, 0.9557424783706665, 0.976108729839325, 0.9964750409126282, 1.0168414115905762, 1.0372076034545898, 1.057573914527893, 1.0779402256011963]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 8.0, 7.0, 6.0, 6.0, 8.0, 10.0, 16.0, 19.0, 23.0, 30.0, 33.0, 39.0, 50.0, 46.0, 52.0, 57.0, 90.0, 1047111.0, 533.0, 64.0, 69.0, 55.0, 38.0, 35.0, 23.0, 28.0, 13.0, 17.0, 16.0, 10.0, 10.0, 10.0, 4.0, 3.0, 3.0, 5.0, 4.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.17578125, -2.1163482666015625, -2.056915283203125, -1.9974822998046875, -1.93804931640625, -1.8786163330078125, -1.819183349609375, -1.7597503662109375, -1.7003173828125, -1.6408843994140625, -1.581451416015625, -1.5220184326171875, -1.46258544921875, -1.4031524658203125, -1.343719482421875, -1.2842864990234375, -1.224853515625, -1.1654205322265625, -1.105987548828125, -1.0465545654296875, -0.98712158203125, -0.9276885986328125, -0.868255615234375, -0.8088226318359375, -0.7493896484375, -0.6899566650390625, -0.630523681640625, -0.5710906982421875, -0.51165771484375, -0.4522247314453125, -0.392791748046875, -0.3333587646484375, -0.27392578125, -0.2144927978515625, -0.155059814453125, -0.0956268310546875, -0.03619384765625, 0.0232391357421875, 0.082672119140625, 0.1421051025390625, 0.2015380859375, 0.2609710693359375, 0.320404052734375, 0.3798370361328125, 0.43927001953125, 0.4987030029296875, 0.558135986328125, 0.6175689697265625, 0.677001953125, 0.7364349365234375, 0.795867919921875, 0.8553009033203125, 0.91473388671875, 0.9741668701171875, 1.033599853515625, 1.0930328369140625, 1.1524658203125, 1.2118988037109375, 1.271331787109375, 1.3307647705078125, 1.39019775390625, 1.4496307373046875, 1.509063720703125, 1.5684967041015625, 1.6279296875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [50.0, 766.0, 202.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00855255126953125, -0.0037001371383666992, 0.0011522769927978516, 0.006004691123962402, 0.010857105255126953, 0.015709519386291504, 0.020561933517456055, 0.025414347648620605, 0.030266761779785156, 0.03511917591094971, 0.03997159004211426, 0.04482400417327881, 0.04967641830444336, 0.05452883243560791, 0.05938124656677246, 0.06423366069793701, 0.06908607482910156, 0.07393848896026611, 0.07879090309143066, 0.08364331722259521, 0.08849573135375977, 0.09334814548492432, 0.09820055961608887, 0.10305297374725342, 0.10790538787841797, 0.11275780200958252, 0.11761021614074707, 0.12246263027191162, 0.12731504440307617, 0.13216745853424072, 0.13701987266540527, 0.14187228679656982, 0.14672470092773438, 0.15157711505889893, 0.15642952919006348, 0.16128194332122803, 0.16613435745239258, 0.17098677158355713, 0.17583918571472168, 0.18069159984588623, 0.18554401397705078, 0.19039642810821533, 0.19524884223937988, 0.20010125637054443, 0.20495367050170898, 0.20980608463287354, 0.21465849876403809, 0.21951091289520264, 0.2243633270263672, 0.22921574115753174, 0.2340681552886963, 0.23892056941986084, 0.2437729835510254, 0.24862539768218994, 0.2534778118133545, 0.25833022594451904, 0.2631826400756836, 0.26803505420684814, 0.2728874683380127, 0.27773988246917725, 0.2825922966003418, 0.28744471073150635, 0.2922971248626709, 0.29714953899383545, 0.302001953125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 6.0, 4.0, 4.0, 5.0, 14.0, 10.0, 18.0, 23.0, 35.0, 55.0, 76.0, 139.0, 198.0, 323.0, 597.0, 1113.0, 2408.0, 5776.0, 17418.0, 65934.0, 572492.0, 310921.0, 48234.0, 13458.0, 4809.0, 2074.0, 1026.0, 559.0, 280.0, 176.0, 99.0, 80.0, 61.0, 41.0, 24.0, 20.0, 15.0, 11.0, 5.0, 3.0, 5.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.323974609375, -0.31412506103515625, -0.3042755126953125, -0.29442596435546875, -0.284576416015625, -0.27472686767578125, -0.2648773193359375, -0.25502777099609375, -0.24517822265625, -0.23532867431640625, -0.2254791259765625, -0.21562957763671875, -0.205780029296875, -0.19593048095703125, -0.1860809326171875, -0.17623138427734375, -0.1663818359375, -0.15653228759765625, -0.1466827392578125, -0.13683319091796875, -0.126983642578125, -0.11713409423828125, -0.1072845458984375, -0.09743499755859375, -0.08758544921875, -0.07773590087890625, -0.0678863525390625, -0.05803680419921875, -0.048187255859375, -0.03833770751953125, -0.0284881591796875, -0.01863861083984375, -0.0087890625, 0.00106048583984375, 0.0109100341796875, 0.02075958251953125, 0.030609130859375, 0.04045867919921875, 0.0503082275390625, 0.06015777587890625, 0.07000732421875, 0.07985687255859375, 0.0897064208984375, 0.09955596923828125, 0.109405517578125, 0.11925506591796875, 0.1291046142578125, 0.13895416259765625, 0.1488037109375, 0.15865325927734375, 0.1685028076171875, 0.17835235595703125, 0.188201904296875, 0.19805145263671875, 0.2079010009765625, 0.21775054931640625, 0.22760009765625, 0.23744964599609375, 0.2472991943359375, 0.25714874267578125, 0.266998291015625, 0.27684783935546875, 0.2866973876953125, 0.29654693603515625, 0.306396484375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 4.0, 8.0, 12.0, 15.0, 15.0, 18.0, 36.0, 36.0, 29.0, 40.0, 65.0, 85.0, 69.0, 68.0, 76.0, 68.0, 56.0, 59.0, 44.0, 44.0, 40.0, 20.0, 13.0, 19.0, 8.0, 12.0, 10.0, 8.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.263916015625, -0.25655364990234375, -0.2491912841796875, -0.24182891845703125, -0.234466552734375, -0.22710418701171875, -0.2197418212890625, -0.21237945556640625, -0.20501708984375, -0.19765472412109375, -0.1902923583984375, -0.18292999267578125, -0.175567626953125, -0.16820526123046875, -0.1608428955078125, -0.15348052978515625, -0.1461181640625, -0.13875579833984375, -0.1313934326171875, -0.12403106689453125, -0.116668701171875, -0.10930633544921875, -0.1019439697265625, -0.09458160400390625, -0.08721923828125, -0.07985687255859375, -0.0724945068359375, -0.06513214111328125, -0.057769775390625, -0.05040740966796875, -0.0430450439453125, -0.03568267822265625, -0.0283203125, -0.02095794677734375, -0.0135955810546875, -0.00623321533203125, 0.001129150390625, 0.00849151611328125, 0.0158538818359375, 0.02321624755859375, 0.03057861328125, 0.03794097900390625, 0.0453033447265625, 0.05266571044921875, 0.060028076171875, 0.06739044189453125, 0.0747528076171875, 0.08211517333984375, 0.0894775390625, 0.09683990478515625, 0.1042022705078125, 0.11156463623046875, 0.118927001953125, 0.12628936767578125, 0.1336517333984375, 0.14101409912109375, 0.14837646484375, 0.15573883056640625, 0.1631011962890625, 0.17046356201171875, 0.177825927734375, 0.18518829345703125, 0.1925506591796875, 0.19991302490234375, 0.207275390625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 3.0, 7.0, 6.0, 9.0, 22.0, 24.0, 37.0, 52.0, 85.0, 150.0, 271.0, 475.0, 1108.0, 3399.0, 15940.0, 245110.0, 739376.0, 33891.0, 5539.0, 1521.0, 663.0, 312.0, 195.0, 101.0, 80.0, 50.0, 31.0, 24.0, 18.0, 13.0, 10.0, 4.0, 5.0, 1.0, 5.0, 1.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.327880859375, -0.3176918029785156, -0.30750274658203125, -0.2973136901855469, -0.2871246337890625, -0.2769355773925781, -0.26674652099609375, -0.2565574645996094, -0.246368408203125, -0.23617935180664062, -0.22599029541015625, -0.21580123901367188, -0.2056121826171875, -0.19542312622070312, -0.18523406982421875, -0.17504501342773438, -0.16485595703125, -0.15466690063476562, -0.14447784423828125, -0.13428878784179688, -0.1240997314453125, -0.11391067504882812, -0.10372161865234375, -0.09353256225585938, -0.083343505859375, -0.07315444946289062, -0.06296539306640625, -0.052776336669921875, -0.0425872802734375, -0.032398223876953125, -0.02220916748046875, -0.012020111083984375, -0.0018310546875, 0.008358001708984375, 0.01854705810546875, 0.028736114501953125, 0.0389251708984375, 0.049114227294921875, 0.05930328369140625, 0.06949234008789062, 0.079681396484375, 0.08987045288085938, 0.10005950927734375, 0.11024856567382812, 0.1204376220703125, 0.13062667846679688, 0.14081573486328125, 0.15100479125976562, 0.16119384765625, 0.17138290405273438, 0.18157196044921875, 0.19176101684570312, 0.2019500732421875, 0.21213912963867188, 0.22232818603515625, 0.23251724243164062, 0.242706298828125, 0.2528953552246094, 0.26308441162109375, 0.2732734680175781, 0.2834625244140625, 0.2936515808105469, 0.30384063720703125, 0.3140296936035156, 0.32421875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 2.0, 4.0, 10.0, 3.0, 6.0, 5.0, 7.0, 7.0, 12.0, 18.0, 20.0, 25.0, 47.0, 66.0, 96.0, 140.0, 149.0, 93.0, 76.0, 58.0, 49.0, 20.0, 19.0, 14.0, 7.0, 8.0, 11.0, 6.0, 6.0, 6.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0002460479736328125, -0.00023922696709632874, -0.00023240596055984497, -0.0002255849540233612, -0.00021876394748687744, -0.00021194294095039368, -0.0002051219344139099, -0.00019830092787742615, -0.00019147992134094238, -0.00018465891480445862, -0.00017783790826797485, -0.0001710169017314911, -0.00016419589519500732, -0.00015737488865852356, -0.0001505538821220398, -0.00014373287558555603, -0.00013691186904907227, -0.0001300908625125885, -0.00012326985597610474, -0.00011644884943962097, -0.00010962784290313721, -0.00010280683636665344, -9.598582983016968e-05, -8.916482329368591e-05, -8.234381675720215e-05, -7.552281022071838e-05, -6.870180368423462e-05, -6.188079714775085e-05, -5.505979061126709e-05, -4.8238784074783325e-05, -4.141777753829956e-05, -3.4596771001815796e-05, -2.777576446533203e-05, -2.0954757928848267e-05, -1.4133751392364502e-05, -7.312744855880737e-06, -4.917383193969727e-07, 6.329268217086792e-06, 1.3150274753570557e-05, 1.997128129005432e-05, 2.6792287826538086e-05, 3.361329436302185e-05, 4.0434300899505615e-05, 4.725530743598938e-05, 5.4076313972473145e-05, 6.089732050895691e-05, 6.771832704544067e-05, 7.453933358192444e-05, 8.13603401184082e-05, 8.818134665489197e-05, 9.500235319137573e-05, 0.0001018233597278595, 0.00010864436626434326, 0.00011546537280082703, 0.0001222863793373108, 0.00012910738587379456, 0.00013592839241027832, 0.00014274939894676208, 0.00014957040548324585, 0.00015639141201972961, 0.00016321241855621338, 0.00017003342509269714, 0.0001768544316291809, 0.00018367543816566467, 0.00019049644470214844]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 3.0, 5.0, 5.0, 7.0, 14.0, 18.0, 39.0, 31.0, 56.0, 89.0, 146.0, 254.0, 515.0, 955.0, 2237.0, 5823.0, 22359.0, 576117.0, 410045.0, 20160.0, 5572.0, 2102.0, 929.0, 446.0, 239.0, 139.0, 73.0, 59.0, 31.0, 22.0, 19.0, 6.0, 12.0, 7.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.50830078125, -0.4941673278808594, -0.48003387451171875, -0.4659004211425781, -0.4517669677734375, -0.4376335144042969, -0.42350006103515625, -0.4093666076660156, -0.395233154296875, -0.3810997009277344, -0.36696624755859375, -0.3528327941894531, -0.3386993408203125, -0.3245658874511719, -0.31043243408203125, -0.2962989807128906, -0.28216552734375, -0.2680320739746094, -0.25389862060546875, -0.23976516723632812, -0.2256317138671875, -0.21149826049804688, -0.19736480712890625, -0.18323135375976562, -0.169097900390625, -0.15496444702148438, -0.14083099365234375, -0.12669754028320312, -0.1125640869140625, -0.09843063354492188, -0.08429718017578125, -0.07016372680664062, -0.0560302734375, -0.041896820068359375, -0.02776336669921875, -0.013629913330078125, 0.0005035400390625, 0.014636993408203125, 0.02877044677734375, 0.042903900146484375, 0.057037353515625, 0.07117080688476562, 0.08530426025390625, 0.09943771362304688, 0.1135711669921875, 0.12770462036132812, 0.14183807373046875, 0.15597152709960938, 0.17010498046875, 0.18423843383789062, 0.19837188720703125, 0.21250534057617188, 0.2266387939453125, 0.24077224731445312, 0.25490570068359375, 0.2690391540527344, 0.283172607421875, 0.2973060607910156, 0.31143951416015625, 0.3255729675292969, 0.3397064208984375, 0.3538398742675781, 0.36797332763671875, 0.3821067810058594, 0.396240234375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 11.0, 6.0, 12.0, 15.0, 22.0, 34.0, 71.0, 248.0, 297.0, 130.0, 50.0, 25.0, 16.0, 11.0, 9.0, 6.0, 4.0, 7.0, 3.0, 5.0, 5.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.286376953125, -0.27925682067871094, -0.2721366882324219, -0.2650165557861328, -0.25789642333984375, -0.2507762908935547, -0.24365615844726562, -0.23653602600097656, -0.2294158935546875, -0.22229576110839844, -0.21517562866210938, -0.2080554962158203, -0.20093536376953125, -0.1938152313232422, -0.18669509887695312, -0.17957496643066406, -0.172454833984375, -0.16533470153808594, -0.15821456909179688, -0.1510944366455078, -0.14397430419921875, -0.1368541717529297, -0.12973403930664062, -0.12261390686035156, -0.1154937744140625, -0.10837364196777344, -0.10125350952148438, -0.09413337707519531, -0.08701324462890625, -0.07989311218261719, -0.07277297973632812, -0.06565284729003906, -0.05853271484375, -0.05141258239746094, -0.044292449951171875, -0.03717231750488281, -0.03005218505859375, -0.022932052612304688, -0.015811920166015625, -0.008691787719726562, -0.0015716552734375, 0.0055484771728515625, 0.012668609619140625, 0.019788742065429688, 0.02690887451171875, 0.03402900695800781, 0.041149139404296875, 0.04826927185058594, 0.055389404296875, 0.06250953674316406, 0.06962966918945312, 0.07674980163574219, 0.08386993408203125, 0.09099006652832031, 0.09811019897460938, 0.10523033142089844, 0.1123504638671875, 0.11947059631347656, 0.12659072875976562, 0.1337108612060547, 0.14083099365234375, 0.1479511260986328, 0.15507125854492188, 0.16219139099121094, 0.1693115234375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 11.0, 19.0, 42.0, 83.0, 315.0, 418.0, 90.0, 17.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.587178945541382, -2.4654762744903564, -2.343773603439331, -2.2220709323883057, -2.1003682613372803, -1.9786655902862549, -1.8569629192352295, -1.735260248184204, -1.6135575771331787, -1.4918549060821533, -1.370152235031128, -1.2484495639801025, -1.1267468929290771, -1.0050442218780518, -0.8833415508270264, -0.761638879776001, -0.6399362087249756, -0.5182335376739502, -0.3965308666229248, -0.2748281955718994, -0.15312552452087402, -0.03142285346984863, 0.09027981758117676, 0.21198248863220215, 0.33368515968322754, 0.45538783073425293, 0.5770905017852783, 0.6987931728363037, 0.8204958438873291, 0.9421985149383545, 1.0639011859893799, 1.1856038570404053, 1.3073062896728516, 1.429008960723877, 1.5507116317749023, 1.6724143028259277, 1.7941169738769531, 1.9158196449279785, 2.037522315979004, 2.1592249870300293, 2.2809276580810547, 2.40263032913208, 2.5243330001831055, 2.646035671234131, 2.7677383422851562, 2.8894410133361816, 3.011143684387207, 3.1328463554382324, 3.254549026489258, 3.376251697540283, 3.4979543685913086, 3.619657039642334, 3.7413597106933594, 3.8630623817443848, 3.98476505279541, 4.1064677238464355, 4.228170394897461, 4.349873065948486, 4.471575736999512, 4.593278408050537, 4.7149810791015625, 4.836683750152588, 4.958386421203613, 5.080089092254639, 5.201791763305664]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 7.0, 4.0, 13.0, 14.0, 12.0, 33.0, 30.0, 38.0, 45.0, 76.0, 83.0, 70.0, 85.0, 83.0, 71.0, 59.0, 64.0, 48.0, 44.0, 41.0, 29.0, 21.0, 14.0, 8.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0924594402313232, -1.035036563873291, -0.977613627910614, -0.920190691947937, -0.8627678155899048, -0.8053449392318726, -0.7479220032691956, -0.6904990673065186, -0.6330761909484863, -0.5756533145904541, -0.5182303786277771, -0.4608074724674225, -0.40338456630706787, -0.34596166014671326, -0.28853875398635864, -0.23111584782600403, -0.17369294166564941, -0.1162700355052948, -0.058847129344940186, -0.0014242231845855713, 0.05599868297576904, 0.11342158913612366, 0.17084449529647827, 0.22826740145683289, 0.2856903076171875, 0.3431132137775421, 0.40053611993789673, 0.45795902609825134, 0.515381932258606, 0.5728048086166382, 0.6302277445793152, 0.6876506805419922, 0.7450735569000244, 0.8024964332580566, 0.8599193692207336, 0.9173423051834106, 0.9747651815414429, 1.032188057899475, 1.0896110534667969, 1.147033929824829, 1.2044568061828613, 1.2618796825408936, 1.3193025588989258, 1.3767255544662476, 1.4341484308242798, 1.491571307182312, 1.5489943027496338, 1.606417179107666, 1.6638400554656982, 1.7212629318237305, 1.7786858081817627, 1.8361088037490845, 1.8935316801071167, 1.950954556465149, 2.0083775520324707, 2.065800428390503, 2.123223304748535, 2.1806461811065674, 2.2380690574645996, 2.295491933822632, 2.352914810180664, 2.4103379249572754, 2.4677608013153076, 2.52518367767334, 2.582606554031372]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 35.0, 134.0, 13743.0, 4179190.0, 596.0, 237.0, 119.0, 92.0, 60.0, 36.0, 18.0, 21.0, 8.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89111328125, -0.6778488159179688, -0.4645843505859375, -0.25131988525390625, -0.038055419921875, 0.17520904541015625, 0.3884735107421875, 0.6017379760742188, 0.81500244140625, 1.0282669067382812, 1.2415313720703125, 1.4547958374023438, 1.668060302734375, 1.8813247680664062, 2.0945892333984375, 2.3078536987304688, 2.5211181640625, 2.7343826293945312, 2.9476470947265625, 3.1609115600585938, 3.374176025390625, 3.5874404907226562, 3.8007049560546875, 4.013969421386719, 4.22723388671875, 4.440498352050781, 4.6537628173828125, 4.867027282714844, 5.080291748046875, 5.293556213378906, 5.5068206787109375, 5.720085144042969, 5.933349609375, 6.146614074707031, 6.3598785400390625, 6.573143005371094, 6.786407470703125, 6.999671936035156, 7.2129364013671875, 7.426200866699219, 7.63946533203125, 7.852729797363281, 8.065994262695312, 8.279258728027344, 8.492523193359375, 8.705787658691406, 8.919052124023438, 9.132316589355469, 9.3455810546875, 9.558845520019531, 9.772109985351562, 9.985374450683594, 10.198638916015625, 10.411903381347656, 10.625167846679688, 10.838432312011719, 11.05169677734375, 11.264961242675781, 11.478225708007812, 11.691490173339844, 11.904754638671875, 12.118019104003906, 12.331283569335938, 12.544548034667969, 12.7578125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [4.0, 27.0, 104.0, 298.0, 351.0, 177.0, 48.0, 11.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.023223876953125, -0.017798900604248047, -0.012373924255371094, -0.006948947906494141, -0.0015239715576171875, 0.0039010047912597656, 0.009325981140136719, 0.014750957489013672, 0.020175933837890625, 0.025600910186767578, 0.03102588653564453, 0.036450862884521484, 0.04187583923339844, 0.04730081558227539, 0.052725791931152344, 0.0581507682800293, 0.06357574462890625, 0.0690007209777832, 0.07442569732666016, 0.07985067367553711, 0.08527565002441406, 0.09070062637329102, 0.09612560272216797, 0.10155057907104492, 0.10697555541992188, 0.11240053176879883, 0.11782550811767578, 0.12325048446655273, 0.1286754608154297, 0.13410043716430664, 0.1395254135131836, 0.14495038986206055, 0.1503753662109375, 0.15580034255981445, 0.1612253189086914, 0.16665029525756836, 0.1720752716064453, 0.17750024795532227, 0.18292522430419922, 0.18835020065307617, 0.19377517700195312, 0.19920015335083008, 0.20462512969970703, 0.21005010604858398, 0.21547508239746094, 0.2209000587463379, 0.22632503509521484, 0.2317500114440918, 0.23717498779296875, 0.2425999641418457, 0.24802494049072266, 0.2534499168395996, 0.25887489318847656, 0.2642998695373535, 0.26972484588623047, 0.2751498222351074, 0.2805747985839844, 0.28599977493286133, 0.2914247512817383, 0.29684972763061523, 0.3022747039794922, 0.30769968032836914, 0.3131246566772461, 0.31854963302612305, 0.323974609375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 8.0, 13.0, 16.0, 23.0, 33.0, 58.0, 89.0, 176.0, 352.0, 813.0, 2949.0, 19311.0, 4098754.0, 66214.0, 3737.0, 1010.0, 335.0, 170.0, 92.0, 62.0, 35.0, 25.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.357421875, -2.2980499267578125, -2.238677978515625, -2.1793060302734375, -2.11993408203125, -2.0605621337890625, -2.001190185546875, -1.9418182373046875, -1.8824462890625, -1.8230743408203125, -1.763702392578125, -1.7043304443359375, -1.64495849609375, -1.5855865478515625, -1.526214599609375, -1.4668426513671875, -1.407470703125, -1.3480987548828125, -1.288726806640625, -1.2293548583984375, -1.16998291015625, -1.1106109619140625, -1.051239013671875, -0.9918670654296875, -0.9324951171875, -0.8731231689453125, -0.813751220703125, -0.7543792724609375, -0.69500732421875, -0.6356353759765625, -0.576263427734375, -0.5168914794921875, -0.45751953125, -0.3981475830078125, -0.338775634765625, -0.2794036865234375, -0.22003173828125, -0.1606597900390625, -0.101287841796875, -0.0419158935546875, 0.0174560546875, 0.0768280029296875, 0.136199951171875, 0.1955718994140625, 0.25494384765625, 0.3143157958984375, 0.373687744140625, 0.4330596923828125, 0.492431640625, 0.5518035888671875, 0.611175537109375, 0.6705474853515625, 0.72991943359375, 0.7892913818359375, 0.848663330078125, 0.9080352783203125, 0.9674072265625, 1.0267791748046875, 1.086151123046875, 1.1455230712890625, 1.20489501953125, 1.2642669677734375, 1.323638916015625, 1.3830108642578125, 1.4423828125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 3.0, 3.0, 3.0, 1.0, 15.0, 8.0, 16.0, 31.0, 39.0, 81.0, 158.0, 2431.0, 1116.0, 110.0, 40.0, 15.0, 7.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3994140625, -0.39052581787109375, -0.3816375732421875, -0.37274932861328125, -0.363861083984375, -0.35497283935546875, -0.3460845947265625, -0.33719635009765625, -0.32830810546875, -0.31941986083984375, -0.3105316162109375, -0.30164337158203125, -0.292755126953125, -0.28386688232421875, -0.2749786376953125, -0.26609039306640625, -0.2572021484375, -0.24831390380859375, -0.2394256591796875, -0.23053741455078125, -0.221649169921875, -0.21276092529296875, -0.2038726806640625, -0.19498443603515625, -0.18609619140625, -0.17720794677734375, -0.1683197021484375, -0.15943145751953125, -0.150543212890625, -0.14165496826171875, -0.1327667236328125, -0.12387847900390625, -0.114990234375, -0.10610198974609375, -0.0972137451171875, -0.08832550048828125, -0.079437255859375, -0.07054901123046875, -0.0616607666015625, -0.05277252197265625, -0.04388427734375, -0.03499603271484375, -0.0261077880859375, -0.01721954345703125, -0.008331298828125, 0.00055694580078125, 0.0094451904296875, 0.01833343505859375, 0.0272216796875, 0.03610992431640625, 0.0449981689453125, 0.05388641357421875, 0.062774658203125, 0.07166290283203125, 0.0805511474609375, 0.08943939208984375, 0.09832763671875, 0.10721588134765625, 0.1161041259765625, 0.12499237060546875, 0.133880615234375, 0.14276885986328125, 0.1516571044921875, 0.16054534912109375, 0.16943359375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 9.0, 22.0, 33.0, 79.0, 217.0, 431.0, 146.0, 42.0, 10.0, 8.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.462117910385132, -2.3997251987457275, -2.3373324871063232, -2.27493953704834, -2.2125468254089355, -2.1501541137695312, -2.087761402130127, -2.0253686904907227, -1.9629758596420288, -1.9005831480026245, -1.8381903171539307, -1.7757976055145264, -1.713404893875122, -1.6510120630264282, -1.588619351387024, -1.52622652053833, -1.4638338088989258, -1.4014410972595215, -1.3390482664108276, -1.2766555547714233, -1.214262843132019, -1.1518700122833252, -1.089477300643921, -1.0270845890045166, -0.9646918773651123, -0.9022991061210632, -0.8399063944816589, -0.7775136232376099, -0.7151208519935608, -0.6527280807495117, -0.5903353691101074, -0.5279425978660583, -0.4655498266220093, -0.4031570851802826, -0.3407643139362335, -0.27837157249450684, -0.21597881615161896, -0.15358605980873108, -0.0911933183670044, -0.028800547122955322, 0.03359219431877136, 0.09598495066165924, 0.15837770700454712, 0.2207704484462738, 0.2831631898880005, 0.34555596113204956, 0.40794870257377625, 0.4703414738178253, 0.532734215259552, 0.5951269865036011, 0.6575196981430054, 0.7199124693870544, 0.7823052406311035, 0.8446979522705078, 0.9070907235145569, 0.969483494758606, 1.0318762063980103, 1.0942689180374146, 1.1566617488861084, 1.2190544605255127, 1.281447172164917, 1.3438400030136108, 1.4062327146530151, 1.468625545501709, 1.5310182571411133]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 8.0, 16.0, 12.0, 23.0, 20.0, 36.0, 53.0, 70.0, 84.0, 98.0, 88.0, 88.0, 69.0, 84.0, 75.0, 48.0, 43.0, 27.0, 19.0, 13.0, 12.0, 9.0, 1.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2092745304107666, -1.174912691116333, -1.1405508518218994, -1.1061891317367554, -1.0718272924423218, -1.0374654531478882, -1.0031036138534546, -0.968741774559021, -0.9343799948692322, -0.9000181555747986, -0.8656563758850098, -0.8312945365905762, -0.7969326972961426, -0.7625709176063538, -0.7282090783119202, -0.6938472986221313, -0.6594854593276978, -0.6251236200332642, -0.5907618403434753, -0.5564000010490417, -0.5220382213592529, -0.48767638206481934, -0.45331454277038574, -0.41895273327827454, -0.38459092378616333, -0.3502291142940521, -0.3158673048019409, -0.2815054655075073, -0.24714365601539612, -0.2127818465232849, -0.1784200221300125, -0.1440581977367401, -0.10969632863998413, -0.07533451169729233, -0.040972694754600525, -0.006610877811908722, 0.02775093913078308, 0.06211274862289429, 0.09647457301616669, 0.1308363974094391, 0.1651982069015503, 0.1995600163936615, 0.2339218407869339, 0.2682836651802063, 0.3026454746723175, 0.3370072841644287, 0.3713691234588623, 0.4057309329509735, 0.4400927424430847, 0.4744545519351959, 0.5088163614273071, 0.5431782007217407, 0.5775400400161743, 0.6119018197059631, 0.6462636590003967, 0.6806254386901855, 0.7149872779846191, 0.7493491172790527, 0.7837108969688416, 0.8180727362632751, 0.852434515953064, 0.8867963552474976, 0.9211581945419312, 0.9555200338363647, 0.9898818135261536]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 2.0, 3.0, 5.0, 2.0, 4.0, 6.0, 4.0, 8.0, 17.0, 12.0, 19.0, 18.0, 25.0, 35.0, 29.0, 48.0, 61.0, 129.0, 572.0, 9393.0, 933074.0, 102208.0, 2281.0, 255.0, 73.0, 53.0, 41.0, 28.0, 19.0, 25.0, 16.0, 18.0, 21.0, 11.0, 9.0, 7.0, 7.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6865234375, -1.6365814208984375, -1.586639404296875, -1.5366973876953125, -1.48675537109375, -1.4368133544921875, -1.386871337890625, -1.3369293212890625, -1.2869873046875, -1.2370452880859375, -1.187103271484375, -1.1371612548828125, -1.08721923828125, -1.0372772216796875, -0.987335205078125, -0.9373931884765625, -0.887451171875, -0.8375091552734375, -0.787567138671875, -0.7376251220703125, -0.68768310546875, -0.6377410888671875, -0.587799072265625, -0.5378570556640625, -0.4879150390625, -0.4379730224609375, -0.388031005859375, -0.3380889892578125, -0.28814697265625, -0.2382049560546875, -0.188262939453125, -0.1383209228515625, -0.08837890625, -0.0384368896484375, 0.011505126953125, 0.0614471435546875, 0.11138916015625, 0.1613311767578125, 0.211273193359375, 0.2612152099609375, 0.3111572265625, 0.3610992431640625, 0.411041259765625, 0.4609832763671875, 0.51092529296875, 0.5608673095703125, 0.610809326171875, 0.6607513427734375, 0.710693359375, 0.7606353759765625, 0.810577392578125, 0.8605194091796875, 0.91046142578125, 0.9604034423828125, 1.010345458984375, 1.0602874755859375, 1.1102294921875, 1.1601715087890625, 1.210113525390625, 1.2600555419921875, 1.30999755859375, 1.3599395751953125, 1.409881591796875, 1.4598236083984375, 1.509765625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 4.0, 24.0, 69.0, 137.0, 283.0, 252.0, 156.0, 62.0, 22.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.047149658203125, -0.04127836227416992, -0.035407066345214844, -0.029535770416259766, -0.023664474487304688, -0.01779317855834961, -0.011921882629394531, -0.006050586700439453, -0.000179290771484375, 0.005692005157470703, 0.011563301086425781, 0.01743459701538086, 0.023305892944335938, 0.029177188873291016, 0.035048484802246094, 0.04091978073120117, 0.04679107666015625, 0.05266237258911133, 0.058533668518066406, 0.06440496444702148, 0.07027626037597656, 0.07614755630493164, 0.08201885223388672, 0.0878901481628418, 0.09376144409179688, 0.09963274002075195, 0.10550403594970703, 0.11137533187866211, 0.11724662780761719, 0.12311792373657227, 0.12898921966552734, 0.13486051559448242, 0.1407318115234375, 0.14660310745239258, 0.15247440338134766, 0.15834569931030273, 0.1642169952392578, 0.1700882911682129, 0.17595958709716797, 0.18183088302612305, 0.18770217895507812, 0.1935734748840332, 0.19944477081298828, 0.20531606674194336, 0.21118736267089844, 0.21705865859985352, 0.2229299545288086, 0.22880125045776367, 0.23467254638671875, 0.24054384231567383, 0.2464151382446289, 0.252286434173584, 0.25815773010253906, 0.26402902603149414, 0.2699003219604492, 0.2757716178894043, 0.2816429138183594, 0.28751420974731445, 0.29338550567626953, 0.2992568016052246, 0.3051280975341797, 0.31099939346313477, 0.31687068939208984, 0.3227419853210449, 0.32861328125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 5.0, 5.0, 4.0, 5.0, 5.0, 7.0, 14.0, 19.0, 26.0, 23.0, 43.0, 54.0, 74.0, 89.0, 149.0, 205.0, 351.0, 639.0, 1297.0, 3724.0, 13764.0, 81292.0, 645779.0, 258087.0, 31476.0, 6928.0, 2154.0, 942.0, 478.0, 298.0, 158.0, 128.0, 80.0, 73.0, 55.0, 38.0, 28.0, 16.0, 16.0, 8.0, 8.0, 5.0, 6.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28369140625, -0.2730865478515625, -0.262481689453125, -0.2518768310546875, -0.24127197265625, -0.2306671142578125, -0.220062255859375, -0.2094573974609375, -0.1988525390625, -0.1882476806640625, -0.177642822265625, -0.1670379638671875, -0.15643310546875, -0.1458282470703125, -0.135223388671875, -0.1246185302734375, -0.114013671875, -0.1034088134765625, -0.092803955078125, -0.0821990966796875, -0.07159423828125, -0.0609893798828125, -0.050384521484375, -0.0397796630859375, -0.0291748046875, -0.0185699462890625, -0.007965087890625, 0.0026397705078125, 0.01324462890625, 0.0238494873046875, 0.034454345703125, 0.0450592041015625, 0.0556640625, 0.0662689208984375, 0.076873779296875, 0.0874786376953125, 0.09808349609375, 0.1086883544921875, 0.119293212890625, 0.1298980712890625, 0.1405029296875, 0.1511077880859375, 0.161712646484375, 0.1723175048828125, 0.18292236328125, 0.1935272216796875, 0.204132080078125, 0.2147369384765625, 0.225341796875, 0.2359466552734375, 0.246551513671875, 0.2571563720703125, 0.26776123046875, 0.2783660888671875, 0.288970947265625, 0.2995758056640625, 0.3101806640625, 0.3207855224609375, 0.331390380859375, 0.3419952392578125, 0.35260009765625, 0.3632049560546875, 0.373809814453125, 0.3844146728515625, 0.39501953125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 4.0, 8.0, 6.0, 4.0, 8.0, 8.0, 17.0, 15.0, 13.0, 16.0, 19.0, 31.0, 44.0, 42.0, 35.0, 50.0, 47.0, 48.0, 59.0, 42.0, 57.0, 50.0, 57.0, 39.0, 50.0, 37.0, 37.0, 30.0, 19.0, 22.0, 17.0, 19.0, 11.0, 14.0, 7.0, 10.0, 2.0, 5.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.15087890625, -0.14498138427734375, -0.1390838623046875, -0.13318634033203125, -0.127288818359375, -0.12139129638671875, -0.1154937744140625, -0.10959625244140625, -0.10369873046875, -0.09780120849609375, -0.0919036865234375, -0.08600616455078125, -0.080108642578125, -0.07421112060546875, -0.0683135986328125, -0.06241607666015625, -0.0565185546875, -0.05062103271484375, -0.0447235107421875, -0.03882598876953125, -0.032928466796875, -0.02703094482421875, -0.0211334228515625, -0.01523590087890625, -0.00933837890625, -0.00344085693359375, 0.0024566650390625, 0.00835418701171875, 0.014251708984375, 0.02014923095703125, 0.0260467529296875, 0.03194427490234375, 0.037841796875, 0.04373931884765625, 0.0496368408203125, 0.05553436279296875, 0.061431884765625, 0.06732940673828125, 0.0732269287109375, 0.07912445068359375, 0.08502197265625, 0.09091949462890625, 0.0968170166015625, 0.10271453857421875, 0.108612060546875, 0.11450958251953125, 0.1204071044921875, 0.12630462646484375, 0.1322021484375, 0.13809967041015625, 0.1439971923828125, 0.14989471435546875, 0.155792236328125, 0.16168975830078125, 0.1675872802734375, 0.17348480224609375, 0.17938232421875, 0.18527984619140625, 0.1911773681640625, 0.19707489013671875, 0.202972412109375, 0.20886993408203125, 0.2147674560546875, 0.22066497802734375, 0.2265625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 6.0, 4.0, 16.0, 18.0, 46.0, 67.0, 152.0, 316.0, 976.0, 5618.0, 342589.0, 689270.0, 7577.0, 1149.0, 427.0, 170.0, 71.0, 30.0, 19.0, 16.0, 8.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.472412109375, -0.4542884826660156, -0.43616485595703125, -0.4180412292480469, -0.3999176025390625, -0.3817939758300781, -0.36367034912109375, -0.3455467224121094, -0.327423095703125, -0.3092994689941406, -0.29117584228515625, -0.2730522155761719, -0.2549285888671875, -0.23680496215820312, -0.21868133544921875, -0.20055770874023438, -0.18243408203125, -0.16431045532226562, -0.14618682861328125, -0.12806320190429688, -0.1099395751953125, -0.09181594848632812, -0.07369232177734375, -0.055568695068359375, -0.037445068359375, -0.019321441650390625, -0.00119781494140625, 0.016925811767578125, 0.0350494384765625, 0.053173065185546875, 0.07129669189453125, 0.08942031860351562, 0.1075439453125, 0.12566757202148438, 0.14379119873046875, 0.16191482543945312, 0.1800384521484375, 0.19816207885742188, 0.21628570556640625, 0.23440933227539062, 0.252532958984375, 0.2706565856933594, 0.28878021240234375, 0.3069038391113281, 0.3250274658203125, 0.3431510925292969, 0.36127471923828125, 0.3793983459472656, 0.39752197265625, 0.4156455993652344, 0.43376922607421875, 0.4518928527832031, 0.4700164794921875, 0.4881401062011719, 0.5062637329101562, 0.5243873596191406, 0.542510986328125, 0.5606346130371094, 0.5787582397460938, 0.5968818664550781, 0.6150054931640625, 0.6331291198730469, 0.6512527465820312, 0.6693763732910156, 0.6875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 5.0, 9.0, 4.0, 5.0, 10.0, 34.0, 52.0, 118.0, 219.0, 256.0, 148.0, 84.0, 42.0, 12.0, 8.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.0007457733154296875, -0.0007314775139093399, -0.0007171817123889923, -0.0007028859108686447, -0.0006885901093482971, -0.0006742943078279495, -0.0006599985063076019, -0.0006457027047872543, -0.0006314069032669067, -0.0006171111017465591, -0.0006028153002262115, -0.000588519498705864, -0.0005742236971855164, -0.0005599278956651688, -0.0005456320941448212, -0.0005313362926244736, -0.000517040491104126, -0.0005027446895837784, -0.0004884488880634308, -0.0004741530865430832, -0.0004598572850227356, -0.000445561483502388, -0.0004312656819820404, -0.0004169698804616928, -0.0004026740789413452, -0.0003883782774209976, -0.00037408247590065, -0.00035978667438030243, -0.00034549087285995483, -0.00033119507133960724, -0.00031689926981925964, -0.00030260346829891205, -0.00028830766677856445, -0.00027401186525821686, -0.00025971606373786926, -0.00024542026221752167, -0.00023112446069717407, -0.00021682865917682648, -0.00020253285765647888, -0.0001882370561361313, -0.0001739412546157837, -0.0001596454530954361, -0.0001453496515750885, -0.0001310538500547409, -0.00011675804853439331, -0.00010246224701404572, -8.816644549369812e-05, -7.387064397335052e-05, -5.957484245300293e-05, -4.5279040932655334e-05, -3.098323941230774e-05, -1.6687437891960144e-05, -2.391636371612549e-06, 1.1904165148735046e-05, 2.619996666908264e-05, 4.049576818943024e-05, 5.479156970977783e-05, 6.908737123012543e-05, 8.338317275047302e-05, 9.767897427082062e-05, 0.00011197477579116821, 0.0001262705773115158, 0.0001405663788318634, 0.000154862180352211, 0.0001691579818725586]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 8.0, 5.0, 7.0, 17.0, 12.0, 38.0, 47.0, 90.0, 168.0, 312.0, 764.0, 2403.0, 11244.0, 148976.0, 829740.0, 46140.0, 5955.0, 1493.0, 584.0, 240.0, 117.0, 65.0, 50.0, 30.0, 12.0, 16.0, 13.0, 6.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.260498046875, -0.249786376953125, -0.23907470703125, -0.228363037109375, -0.2176513671875, -0.206939697265625, -0.19622802734375, -0.185516357421875, -0.1748046875, -0.164093017578125, -0.15338134765625, -0.142669677734375, -0.1319580078125, -0.121246337890625, -0.11053466796875, -0.099822998046875, -0.089111328125, -0.078399658203125, -0.06768798828125, -0.056976318359375, -0.0462646484375, -0.035552978515625, -0.02484130859375, -0.014129638671875, -0.00341796875, 0.007293701171875, 0.01800537109375, 0.028717041015625, 0.0394287109375, 0.050140380859375, 0.06085205078125, 0.071563720703125, 0.082275390625, 0.092987060546875, 0.10369873046875, 0.114410400390625, 0.1251220703125, 0.135833740234375, 0.14654541015625, 0.157257080078125, 0.16796875, 0.178680419921875, 0.18939208984375, 0.200103759765625, 0.2108154296875, 0.221527099609375, 0.23223876953125, 0.242950439453125, 0.253662109375, 0.264373779296875, 0.27508544921875, 0.285797119140625, 0.2965087890625, 0.307220458984375, 0.31793212890625, 0.328643798828125, 0.33935546875, 0.350067138671875, 0.36077880859375, 0.371490478515625, 0.3822021484375, 0.392913818359375, 0.40362548828125, 0.414337158203125, 0.425048828125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 7.0, 5.0, 5.0, 7.0, 11.0, 9.0, 27.0, 61.0, 107.0, 142.0, 178.0, 171.0, 115.0, 62.0, 38.0, 20.0, 15.0, 6.0, 7.0, 2.0, 3.0, 7.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1136474609375, -0.10819244384765625, -0.1027374267578125, -0.09728240966796875, -0.091827392578125, -0.08637237548828125, -0.0809173583984375, -0.07546234130859375, -0.07000732421875, -0.06455230712890625, -0.0590972900390625, -0.05364227294921875, -0.048187255859375, -0.04273223876953125, -0.0372772216796875, -0.03182220458984375, -0.0263671875, -0.02091217041015625, -0.0154571533203125, -0.01000213623046875, -0.004547119140625, 0.00090789794921875, 0.0063629150390625, 0.01181793212890625, 0.01727294921875, 0.02272796630859375, 0.0281829833984375, 0.03363800048828125, 0.039093017578125, 0.04454803466796875, 0.0500030517578125, 0.05545806884765625, 0.0609130859375, 0.06636810302734375, 0.0718231201171875, 0.07727813720703125, 0.082733154296875, 0.08818817138671875, 0.0936431884765625, 0.09909820556640625, 0.10455322265625, 0.11000823974609375, 0.1154632568359375, 0.12091827392578125, 0.126373291015625, 0.13182830810546875, 0.1372833251953125, 0.14273834228515625, 0.148193359375, 0.15364837646484375, 0.1591033935546875, 0.16455841064453125, 0.170013427734375, 0.17546844482421875, 0.1809234619140625, 0.18637847900390625, 0.19183349609375, 0.19728851318359375, 0.2027435302734375, 0.20819854736328125, 0.213653564453125, 0.21910858154296875, 0.2245635986328125, 0.23001861572265625, 0.2354736328125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 9.0, 20.0, 136.0, 645.0, 179.0, 22.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.646785736083984, -9.466341018676758, -9.285895347595215, -9.105450630187988, -8.925005912780762, -8.744560241699219, -8.564115524291992, -8.383670806884766, -8.203225135803223, -8.022780418395996, -7.842335224151611, -7.661890029907227, -7.481444835662842, -7.300999641418457, -7.1205549240112305, -6.940109729766846, -6.759665012359619, -6.579219818115234, -6.398775100708008, -6.218329906463623, -6.037884712219238, -5.857439994812012, -5.676994800567627, -5.496549606323242, -5.316104888916016, -5.135659694671631, -4.955214977264404, -4.7747697830200195, -4.594324588775635, -4.41387939453125, -4.233434677124023, -4.052989482879639, -3.872544765472412, -3.6920998096466064, -3.5116546154022217, -3.331209659576416, -3.1507644653320312, -2.9703195095062256, -2.78987455368042, -2.609429359436035, -2.4289841651916504, -2.2485392093658447, -2.06809401512146, -1.8876490592956543, -1.707203984260559, -1.5267589092254639, -1.3463139533996582, -1.165868878364563, -0.9854239225387573, -0.8049788475036621, -0.6245338320732117, -0.44408881664276123, -0.263643741607666, -0.0831986665725708, 0.09724628925323486, 0.2776913642883301, 0.4581364393234253, 0.6385815143585205, 0.819026529788971, 0.9994715452194214, 1.1799166202545166, 1.3603616952896118, 1.5408066511154175, 1.7212517261505127, 1.901696801185608]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 6.0, 10.0, 13.0, 11.0, 10.0, 19.0, 24.0, 16.0, 24.0, 29.0, 38.0, 41.0, 44.0, 57.0, 48.0, 57.0, 67.0, 64.0, 54.0, 49.0, 48.0, 41.0, 46.0, 18.0, 37.0, 37.0, 18.0, 13.0, 19.0, 8.0, 12.0, 13.0, 6.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5172576904296875, -1.4781373739242554, -1.4390170574188232, -1.3998967409133911, -1.360776424407959, -1.3216559886932373, -1.2825356721878052, -1.243415355682373, -1.204295039176941, -1.1651747226715088, -1.1260544061660767, -1.0869340896606445, -1.0478136539459229, -1.0086933374404907, -0.9695730209350586, -0.9304527044296265, -0.8913323879241943, -0.8522120714187622, -0.8130917549133301, -0.7739713788032532, -0.734851062297821, -0.6957307457923889, -0.656610369682312, -0.6174900531768799, -0.5783697366714478, -0.5392494201660156, -0.5001291036605835, -0.4610087275505066, -0.42188841104507446, -0.38276809453964233, -0.3436477482318878, -0.3045274019241333, -0.26540714502334595, -0.22628681361675262, -0.1871664822101593, -0.14804615080356598, -0.10892581939697266, -0.06980548799037933, -0.03068515658378601, 0.008435189723968506, 0.047555506229400635, 0.08667583763599396, 0.12579616904258728, 0.1649165004491806, 0.20403683185577393, 0.24315716326236725, 0.28227749466896057, 0.3213978409767151, 0.3605181574821472, 0.39963847398757935, 0.43875882029533386, 0.4778791666030884, 0.5169994831085205, 0.5561197996139526, 0.5952401161193848, 0.6343604922294617, 0.6734808087348938, 0.7126011252403259, 0.7517215013504028, 0.790841817855835, 0.8299621343612671, 0.8690824508666992, 0.9082027673721313, 0.9473231434822083, 0.9864434599876404]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 4.0, 13.0, 30.0, 127.0, 590.0, 4489.0, 80867.0, 4069151.0, 34900.0, 2656.0, 531.0, 213.0, 131.0, 105.0, 87.0, 52.0, 56.0, 41.0, 33.0, 32.0, 25.0, 23.0, 21.0, 17.0, 15.0, 9.0, 12.0, 12.0, 8.0, 6.0, 4.0, 2.0, 2.0, 6.0, 7.0, 2.0, 0.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.469970703125, -0.4247856140136719, -0.37960052490234375, -0.3344154357910156, -0.2892303466796875, -0.24404525756835938, -0.19886016845703125, -0.15367507934570312, -0.108489990234375, -0.06330490112304688, -0.01811981201171875, 0.027065277099609375, 0.0722503662109375, 0.11743545532226562, 0.16262054443359375, 0.20780563354492188, 0.25299072265625, 0.2981758117675781, 0.34336090087890625, 0.3885459899902344, 0.4337310791015625, 0.4789161682128906, 0.5241012573242188, 0.5692863464355469, 0.614471435546875, 0.6596565246582031, 0.7048416137695312, 0.7500267028808594, 0.7952117919921875, 0.8403968811035156, 0.8855819702148438, 0.9307670593261719, 0.9759521484375, 1.0211372375488281, 1.0663223266601562, 1.1115074157714844, 1.1566925048828125, 1.2018775939941406, 1.2470626831054688, 1.2922477722167969, 1.337432861328125, 1.3826179504394531, 1.4278030395507812, 1.4729881286621094, 1.5181732177734375, 1.5633583068847656, 1.6085433959960938, 1.6537284851074219, 1.69891357421875, 1.7440986633300781, 1.7892837524414062, 1.8344688415527344, 1.8796539306640625, 1.9248390197753906, 1.9700241088867188, 2.015209197998047, 2.060394287109375, 2.105579376220703, 2.1507644653320312, 2.1959495544433594, 2.2411346435546875, 2.2863197326660156, 2.3315048217773438, 2.376689910888672, 2.421875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 12.0, 28.0, 75.0, 149.0, 219.0, 222.0, 178.0, 79.0, 36.0, 16.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039459228515625, -0.03395223617553711, -0.02844524383544922, -0.022938251495361328, -0.017431259155273438, -0.011924266815185547, -0.006417274475097656, -0.0009102821350097656, 0.004596710205078125, 0.010103702545166016, 0.015610694885253906, 0.021117687225341797, 0.026624679565429688, 0.03213167190551758, 0.03763866424560547, 0.04314565658569336, 0.04865264892578125, 0.05415964126586914, 0.05966663360595703, 0.06517362594604492, 0.07068061828613281, 0.0761876106262207, 0.0816946029663086, 0.08720159530639648, 0.09270858764648438, 0.09821557998657227, 0.10372257232666016, 0.10922956466674805, 0.11473655700683594, 0.12024354934692383, 0.12575054168701172, 0.1312575340270996, 0.1367645263671875, 0.1422715187072754, 0.14777851104736328, 0.15328550338745117, 0.15879249572753906, 0.16429948806762695, 0.16980648040771484, 0.17531347274780273, 0.18082046508789062, 0.18632745742797852, 0.1918344497680664, 0.1973414421081543, 0.2028484344482422, 0.20835542678833008, 0.21386241912841797, 0.21936941146850586, 0.22487640380859375, 0.23038339614868164, 0.23589038848876953, 0.24139738082885742, 0.2469043731689453, 0.2524113655090332, 0.2579183578491211, 0.263425350189209, 0.2689323425292969, 0.27443933486938477, 0.27994632720947266, 0.28545331954956055, 0.29096031188964844, 0.29646730422973633, 0.3019742965698242, 0.3074812889099121, 0.31298828125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 8.0, 9.0, 21.0, 43.0, 60.0, 92.0, 334.0, 1901.0, 4156803.0, 32916.0, 1447.0, 320.0, 128.0, 73.0, 58.0, 25.0, 17.0, 15.0, 6.0, 8.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2578125, -2.131103515625, -2.00439453125, -1.877685546875, -1.7509765625, -1.624267578125, -1.49755859375, -1.370849609375, -1.244140625, -1.117431640625, -0.99072265625, -0.864013671875, -0.7373046875, -0.610595703125, -0.48388671875, -0.357177734375, -0.23046875, -0.103759765625, 0.02294921875, 0.149658203125, 0.2763671875, 0.403076171875, 0.52978515625, 0.656494140625, 0.783203125, 0.909912109375, 1.03662109375, 1.163330078125, 1.2900390625, 1.416748046875, 1.54345703125, 1.670166015625, 1.796875, 1.923583984375, 2.05029296875, 2.177001953125, 2.3037109375, 2.430419921875, 2.55712890625, 2.683837890625, 2.810546875, 2.937255859375, 3.06396484375, 3.190673828125, 3.3173828125, 3.444091796875, 3.57080078125, 3.697509765625, 3.82421875, 3.950927734375, 4.07763671875, 4.204345703125, 4.3310546875, 4.457763671875, 4.58447265625, 4.711181640625, 4.837890625, 4.964599609375, 5.09130859375, 5.218017578125, 5.3447265625, 5.471435546875, 5.59814453125, 5.724853515625, 5.8515625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [5.0, 5.0, 12.0, 27.0, 77.0, 908.0, 2894.0, 106.0, 26.0, 14.0, 2.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.086669921875, -0.07242202758789062, -0.05817413330078125, -0.043926239013671875, -0.0296783447265625, -0.015430450439453125, -0.00118255615234375, 0.013065338134765625, 0.027313232421875, 0.041561126708984375, 0.05580902099609375, 0.07005691528320312, 0.0843048095703125, 0.09855270385742188, 0.11280059814453125, 0.12704849243164062, 0.14129638671875, 0.15554428100585938, 0.16979217529296875, 0.18404006958007812, 0.1982879638671875, 0.21253585815429688, 0.22678375244140625, 0.24103164672851562, 0.255279541015625, 0.2695274353027344, 0.28377532958984375, 0.2980232238769531, 0.3122711181640625, 0.3265190124511719, 0.34076690673828125, 0.3550148010253906, 0.3692626953125, 0.3835105895996094, 0.39775848388671875, 0.4120063781738281, 0.4262542724609375, 0.4405021667480469, 0.45475006103515625, 0.4689979553222656, 0.483245849609375, 0.4974937438964844, 0.5117416381835938, 0.5259895324707031, 0.5402374267578125, 0.5544853210449219, 0.5687332153320312, 0.5829811096191406, 0.59722900390625, 0.6114768981933594, 0.6257247924804688, 0.6399726867675781, 0.6542205810546875, 0.6684684753417969, 0.6827163696289062, 0.6969642639160156, 0.711212158203125, 0.7254600524902344, 0.7397079467773438, 0.7539558410644531, 0.7682037353515625, 0.7824516296386719, 0.7966995239257812, 0.8109474182128906, 0.8251953125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 7.0, 19.0, 57.0, 356.0, 445.0, 80.0, 21.0, 8.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3457646369934082, -1.2343119382858276, -1.122859239578247, -1.011406421661377, -0.8999537229537964, -0.7885010242462158, -0.6770482659339905, -0.5655955076217651, -0.45414280891418457, -0.3426900804042816, -0.23123735189437866, -0.11978462338447571, -0.008331894874572754, 0.10312080383300781, 0.21457356214523315, 0.3260263204574585, 0.43747901916503906, 0.5489317178726196, 0.660384476184845, 0.7718372344970703, 0.8832899332046509, 0.9947426319122314, 1.1061954498291016, 1.2176481485366821, 1.3291008472442627, 1.4405535459518433, 1.5520062446594238, 1.663459062576294, 1.7749117612838745, 1.886364459991455, 1.9978172779083252, 2.1092700958251953, 2.2207226753234863, 2.3321754932403564, 2.4436280727386475, 2.5550808906555176, 2.6665334701538086, 2.7779862880706787, 2.889439105987549, 3.00089168548584, 3.11234450340271, 3.22379732131958, 3.335249900817871, 3.446702718734741, 3.5581555366516113, 3.6696081161499023, 3.7810609340667725, 3.8925137519836426, 4.003966331481934, 4.115418910980225, 4.226871967315674, 4.338324546813965, 4.449777126312256, 4.561229705810547, 4.672682762145996, 4.784135341644287, 4.895587921142578, 5.007040500640869, 5.118493556976318, 5.229946136474609, 5.3413987159729, 5.452851295471191, 5.564304351806641, 5.675756931304932, 5.787209987640381]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 7.0, 9.0, 12.0, 30.0, 29.0, 62.0, 84.0, 117.0, 109.0, 134.0, 124.0, 104.0, 77.0, 49.0, 27.0, 11.0, 11.0, 6.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.885972499847412, -1.822251796722412, -1.758531093597412, -1.6948102712631226, -1.6310895681381226, -1.5673688650131226, -1.503648042678833, -1.439927339553833, -1.376206636428833, -1.312485933303833, -1.248765230178833, -1.1850444078445435, -1.1213237047195435, -1.0576030015945435, -0.9938822388648987, -0.9301614761352539, -0.8664407730102539, -0.8027200698852539, -0.7389993071556091, -0.6752785444259644, -0.6115578413009644, -0.5478371381759644, -0.4841163754463196, -0.4203956425189972, -0.3566749095916748, -0.2929541766643524, -0.22923344373703003, -0.16551271080970764, -0.10179197788238525, -0.038071244955062866, 0.02564948797225952, 0.08937022089958191, 0.1530909538269043, 0.21681168675422668, 0.2805324196815491, 0.34425315260887146, 0.40797388553619385, 0.47169461846351624, 0.5354153513908386, 0.5991361141204834, 0.6628568172454834, 0.7265775203704834, 0.7902982831001282, 0.854019045829773, 0.917739748954773, 0.981460452079773, 1.0451812744140625, 1.1089019775390625, 1.1726226806640625, 1.2363433837890625, 1.3000640869140625, 1.363784909248352, 1.427505612373352, 1.491226315498352, 1.5549471378326416, 1.6186678409576416, 1.6823885440826416, 1.7461092472076416, 1.8098299503326416, 1.8735507726669312, 1.9372714757919312, 2.0009922981262207, 2.0647130012512207, 2.1284337043762207, 2.1921544075012207]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 3.0, 6.0, 11.0, 9.0, 10.0, 19.0, 26.0, 40.0, 53.0, 109.0, 228.0, 632.0, 2974.0, 40951.0, 954392.0, 44687.0, 3194.0, 636.0, 249.0, 103.0, 73.0, 41.0, 36.0, 19.0, 16.0, 10.0, 7.0, 8.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.08203125, -1.0378875732421875, -0.993743896484375, -0.9496002197265625, -0.90545654296875, -0.8613128662109375, -0.817169189453125, -0.7730255126953125, -0.7288818359375, -0.6847381591796875, -0.640594482421875, -0.5964508056640625, -0.55230712890625, -0.5081634521484375, -0.464019775390625, -0.4198760986328125, -0.375732421875, -0.3315887451171875, -0.287445068359375, -0.2433013916015625, -0.19915771484375, -0.1550140380859375, -0.110870361328125, -0.0667266845703125, -0.0225830078125, 0.0215606689453125, 0.065704345703125, 0.1098480224609375, 0.15399169921875, 0.1981353759765625, 0.242279052734375, 0.2864227294921875, 0.33056640625, 0.3747100830078125, 0.418853759765625, 0.4629974365234375, 0.50714111328125, 0.5512847900390625, 0.595428466796875, 0.6395721435546875, 0.6837158203125, 0.7278594970703125, 0.772003173828125, 0.8161468505859375, 0.86029052734375, 0.9044342041015625, 0.948577880859375, 0.9927215576171875, 1.036865234375, 1.0810089111328125, 1.125152587890625, 1.1692962646484375, 1.21343994140625, 1.2575836181640625, 1.301727294921875, 1.3458709716796875, 1.3900146484375, 1.4341583251953125, 1.478302001953125, 1.5224456787109375, 1.56658935546875, 1.6107330322265625, 1.654876708984375, 1.6990203857421875, 1.7431640625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 18.0, 37.0, 65.0, 123.0, 158.0, 184.0, 175.0, 110.0, 72.0, 41.0, 13.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11322021484375, -0.10639286041259766, -0.09956550598144531, -0.09273815155029297, -0.08591079711914062, -0.07908344268798828, -0.07225608825683594, -0.0654287338256836, -0.05860137939453125, -0.051774024963378906, -0.04494667053222656, -0.03811931610107422, -0.031291961669921875, -0.02446460723876953, -0.017637252807617188, -0.010809898376464844, -0.0039825439453125, 0.0028448104858398438, 0.009672164916992188, 0.01649951934814453, 0.023326873779296875, 0.03015422821044922, 0.03698158264160156, 0.043808937072753906, 0.05063629150390625, 0.057463645935058594, 0.06429100036621094, 0.07111835479736328, 0.07794570922851562, 0.08477306365966797, 0.09160041809082031, 0.09842777252197266, 0.105255126953125, 0.11208248138427734, 0.11890983581542969, 0.12573719024658203, 0.13256454467773438, 0.13939189910888672, 0.14621925354003906, 0.1530466079711914, 0.15987396240234375, 0.1667013168334961, 0.17352867126464844, 0.18035602569580078, 0.18718338012695312, 0.19401073455810547, 0.2008380889892578, 0.20766544342041016, 0.2144927978515625, 0.22132015228271484, 0.2281475067138672, 0.23497486114501953, 0.24180221557617188, 0.24862957000732422, 0.25545692443847656, 0.2622842788696289, 0.26911163330078125, 0.2759389877319336, 0.28276634216308594, 0.2895936965942383, 0.2964210510253906, 0.30324840545654297, 0.3100757598876953, 0.31690311431884766, 0.32373046875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 6.0, 3.0, 5.0, 6.0, 11.0, 14.0, 8.0, 19.0, 20.0, 28.0, 36.0, 56.0, 65.0, 95.0, 170.0, 315.0, 496.0, 968.0, 2170.0, 5623.0, 19488.0, 114126.0, 711974.0, 156845.0, 24687.0, 6451.0, 2372.0, 1061.0, 553.0, 319.0, 174.0, 114.0, 67.0, 68.0, 32.0, 28.0, 16.0, 18.0, 8.0, 12.0, 7.0, 3.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.449951171875, -0.435699462890625, -0.42144775390625, -0.407196044921875, -0.3929443359375, -0.378692626953125, -0.36444091796875, -0.350189208984375, -0.3359375, -0.321685791015625, -0.30743408203125, -0.293182373046875, -0.2789306640625, -0.264678955078125, -0.25042724609375, -0.236175537109375, -0.221923828125, -0.207672119140625, -0.19342041015625, -0.179168701171875, -0.1649169921875, -0.150665283203125, -0.13641357421875, -0.122161865234375, -0.10791015625, -0.093658447265625, -0.07940673828125, -0.065155029296875, -0.0509033203125, -0.036651611328125, -0.02239990234375, -0.008148193359375, 0.006103515625, 0.020355224609375, 0.03460693359375, 0.048858642578125, 0.0631103515625, 0.077362060546875, 0.09161376953125, 0.105865478515625, 0.1201171875, 0.134368896484375, 0.14862060546875, 0.162872314453125, 0.1771240234375, 0.191375732421875, 0.20562744140625, 0.219879150390625, 0.234130859375, 0.248382568359375, 0.26263427734375, 0.276885986328125, 0.2911376953125, 0.305389404296875, 0.31964111328125, 0.333892822265625, 0.34814453125, 0.362396240234375, 0.37664794921875, 0.390899658203125, 0.4051513671875, 0.419403076171875, 0.43365478515625, 0.447906494140625, 0.462158203125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 5.0, 5.0, 17.0, 14.0, 20.0, 20.0, 35.0, 36.0, 40.0, 42.0, 63.0, 64.0, 64.0, 63.0, 70.0, 65.0, 69.0, 51.0, 46.0, 43.0, 38.0, 22.0, 26.0, 21.0, 18.0, 6.0, 8.0, 4.0, 4.0, 6.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.376220703125, -0.36444854736328125, -0.3526763916015625, -0.34090423583984375, -0.329132080078125, -0.31735992431640625, -0.3055877685546875, -0.29381561279296875, -0.28204345703125, -0.27027130126953125, -0.2584991455078125, -0.24672698974609375, -0.234954833984375, -0.22318267822265625, -0.2114105224609375, -0.19963836669921875, -0.1878662109375, -0.17609405517578125, -0.1643218994140625, -0.15254974365234375, -0.140777587890625, -0.12900543212890625, -0.1172332763671875, -0.10546112060546875, -0.09368896484375, -0.08191680908203125, -0.0701446533203125, -0.05837249755859375, -0.046600341796875, -0.03482818603515625, -0.0230560302734375, -0.01128387451171875, 0.00048828125, 0.01226043701171875, 0.0240325927734375, 0.03580474853515625, 0.047576904296875, 0.05934906005859375, 0.0711212158203125, 0.08289337158203125, 0.09466552734375, 0.10643768310546875, 0.1182098388671875, 0.12998199462890625, 0.141754150390625, 0.15352630615234375, 0.1652984619140625, 0.17707061767578125, 0.1888427734375, 0.20061492919921875, 0.2123870849609375, 0.22415924072265625, 0.235931396484375, 0.24770355224609375, 0.2594757080078125, 0.27124786376953125, 0.28302001953125, 0.29479217529296875, 0.3065643310546875, 0.31833648681640625, 0.330108642578125, 0.34188079833984375, 0.3536529541015625, 0.36542510986328125, 0.377197265625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 6.0, 5.0, 5.0, 17.0, 15.0, 16.0, 20.0, 34.0, 63.0, 90.0, 162.0, 234.0, 505.0, 1164.0, 3032.0, 8804.0, 35771.0, 296613.0, 597271.0, 81599.0, 15035.0, 4695.0, 1705.0, 772.0, 367.0, 198.0, 97.0, 66.0, 50.0, 41.0, 14.0, 22.0, 11.0, 10.0, 9.0, 10.0, 9.0, 2.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1551513671875, -0.15033531188964844, -0.14551925659179688, -0.1407032012939453, -0.13588714599609375, -0.1310710906982422, -0.12625503540039062, -0.12143898010253906, -0.1166229248046875, -0.11180686950683594, -0.10699081420898438, -0.10217475891113281, -0.09735870361328125, -0.09254264831542969, -0.08772659301757812, -0.08291053771972656, -0.078094482421875, -0.07327842712402344, -0.06846237182617188, -0.06364631652832031, -0.05883026123046875, -0.05401420593261719, -0.049198150634765625, -0.04438209533691406, -0.0395660400390625, -0.03474998474121094, -0.029933929443359375, -0.025117874145507812, -0.02030181884765625, -0.015485763549804688, -0.010669708251953125, -0.0058536529541015625, -0.00103759765625, 0.0037784576416015625, 0.008594512939453125, 0.013410568237304688, 0.01822662353515625, 0.023042678833007812, 0.027858734130859375, 0.03267478942871094, 0.0374908447265625, 0.04230690002441406, 0.047122955322265625, 0.05193901062011719, 0.05675506591796875, 0.06157112121582031, 0.06638717651367188, 0.07120323181152344, 0.076019287109375, 0.08083534240722656, 0.08565139770507812, 0.09046745300292969, 0.09528350830078125, 0.10009956359863281, 0.10491561889648438, 0.10973167419433594, 0.1145477294921875, 0.11936378479003906, 0.12417984008789062, 0.1289958953857422, 0.13381195068359375, 0.1386280059814453, 0.14344406127929688, 0.14826011657714844, 0.153076171875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 10.0, 18.0, 14.0, 17.0, 26.0, 32.0, 55.0, 32.0, 51.0, 74.0, 82.0, 91.0, 105.0, 64.0, 67.0, 53.0, 43.0, 38.0, 26.0, 26.0, 19.0, 14.0, 13.0, 10.0, 5.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.00016570091247558594, -0.00016160588711500168, -0.00015751086175441742, -0.00015341583639383316, -0.0001493208110332489, -0.00014522578567266464, -0.00014113076031208038, -0.00013703573495149612, -0.00013294070959091187, -0.0001288456842303276, -0.00012475065886974335, -0.00012065563350915909, -0.00011656060814857483, -0.00011246558278799057, -0.00010837055742740631, -0.00010427553206682205, -0.00010018050670623779, -9.608548134565353e-05, -9.199045598506927e-05, -8.789543062448502e-05, -8.380040526390076e-05, -7.97053799033165e-05, -7.561035454273224e-05, -7.151532918214798e-05, -6.742030382156372e-05, -6.332527846097946e-05, -5.92302531003952e-05, -5.5135227739810944e-05, -5.1040202379226685e-05, -4.6945177018642426e-05, -4.2850151658058167e-05, -3.875512629747391e-05, -3.466010093688965e-05, -3.056507557630539e-05, -2.647005021572113e-05, -2.237502485513687e-05, -1.8279999494552612e-05, -1.4184974133968353e-05, -1.0089948773384094e-05, -5.994923412799835e-06, -1.8998980522155762e-06, 2.195127308368683e-06, 6.290152668952942e-06, 1.0385178029537201e-05, 1.448020339012146e-05, 1.857522875070572e-05, 2.2670254111289978e-05, 2.6765279471874237e-05, 3.0860304832458496e-05, 3.4955330193042755e-05, 3.9050355553627014e-05, 4.314538091421127e-05, 4.724040627479553e-05, 5.133543163537979e-05, 5.543045699596405e-05, 5.952548235654831e-05, 6.362050771713257e-05, 6.771553307771683e-05, 7.181055843830109e-05, 7.590558379888535e-05, 8.00006091594696e-05, 8.409563452005386e-05, 8.819065988063812e-05, 9.228568524122238e-05, 9.638071060180664e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 2.0, 6.0, 3.0, 17.0, 18.0, 25.0, 34.0, 63.0, 75.0, 162.0, 313.0, 711.0, 1804.0, 5311.0, 21146.0, 230386.0, 704729.0, 67817.0, 10672.0, 3090.0, 1160.0, 458.0, 209.0, 140.0, 80.0, 47.0, 25.0, 9.0, 11.0, 9.0, 4.0, 3.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1634521484375, -0.1578693389892578, -0.15228652954101562, -0.14670372009277344, -0.14112091064453125, -0.13553810119628906, -0.12995529174804688, -0.12437248229980469, -0.1187896728515625, -0.11320686340332031, -0.10762405395507812, -0.10204124450683594, -0.09645843505859375, -0.09087562561035156, -0.08529281616210938, -0.07971000671386719, -0.074127197265625, -0.06854438781738281, -0.06296157836914062, -0.05737876892089844, -0.05179595947265625, -0.04621315002441406, -0.040630340576171875, -0.03504753112792969, -0.0294647216796875, -0.023881912231445312, -0.018299102783203125, -0.012716293334960938, -0.00713348388671875, -0.0015506744384765625, 0.004032135009765625, 0.009614944458007812, 0.01519775390625, 0.020780563354492188, 0.026363372802734375, 0.03194618225097656, 0.03752899169921875, 0.04311180114746094, 0.048694610595703125, 0.05427742004394531, 0.0598602294921875, 0.06544303894042969, 0.07102584838867188, 0.07660865783691406, 0.08219146728515625, 0.08777427673339844, 0.09335708618164062, 0.09893989562988281, 0.104522705078125, 0.11010551452636719, 0.11568832397460938, 0.12127113342285156, 0.12685394287109375, 0.13243675231933594, 0.13801956176757812, 0.1436023712158203, 0.1491851806640625, 0.1547679901123047, 0.16035079956054688, 0.16593360900878906, 0.17151641845703125, 0.17709922790527344, 0.18268203735351562, 0.1882648468017578, 0.19384765625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 1.0, 1.0, 2.0, 7.0, 5.0, 11.0, 15.0, 29.0, 35.0, 58.0, 108.0, 138.0, 147.0, 130.0, 108.0, 80.0, 57.0, 25.0, 18.0, 12.0, 4.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09002685546875, -0.08619022369384766, -0.08235359191894531, -0.07851696014404297, -0.07468032836914062, -0.07084369659423828, -0.06700706481933594, -0.0631704330444336, -0.05933380126953125, -0.055497169494628906, -0.05166053771972656, -0.04782390594482422, -0.043987274169921875, -0.04015064239501953, -0.03631401062011719, -0.032477378845214844, -0.0286407470703125, -0.024804115295410156, -0.020967483520507812, -0.01713085174560547, -0.013294219970703125, -0.009457588195800781, -0.0056209564208984375, -0.0017843246459960938, 0.00205230712890625, 0.005888938903808594, 0.009725570678710938, 0.013562202453613281, 0.017398834228515625, 0.02123546600341797, 0.025072097778320312, 0.028908729553222656, 0.032745361328125, 0.036581993103027344, 0.04041862487792969, 0.04425525665283203, 0.048091888427734375, 0.05192852020263672, 0.05576515197753906, 0.059601783752441406, 0.06343841552734375, 0.0672750473022461, 0.07111167907714844, 0.07494831085205078, 0.07878494262695312, 0.08262157440185547, 0.08645820617675781, 0.09029483795166016, 0.0941314697265625, 0.09796810150146484, 0.10180473327636719, 0.10564136505126953, 0.10947799682617188, 0.11331462860107422, 0.11715126037597656, 0.1209878921508789, 0.12482452392578125, 0.1286611557006836, 0.13249778747558594, 0.13633441925048828, 0.14017105102539062, 0.14400768280029297, 0.1478443145751953, 0.15168094635009766, 0.155517578125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 8.0, 7.0, 25.0, 77.0, 189.0, 383.0, 218.0, 59.0, 26.0, 10.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.911895275115967, -2.7886033058166504, -2.665311336517334, -2.5420193672180176, -2.4187276363372803, -2.295435667037964, -2.1721436977386475, -2.048851728439331, -1.9255597591400146, -1.8022677898406982, -1.6789759397506714, -1.555683970451355, -1.4323920011520386, -1.3091001510620117, -1.1858081817626953, -1.062516212463379, -0.939224362373352, -0.8159324526786804, -0.692640483379364, -0.5693485736846924, -0.44605663418769836, -0.32276469469070435, -0.19947278499603271, -0.07618081569671631, 0.04711109399795532, 0.17040303349494934, 0.29369497299194336, 0.416986882686615, 0.5402787923812866, 0.663570761680603, 0.7868626713752747, 0.9101546406745911, 1.0334465503692627, 1.156738519668579, 1.280030369758606, 1.4033223390579224, 1.5266143083572388, 1.6499061584472656, 1.773198127746582, 1.8964900970458984, 2.019782066345215, 2.1430740356445312, 2.2663660049438477, 2.389657974243164, 2.5129497051239014, 2.6362416744232178, 2.759533643722534, 2.8828256130218506, 3.006117343902588, 3.1294093132019043, 3.2527012825012207, 3.375993251800537, 3.4992849826812744, 3.622576951980591, 3.7458689212799072, 3.8691608905792236, 3.99245285987854, 4.115744590759277, 4.239036560058594, 4.36232852935791, 4.485620498657227, 4.608912467956543, 4.732204437255859, 4.855496406555176, 4.978788375854492]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 4.0, 7.0, 8.0, 6.0, 16.0, 19.0, 17.0, 15.0, 29.0, 29.0, 35.0, 39.0, 39.0, 51.0, 43.0, 53.0, 42.0, 74.0, 54.0, 46.0, 50.0, 54.0, 40.0, 37.0, 27.0, 33.0, 30.0, 29.0, 18.0, 11.0, 10.0, 13.0, 11.0, 6.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4132628440856934, -1.359816074371338, -1.3063693046569824, -1.252922534942627, -1.199475884437561, -1.1460291147232056, -1.09258234500885, -1.0391355752944946, -0.9856888055801392, -0.9322420358657837, -0.878795325756073, -0.8253485560417175, -0.7719017863273621, -0.7184550762176514, -0.6650083065032959, -0.6115615367889404, -0.5581148266792297, -0.5046680569648743, -0.4512213170528412, -0.3977745771408081, -0.34432780742645264, -0.29088106751441956, -0.23743432760238647, -0.183987557888031, -0.13054081797599792, -0.07709406316280365, -0.023647315800189972, 0.029799431562423706, 0.08324618637561798, 0.13669294118881226, 0.19013968110084534, 0.2435864508152008, 0.2970331907272339, 0.35047993063926697, 0.40392670035362244, 0.4573734402656555, 0.510820209980011, 0.5642669200897217, 0.6177136898040771, 0.6711604595184326, 0.7246072292327881, 0.7780539989471436, 0.8315007090568542, 0.8849474787712097, 0.9383942484855652, 0.9918409585952759, 1.0452877283096313, 1.0987344980239868, 1.1521811485290527, 1.2056279182434082, 1.2590746879577637, 1.3125214576721191, 1.365968108177185, 1.4194148778915405, 1.472861647605896, 1.5263084173202515, 1.579755187034607, 1.6332019567489624, 1.6866487264633179, 1.7400953769683838, 1.7935421466827393, 1.8469889163970947, 1.9004356861114502, 1.9538824558258057, 2.007329225540161]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 6.0, 4.0, 19.0, 19.0, 27.0, 75.0, 146.0, 375.0, 923.0, 3046.0, 15142.0, 243294.0, 3888614.0, 34492.0, 5147.0, 1379.0, 591.0, 285.0, 181.0, 120.0, 90.0, 70.0, 41.0, 36.0, 23.0, 16.0, 24.0, 15.0, 16.0, 12.0, 12.0, 8.0, 3.0, 9.0, 4.0, 6.0, 4.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.465087890625, -0.4345054626464844, -0.40392303466796875, -0.3733406066894531, -0.3427581787109375, -0.3121757507324219, -0.28159332275390625, -0.2510108947753906, -0.220428466796875, -0.18984603881835938, -0.15926361083984375, -0.12868118286132812, -0.0980987548828125, -0.06751632690429688, -0.03693389892578125, -0.006351470947265625, 0.02423095703125, 0.054813385009765625, 0.08539581298828125, 0.11597824096679688, 0.1465606689453125, 0.17714309692382812, 0.20772552490234375, 0.23830795288085938, 0.268890380859375, 0.2994728088378906, 0.33005523681640625, 0.3606376647949219, 0.3912200927734375, 0.4218025207519531, 0.45238494873046875, 0.4829673767089844, 0.5135498046875, 0.5441322326660156, 0.5747146606445312, 0.6052970886230469, 0.6358795166015625, 0.6664619445800781, 0.6970443725585938, 0.7276268005371094, 0.758209228515625, 0.7887916564941406, 0.8193740844726562, 0.8499565124511719, 0.8805389404296875, 0.9111213684082031, 0.9417037963867188, 0.9722862243652344, 1.00286865234375, 1.0334510803222656, 1.0640335083007812, 1.0946159362792969, 1.1251983642578125, 1.1557807922363281, 1.1863632202148438, 1.2169456481933594, 1.247528076171875, 1.2781105041503906, 1.3086929321289062, 1.3392753601074219, 1.3698577880859375, 1.4004402160644531, 1.4310226440429688, 1.4616050720214844, 1.4921875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 7.0, 21.0, 37.0, 60.0, 125.0, 139.0, 168.0, 164.0, 128.0, 77.0, 48.0, 20.0, 10.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.083251953125, -0.07669448852539062, -0.07013702392578125, -0.06357955932617188, -0.0570220947265625, -0.050464630126953125, -0.04390716552734375, -0.037349700927734375, -0.030792236328125, -0.024234771728515625, -0.01767730712890625, -0.011119842529296875, -0.0045623779296875, 0.001995086669921875, 0.00855255126953125, 0.015110015869140625, 0.02166748046875, 0.028224945068359375, 0.03478240966796875, 0.041339874267578125, 0.0478973388671875, 0.054454803466796875, 0.06101226806640625, 0.06756973266601562, 0.074127197265625, 0.08068466186523438, 0.08724212646484375, 0.09379959106445312, 0.1003570556640625, 0.10691452026367188, 0.11347198486328125, 0.12002944946289062, 0.1265869140625, 0.13314437866210938, 0.13970184326171875, 0.14625930786132812, 0.1528167724609375, 0.15937423706054688, 0.16593170166015625, 0.17248916625976562, 0.179046630859375, 0.18560409545898438, 0.19216156005859375, 0.19871902465820312, 0.2052764892578125, 0.21183395385742188, 0.21839141845703125, 0.22494888305664062, 0.23150634765625, 0.23806381225585938, 0.24462127685546875, 0.2511787414550781, 0.2577362060546875, 0.2642936706542969, 0.27085113525390625, 0.2774085998535156, 0.283966064453125, 0.2905235290527344, 0.29708099365234375, 0.3036384582519531, 0.3101959228515625, 0.3167533874511719, 0.32331085205078125, 0.3298683166503906, 0.33642578125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 7.0, 17.0, 28.0, 37.0, 85.0, 141.0, 307.0, 629.0, 2103.0, 19959.0, 4148945.0, 18391.0, 2170.0, 752.0, 355.0, 159.0, 89.0, 40.0, 36.0, 8.0, 11.0, 6.0, 2.0, 0.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4443359375, -1.395355224609375, -1.34637451171875, -1.297393798828125, -1.2484130859375, -1.199432373046875, -1.15045166015625, -1.101470947265625, -1.052490234375, -1.003509521484375, -0.95452880859375, -0.905548095703125, -0.8565673828125, -0.807586669921875, -0.75860595703125, -0.709625244140625, -0.66064453125, -0.611663818359375, -0.56268310546875, -0.513702392578125, -0.4647216796875, -0.415740966796875, -0.36676025390625, -0.317779541015625, -0.268798828125, -0.219818115234375, -0.17083740234375, -0.121856689453125, -0.0728759765625, -0.023895263671875, 0.02508544921875, 0.074066162109375, 0.123046875, 0.172027587890625, 0.22100830078125, 0.269989013671875, 0.3189697265625, 0.367950439453125, 0.41693115234375, 0.465911865234375, 0.514892578125, 0.563873291015625, 0.61285400390625, 0.661834716796875, 0.7108154296875, 0.759796142578125, 0.80877685546875, 0.857757568359375, 0.90673828125, 0.955718994140625, 1.00469970703125, 1.053680419921875, 1.1026611328125, 1.151641845703125, 1.20062255859375, 1.249603271484375, 1.298583984375, 1.347564697265625, 1.39654541015625, 1.445526123046875, 1.4945068359375, 1.543487548828125, 1.59246826171875, 1.641448974609375, 1.6904296875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 8.0, 3.0, 6.0, 17.0, 54.0, 237.0, 2769.0, 794.0, 111.0, 38.0, 17.0, 11.0, 5.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.220703125, -0.2121429443359375, -0.203582763671875, -0.1950225830078125, -0.18646240234375, -0.1779022216796875, -0.169342041015625, -0.1607818603515625, -0.1522216796875, -0.1436614990234375, -0.135101318359375, -0.1265411376953125, -0.11798095703125, -0.1094207763671875, -0.100860595703125, -0.0923004150390625, -0.083740234375, -0.0751800537109375, -0.066619873046875, -0.0580596923828125, -0.04949951171875, -0.0409393310546875, -0.032379150390625, -0.0238189697265625, -0.0152587890625, -0.0066986083984375, 0.001861572265625, 0.0104217529296875, 0.01898193359375, 0.0275421142578125, 0.036102294921875, 0.0446624755859375, 0.05322265625, 0.0617828369140625, 0.070343017578125, 0.0789031982421875, 0.08746337890625, 0.0960235595703125, 0.104583740234375, 0.1131439208984375, 0.1217041015625, 0.1302642822265625, 0.138824462890625, 0.1473846435546875, 0.15594482421875, 0.1645050048828125, 0.173065185546875, 0.1816253662109375, 0.190185546875, 0.1987457275390625, 0.207305908203125, 0.2158660888671875, 0.22442626953125, 0.2329864501953125, 0.241546630859375, 0.2501068115234375, 0.2586669921875, 0.2672271728515625, 0.275787353515625, 0.2843475341796875, 0.29290771484375, 0.3014678955078125, 0.310028076171875, 0.3185882568359375, 0.3271484375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 7.0, 10.0, 60.0, 338.0, 464.0, 91.0, 25.0, 6.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.004013776779175, -2.925145149230957, -2.8462765216827393, -2.7674078941345215, -2.6885392665863037, -2.609670639038086, -2.530802011489868, -2.4519333839416504, -2.3730649948120117, -2.294196367263794, -2.215327739715576, -2.1364591121673584, -2.0575904846191406, -1.9787218570709229, -1.8998533487319946, -1.8209847211837769, -1.7421159744262695, -1.6632473468780518, -1.584378719329834, -1.5055100917816162, -1.4266414642333984, -1.3477728366851807, -1.2689043283462524, -1.1900357007980347, -1.111167073249817, -1.0322984457015991, -0.9534298181533813, -0.8745612502098083, -0.7956926226615906, -0.7168239951133728, -0.6379554271697998, -0.559086799621582, -0.48021793365478516, -0.4013493061065674, -0.322480708360672, -0.24361209571361542, -0.16474348306655884, -0.08587485551834106, -0.007006257772445679, 0.07186233997344971, 0.15073096752166748, 0.22959958016872406, 0.30846819281578064, 0.387336790561676, 0.4662054181098938, 0.5450740456581116, 0.6239426136016846, 0.7028112411499023, 0.7816798686981201, 0.8605484962463379, 0.9394171237945557, 1.0182857513427734, 1.0971543788909912, 1.176023006439209, 1.2548915147781372, 1.333760142326355, 1.4126287698745728, 1.4914973974227905, 1.5703660249710083, 1.649234652519226, 1.7281031608581543, 1.806971788406372, 1.8858404159545898, 1.9647090435028076, 2.0435776710510254]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 5.0, 11.0, 1.0, 11.0, 7.0, 18.0, 17.0, 32.0, 46.0, 48.0, 55.0, 55.0, 78.0, 66.0, 66.0, 68.0, 71.0, 62.0, 55.0, 48.0, 45.0, 40.0, 18.0, 25.0, 16.0, 15.0, 12.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.6948535442352295, -0.6740829348564148, -0.6533122658729553, -0.6325416564941406, -0.6117710471153259, -0.5910004377365112, -0.5702297687530518, -0.5494591593742371, -0.5286885499954224, -0.5079179406166077, -0.4871473014354706, -0.4663766622543335, -0.4456060528755188, -0.4248354136943817, -0.40406477451324463, -0.38329416513442993, -0.36252349615097046, -0.3417528569698334, -0.3209822475910187, -0.3002116084098816, -0.2794409990310669, -0.2586703598499298, -0.23789972066879272, -0.21712909638881683, -0.19635847210884094, -0.17558784782886505, -0.15481722354888916, -0.13404658436775208, -0.11327596008777618, -0.09250533580780029, -0.0717347040772438, -0.05096407234668732, -0.030193448066711426, -0.009422820061445236, 0.011347807943820953, 0.03211843594908714, 0.05288906395435333, 0.07365968823432922, 0.09443031996488571, 0.1152009516954422, 0.1359715759754181, 0.15674220025539398, 0.17751282453536987, 0.19828346371650696, 0.21905408799648285, 0.23982471227645874, 0.2605953514575958, 0.2813659906387329, 0.3021366000175476, 0.3229072391986847, 0.3436778485774994, 0.3644484877586365, 0.38521909713745117, 0.40598973631858826, 0.42676037549972534, 0.44753098487854004, 0.4683016240596771, 0.4890722632408142, 0.5098428726196289, 0.5306134819984436, 0.5513841509819031, 0.5721547603607178, 0.5929253697395325, 0.6136960387229919, 0.6344666481018066]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 6.0, 10.0, 13.0, 24.0, 20.0, 39.0, 45.0, 97.0, 186.0, 422.0, 1227.0, 5814.0, 148310.0, 866920.0, 21686.0, 2471.0, 715.0, 256.0, 121.0, 54.0, 41.0, 36.0, 16.0, 13.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.56640625, -1.52545166015625, -1.4844970703125, -1.44354248046875, -1.402587890625, -1.36163330078125, -1.3206787109375, -1.27972412109375, -1.23876953125, -1.19781494140625, -1.1568603515625, -1.11590576171875, -1.074951171875, -1.03399658203125, -0.9930419921875, -0.95208740234375, -0.9111328125, -0.87017822265625, -0.8292236328125, -0.78826904296875, -0.747314453125, -0.70635986328125, -0.6654052734375, -0.62445068359375, -0.58349609375, -0.54254150390625, -0.5015869140625, -0.46063232421875, -0.419677734375, -0.37872314453125, -0.3377685546875, -0.29681396484375, -0.255859375, -0.21490478515625, -0.1739501953125, -0.13299560546875, -0.092041015625, -0.05108642578125, -0.0101318359375, 0.03082275390625, 0.07177734375, 0.11273193359375, 0.1536865234375, 0.19464111328125, 0.235595703125, 0.27655029296875, 0.3175048828125, 0.35845947265625, 0.3994140625, 0.44036865234375, 0.4813232421875, 0.52227783203125, 0.563232421875, 0.60418701171875, 0.6451416015625, 0.68609619140625, 0.72705078125, 0.76800537109375, 0.8089599609375, 0.84991455078125, 0.890869140625, 0.93182373046875, 0.9727783203125, 1.01373291015625, 1.0546875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 1.0, 5.0, 9.0, 16.0, 37.0, 58.0, 78.0, 121.0, 128.0, 150.0, 135.0, 108.0, 78.0, 38.0, 25.0, 11.0, 6.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08734130859375, -0.08079242706298828, -0.07424354553222656, -0.06769466400146484, -0.061145782470703125, -0.054596900939941406, -0.04804801940917969, -0.04149913787841797, -0.03495025634765625, -0.02840137481689453, -0.021852493286132812, -0.015303611755371094, -0.008754730224609375, -0.0022058486938476562, 0.0043430328369140625, 0.010891914367675781, 0.0174407958984375, 0.02398967742919922, 0.030538558959960938, 0.037087440490722656, 0.043636322021484375, 0.050185203552246094, 0.05673408508300781, 0.06328296661376953, 0.06983184814453125, 0.07638072967529297, 0.08292961120605469, 0.0894784927368164, 0.09602737426757812, 0.10257625579833984, 0.10912513732910156, 0.11567401885986328, 0.122222900390625, 0.12877178192138672, 0.13532066345214844, 0.14186954498291016, 0.14841842651367188, 0.1549673080444336, 0.1615161895751953, 0.16806507110595703, 0.17461395263671875, 0.18116283416748047, 0.1877117156982422, 0.1942605972290039, 0.20080947875976562, 0.20735836029052734, 0.21390724182128906, 0.22045612335205078, 0.2270050048828125, 0.23355388641357422, 0.24010276794433594, 0.24665164947509766, 0.2532005310058594, 0.2597494125366211, 0.2662982940673828, 0.27284717559814453, 0.27939605712890625, 0.28594493865966797, 0.2924938201904297, 0.2990427017211914, 0.3055915832519531, 0.31214046478271484, 0.31868934631347656, 0.3252382278442383, 0.331787109375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 6.0, 2.0, 11.0, 9.0, 15.0, 25.0, 32.0, 50.0, 94.0, 185.0, 401.0, 927.0, 2265.0, 7543.0, 47571.0, 770289.0, 195701.0, 16908.0, 3930.0, 1325.0, 582.0, 291.0, 163.0, 77.0, 41.0, 32.0, 27.0, 18.0, 10.0, 7.0, 2.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5546875, -0.5313262939453125, -0.507965087890625, -0.4846038818359375, -0.46124267578125, -0.4378814697265625, -0.414520263671875, -0.3911590576171875, -0.3677978515625, -0.3444366455078125, -0.321075439453125, -0.2977142333984375, -0.27435302734375, -0.2509918212890625, -0.227630615234375, -0.2042694091796875, -0.180908203125, -0.1575469970703125, -0.134185791015625, -0.1108245849609375, -0.08746337890625, -0.0641021728515625, -0.040740966796875, -0.0173797607421875, 0.0059814453125, 0.0293426513671875, 0.052703857421875, 0.0760650634765625, 0.09942626953125, 0.1227874755859375, 0.146148681640625, 0.1695098876953125, 0.19287109375, 0.2162322998046875, 0.239593505859375, 0.2629547119140625, 0.28631591796875, 0.3096771240234375, 0.333038330078125, 0.3563995361328125, 0.3797607421875, 0.4031219482421875, 0.426483154296875, 0.4498443603515625, 0.47320556640625, 0.4965667724609375, 0.519927978515625, 0.5432891845703125, 0.566650390625, 0.5900115966796875, 0.613372802734375, 0.6367340087890625, 0.66009521484375, 0.6834564208984375, 0.706817626953125, 0.7301788330078125, 0.7535400390625, 0.7769012451171875, 0.800262451171875, 0.8236236572265625, 0.84698486328125, 0.8703460693359375, 0.893707275390625, 0.9170684814453125, 0.9404296875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 7.0, 6.0, 14.0, 10.0, 16.0, 21.0, 36.0, 44.0, 55.0, 78.0, 84.0, 77.0, 98.0, 96.0, 71.0, 48.0, 50.0, 43.0, 40.0, 27.0, 19.0, 23.0, 10.0, 3.0, 4.0, 3.0, 4.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4638671875, -0.44628143310546875, -0.4286956787109375, -0.41110992431640625, -0.393524169921875, -0.37593841552734375, -0.3583526611328125, -0.34076690673828125, -0.32318115234375, -0.30559539794921875, -0.2880096435546875, -0.27042388916015625, -0.252838134765625, -0.23525238037109375, -0.2176666259765625, -0.20008087158203125, -0.1824951171875, -0.16490936279296875, -0.1473236083984375, -0.12973785400390625, -0.112152099609375, -0.09456634521484375, -0.0769805908203125, -0.05939483642578125, -0.04180908203125, -0.02422332763671875, -0.0066375732421875, 0.01094818115234375, 0.028533935546875, 0.04611968994140625, 0.0637054443359375, 0.08129119873046875, 0.098876953125, 0.11646270751953125, 0.1340484619140625, 0.15163421630859375, 0.169219970703125, 0.18680572509765625, 0.2043914794921875, 0.22197723388671875, 0.23956298828125, 0.25714874267578125, 0.2747344970703125, 0.29232025146484375, 0.309906005859375, 0.32749176025390625, 0.3450775146484375, 0.36266326904296875, 0.3802490234375, 0.39783477783203125, 0.4154205322265625, 0.43300628662109375, 0.450592041015625, 0.46817779541015625, 0.4857635498046875, 0.5033493041992188, 0.52093505859375, 0.5385208129882812, 0.5561065673828125, 0.5736923217773438, 0.591278076171875, 0.6088638305664062, 0.6264495849609375, 0.6440353393554688, 0.66162109375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 1.0, 4.0, 2.0, 3.0, 13.0, 17.0, 30.0, 45.0, 53.0, 88.0, 177.0, 320.0, 736.0, 2177.0, 9480.0, 101504.0, 806593.0, 113455.0, 9968.0, 2280.0, 799.0, 365.0, 176.0, 77.0, 66.0, 38.0, 23.0, 16.0, 15.0, 8.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1741943359375, -0.16762542724609375, -0.1610565185546875, -0.15448760986328125, -0.147918701171875, -0.14134979248046875, -0.1347808837890625, -0.12821197509765625, -0.12164306640625, -0.11507415771484375, -0.1085052490234375, -0.10193634033203125, -0.095367431640625, -0.08879852294921875, -0.0822296142578125, -0.07566070556640625, -0.069091796875, -0.06252288818359375, -0.0559539794921875, -0.04938507080078125, -0.042816162109375, -0.03624725341796875, -0.0296783447265625, -0.02310943603515625, -0.01654052734375, -0.00997161865234375, -0.0034027099609375, 0.00316619873046875, 0.009735107421875, 0.01630401611328125, 0.0228729248046875, 0.02944183349609375, 0.0360107421875, 0.04257965087890625, 0.0491485595703125, 0.05571746826171875, 0.062286376953125, 0.06885528564453125, 0.0754241943359375, 0.08199310302734375, 0.08856201171875, 0.09513092041015625, 0.1016998291015625, 0.10826873779296875, 0.114837646484375, 0.12140655517578125, 0.1279754638671875, 0.13454437255859375, 0.14111328125, 0.14768218994140625, 0.1542510986328125, 0.16082000732421875, 0.167388916015625, 0.17395782470703125, 0.1805267333984375, 0.18709564208984375, 0.19366455078125, 0.20023345947265625, 0.2068023681640625, 0.21337127685546875, 0.219940185546875, 0.22650909423828125, 0.2330780029296875, 0.23964691162109375, 0.2462158203125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 10.0, 5.0, 10.0, 16.0, 28.0, 30.0, 65.0, 69.0, 106.0, 124.0, 142.0, 120.0, 92.0, 63.0, 48.0, 23.0, 13.0, 18.0, 6.0, 8.0, 5.0, 4.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001919269561767578, -0.0001851152628660202, -0.0001783035695552826, -0.00017149187624454498, -0.00016468018293380737, -0.00015786848962306976, -0.00015105679631233215, -0.00014424510300159454, -0.00013743340969085693, -0.00013062171638011932, -0.00012381002306938171, -0.0001169983297586441, -0.0001101866364479065, -0.00010337494313716888, -9.656324982643127e-05, -8.975155651569366e-05, -8.293986320495605e-05, -7.612816989421844e-05, -6.931647658348083e-05, -6.250478327274323e-05, -5.5693089962005615e-05, -4.8881396651268005e-05, -4.2069703340530396e-05, -3.5258010029792786e-05, -2.8446316719055176e-05, -2.1634623408317566e-05, -1.4822930097579956e-05, -8.011236786842346e-06, -1.1995434761047363e-06, 5.6121498346328735e-06, 1.2423843145370483e-05, 1.9235536456108093e-05, 2.6047229766845703e-05, 3.285892307758331e-05, 3.967061638832092e-05, 4.648230969905853e-05, 5.329400300979614e-05, 6.010569632053375e-05, 6.691738963127136e-05, 7.372908294200897e-05, 8.054077625274658e-05, 8.735246956348419e-05, 9.41641628742218e-05, 0.00010097585618495941, 0.00010778754949569702, 0.00011459924280643463, 0.00012141093611717224, 0.00012822262942790985, 0.00013503432273864746, 0.00014184601604938507, 0.00014865770936012268, 0.0001554694026708603, 0.0001622810959815979, 0.0001690927892923355, 0.00017590448260307312, 0.00018271617591381073, 0.00018952786922454834, 0.00019633956253528595, 0.00020315125584602356, 0.00020996294915676117, 0.00021677464246749878, 0.0002235863357782364, 0.000230398029088974, 0.0002372097223997116, 0.00024402141571044922]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 9.0, 5.0, 9.0, 10.0, 15.0, 35.0, 58.0, 84.0, 188.0, 353.0, 757.0, 2014.0, 7452.0, 55792.0, 730115.0, 229255.0, 16755.0, 3489.0, 1143.0, 492.0, 222.0, 126.0, 49.0, 46.0, 23.0, 18.0, 8.0, 9.0, 5.0, 4.0, 8.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1810302734375, -0.1749420166015625, -0.168853759765625, -0.1627655029296875, -0.15667724609375, -0.1505889892578125, -0.144500732421875, -0.1384124755859375, -0.13232421875, -0.1262359619140625, -0.120147705078125, -0.1140594482421875, -0.10797119140625, -0.1018829345703125, -0.095794677734375, -0.0897064208984375, -0.0836181640625, -0.0775299072265625, -0.071441650390625, -0.0653533935546875, -0.05926513671875, -0.0531768798828125, -0.047088623046875, -0.0410003662109375, -0.034912109375, -0.0288238525390625, -0.022735595703125, -0.0166473388671875, -0.01055908203125, -0.0044708251953125, 0.001617431640625, 0.0077056884765625, 0.0137939453125, 0.0198822021484375, 0.025970458984375, 0.0320587158203125, 0.03814697265625, 0.0442352294921875, 0.050323486328125, 0.0564117431640625, 0.0625, 0.0685882568359375, 0.074676513671875, 0.0807647705078125, 0.08685302734375, 0.0929412841796875, 0.099029541015625, 0.1051177978515625, 0.1112060546875, 0.1172943115234375, 0.123382568359375, 0.1294708251953125, 0.13555908203125, 0.1416473388671875, 0.147735595703125, 0.1538238525390625, 0.159912109375, 0.1660003662109375, 0.172088623046875, 0.1781768798828125, 0.18426513671875, 0.1903533935546875, 0.196441650390625, 0.2025299072265625, 0.2086181640625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 6.0, 5.0, 10.0, 11.0, 10.0, 26.0, 34.0, 71.0, 105.0, 134.0, 183.0, 140.0, 116.0, 65.0, 33.0, 14.0, 15.0, 7.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.134521484375, -0.1299571990966797, -0.12539291381835938, -0.12082862854003906, -0.11626434326171875, -0.11170005798339844, -0.10713577270507812, -0.10257148742675781, -0.0980072021484375, -0.09344291687011719, -0.08887863159179688, -0.08431434631347656, -0.07975006103515625, -0.07518577575683594, -0.07062149047851562, -0.06605720520019531, -0.061492919921875, -0.05692863464355469, -0.052364349365234375, -0.04780006408691406, -0.04323577880859375, -0.03867149353027344, -0.034107208251953125, -0.029542922973632812, -0.0249786376953125, -0.020414352416992188, -0.015850067138671875, -0.011285781860351562, -0.00672149658203125, -0.0021572113037109375, 0.002407073974609375, 0.0069713592529296875, 0.01153564453125, 0.016099929809570312, 0.020664215087890625, 0.025228500366210938, 0.02979278564453125, 0.03435707092285156, 0.038921356201171875, 0.04348564147949219, 0.0480499267578125, 0.05261421203613281, 0.057178497314453125, 0.06174278259277344, 0.06630706787109375, 0.07087135314941406, 0.07543563842773438, 0.07999992370605469, 0.084564208984375, 0.08912849426269531, 0.09369277954101562, 0.09825706481933594, 0.10282135009765625, 0.10738563537597656, 0.11194992065429688, 0.11651420593261719, 0.1210784912109375, 0.1256427764892578, 0.13020706176757812, 0.13477134704589844, 0.13933563232421875, 0.14389991760253906, 0.14846420288085938, 0.1530284881591797, 0.1575927734375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 6.0, 14.0, 40.0, 80.0, 241.0, 301.0, 183.0, 75.0, 37.0, 8.0, 10.0, 6.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3282575607299805, -3.192124605178833, -3.0559914112091064, -2.919858455657959, -2.7837252616882324, -2.647592306137085, -2.5114593505859375, -2.375326156616211, -2.2391929626464844, -2.103060007095337, -1.9669268131256104, -1.830793857574463, -1.6946606636047363, -1.5585277080535889, -1.4223946332931519, -1.2862615585327148, -1.1501286029815674, -1.0139955282211304, -0.8778624534606934, -0.7417294383049011, -0.6055963635444641, -0.4694632887840271, -0.33333027362823486, -0.19719719886779785, -0.06106412410736084, 0.07506893575191498, 0.2112019956111908, 0.3473350405693054, 0.48346811532974243, 0.6196011900901794, 0.7557342052459717, 0.8918672800064087, 1.0280003547668457, 1.1641334295272827, 1.3002665042877197, 1.4363994598388672, 1.5725326538085938, 1.7086656093597412, 1.8447986841201782, 1.9809317588806152, 2.117064952850342, 2.2531979084014893, 2.389331102371216, 2.5254640579223633, 2.66159725189209, 2.7977302074432373, 2.9338631629943848, 3.0699963569641113, 3.206129312515259, 3.3422622680664062, 3.478395462036133, 3.6145284175872803, 3.750661611557007, 3.8867945671081543, 4.022927761077881, 4.159060478210449, 4.295193672180176, 4.431326866149902, 4.567459583282471, 4.703592777252197, 4.839725971221924, 4.97585916519165, 5.111991882324219, 5.248125076293945, 5.384258270263672]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 4.0, 6.0, 12.0, 12.0, 9.0, 10.0, 22.0, 34.0, 20.0, 28.0, 35.0, 32.0, 39.0, 35.0, 37.0, 50.0, 58.0, 49.0, 52.0, 55.0, 39.0, 32.0, 43.0, 42.0, 31.0, 21.0, 27.0, 31.0, 28.0, 15.0, 8.0, 15.0, 14.0, 12.0, 11.0, 12.0, 5.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-1.8244390487670898, -1.764106273651123, -1.7037734985351562, -1.6434407234191895, -1.5831079483032227, -1.5227751731872559, -1.462442398071289, -1.4021096229553223, -1.3417768478393555, -1.2814440727233887, -1.2211112976074219, -1.160778522491455, -1.1004457473754883, -1.0401129722595215, -0.9797801375389099, -0.9194473624229431, -0.8591145277023315, -0.7987817525863647, -0.738448977470398, -0.6781162023544312, -0.6177834272384644, -0.5574506521224976, -0.497117817401886, -0.4367850422859192, -0.3764522671699524, -0.3161194920539856, -0.2557867169380188, -0.19545391201972961, -0.13512113690376282, -0.07478836178779602, -0.014455556869506836, 0.04587721824645996, 0.10620999336242676, 0.16654276847839355, 0.22687555849552155, 0.28720834851264954, 0.34754112362861633, 0.40787389874458313, 0.4682067036628723, 0.5285394787788391, 0.5888722538948059, 0.6492050290107727, 0.7095378041267395, 0.7698706388473511, 0.8302034139633179, 0.8905361890792847, 0.9508689641952515, 1.0112017393112183, 1.071534514427185, 1.1318672895431519, 1.1922000646591187, 1.2525328397750854, 1.3128656148910522, 1.373198390007019, 1.4335312843322754, 1.4938640594482422, 1.554196834564209, 1.6145296096801758, 1.6748623847961426, 1.7351951599121094, 1.7955279350280762, 1.855860710144043, 1.9161934852600098, 1.9765262603759766, 2.0368590354919434]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 9.0, 18.0, 55.0, 171.0, 474.0, 1645.0, 7558.0, 62672.0, 4013969.0, 94875.0, 9070.0, 1997.0, 735.0, 332.0, 205.0, 116.0, 81.0, 63.0, 50.0, 39.0, 24.0, 17.0, 20.0, 17.0, 14.0, 8.0, 4.0, 8.0, 5.0, 10.0, 8.0, 4.0, 2.0, 0.0, 4.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.488525390625, -0.4463157653808594, -0.40410614013671875, -0.3618965148925781, -0.3196868896484375, -0.2774772644042969, -0.23526763916015625, -0.19305801391601562, -0.150848388671875, -0.10863876342773438, -0.06642913818359375, -0.024219512939453125, 0.0179901123046875, 0.060199737548828125, 0.10240936279296875, 0.14461898803710938, 0.18682861328125, 0.22903823852539062, 0.27124786376953125, 0.3134574890136719, 0.3556671142578125, 0.3978767395019531, 0.44008636474609375, 0.4822959899902344, 0.524505615234375, 0.5667152404785156, 0.6089248657226562, 0.6511344909667969, 0.6933441162109375, 0.7355537414550781, 0.7777633666992188, 0.8199729919433594, 0.8621826171875, 0.9043922424316406, 0.9466018676757812, 0.9888114929199219, 1.0310211181640625, 1.0732307434082031, 1.1154403686523438, 1.1576499938964844, 1.199859619140625, 1.2420692443847656, 1.2842788696289062, 1.3264884948730469, 1.3686981201171875, 1.4109077453613281, 1.4531173706054688, 1.4953269958496094, 1.53753662109375, 1.5797462463378906, 1.6219558715820312, 1.6641654968261719, 1.7063751220703125, 1.7485847473144531, 1.7907943725585938, 1.8330039978027344, 1.875213623046875, 1.9174232482910156, 1.9596328735351562, 2.001842498779297, 2.0440521240234375, 2.086261749267578, 2.1284713745117188, 2.1706809997558594, 2.212890625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 2.0, 12.0, 21.0, 42.0, 50.0, 88.0, 137.0, 142.0, 137.0, 128.0, 108.0, 58.0, 52.0, 18.0, 8.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07281494140625, -0.06629085540771484, -0.05976676940917969, -0.05324268341064453, -0.046718597412109375, -0.04019451141357422, -0.03367042541503906, -0.027146339416503906, -0.02062225341796875, -0.014098167419433594, -0.0075740814208984375, -0.0010499954223632812, 0.005474090576171875, 0.011998176574707031, 0.018522262573242188, 0.025046348571777344, 0.0315704345703125, 0.038094520568847656, 0.04461860656738281, 0.05114269256591797, 0.057666778564453125, 0.06419086456298828, 0.07071495056152344, 0.0772390365600586, 0.08376312255859375, 0.0902872085571289, 0.09681129455566406, 0.10333538055419922, 0.10985946655273438, 0.11638355255126953, 0.12290763854980469, 0.12943172454833984, 0.135955810546875, 0.14247989654541016, 0.1490039825439453, 0.15552806854248047, 0.16205215454101562, 0.16857624053955078, 0.17510032653808594, 0.1816244125366211, 0.18814849853515625, 0.1946725845336914, 0.20119667053222656, 0.20772075653076172, 0.21424484252929688, 0.22076892852783203, 0.2272930145263672, 0.23381710052490234, 0.2403411865234375, 0.24686527252197266, 0.2533893585205078, 0.25991344451904297, 0.2664375305175781, 0.2729616165161133, 0.27948570251464844, 0.2860097885131836, 0.29253387451171875, 0.2990579605102539, 0.30558204650878906, 0.3121061325073242, 0.3186302185058594, 0.32515430450439453, 0.3316783905029297, 0.33820247650146484, 0.3447265625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 4.0, 6.0, 10.0, 20.0, 40.0, 46.0, 109.0, 244.0, 931.0, 6807.0, 4112493.0, 68397.0, 3773.0, 823.0, 263.0, 116.0, 57.0, 42.0, 37.0, 28.0, 16.0, 11.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.41796875, -2.30712890625, -2.1962890625, -2.08544921875, -1.974609375, -1.86376953125, -1.7529296875, -1.64208984375, -1.53125, -1.42041015625, -1.3095703125, -1.19873046875, -1.087890625, -0.97705078125, -0.8662109375, -0.75537109375, -0.64453125, -0.53369140625, -0.4228515625, -0.31201171875, -0.201171875, -0.09033203125, 0.0205078125, 0.13134765625, 0.2421875, 0.35302734375, 0.4638671875, 0.57470703125, 0.685546875, 0.79638671875, 0.9072265625, 1.01806640625, 1.12890625, 1.23974609375, 1.3505859375, 1.46142578125, 1.572265625, 1.68310546875, 1.7939453125, 1.90478515625, 2.015625, 2.12646484375, 2.2373046875, 2.34814453125, 2.458984375, 2.56982421875, 2.6806640625, 2.79150390625, 2.90234375, 3.01318359375, 3.1240234375, 3.23486328125, 3.345703125, 3.45654296875, 3.5673828125, 3.67822265625, 3.7890625, 3.89990234375, 4.0107421875, 4.12158203125, 4.232421875, 4.34326171875, 4.4541015625, 4.56494140625, 4.67578125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 4.0, 4.0, 3.0, 5.0, 12.0, 25.0, 73.0, 2441.0, 1340.0, 102.0, 25.0, 16.0, 5.0, 5.0, 5.0, 2.0, 5.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.302978515625, -0.2753257751464844, -0.24767303466796875, -0.22002029418945312, -0.1923675537109375, -0.16471481323242188, -0.13706207275390625, -0.10940933227539062, -0.081756591796875, -0.054103851318359375, -0.02645111083984375, 0.001201629638671875, 0.0288543701171875, 0.056507110595703125, 0.08415985107421875, 0.11181259155273438, 0.13946533203125, 0.16711807250976562, 0.19477081298828125, 0.22242355346679688, 0.2500762939453125, 0.2777290344238281, 0.30538177490234375, 0.3330345153808594, 0.360687255859375, 0.3883399963378906, 0.41599273681640625, 0.4436454772949219, 0.4712982177734375, 0.4989509582519531, 0.5266036987304688, 0.5542564392089844, 0.5819091796875, 0.6095619201660156, 0.6372146606445312, 0.6648674011230469, 0.6925201416015625, 0.7201728820800781, 0.7478256225585938, 0.7754783630371094, 0.803131103515625, 0.8307838439941406, 0.8584365844726562, 0.8860893249511719, 0.9137420654296875, 0.9413948059082031, 0.9690475463867188, 0.9967002868652344, 1.02435302734375, 1.0520057678222656, 1.0796585083007812, 1.1073112487792969, 1.1349639892578125, 1.1626167297363281, 1.1902694702148438, 1.2179222106933594, 1.245574951171875, 1.2732276916503906, 1.3008804321289062, 1.3285331726074219, 1.3561859130859375, 1.3838386535644531, 1.4114913940429688, 1.4391441345214844, 1.466796875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 15.0, 74.0, 447.0, 370.0, 62.0, 21.0, 7.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.511024236679077, -2.3305482864379883, -2.1500725746154785, -1.9695967435836792, -1.7891209125518799, -1.6086450815200806, -1.4281692504882812, -1.247693419456482, -1.0672175884246826, -0.8867417573928833, -0.706265926361084, -0.5257900953292847, -0.34531426429748535, -0.16483843326568604, 0.01563739776611328, 0.1961132287979126, 0.3765890598297119, 0.5570648908615112, 0.7375407218933105, 0.9180165529251099, 1.0984923839569092, 1.2789682149887085, 1.4594440460205078, 1.6399198770523071, 1.8203957080841064, 2.0008716583251953, 2.181347370147705, 2.361823081970215, 2.5422990322113037, 2.7227749824523926, 2.9032506942749023, 3.083726406097412, 3.264202117919922, 3.4446778297424316, 3.6251537799835205, 3.8056297302246094, 3.986105442047119, 4.166581153869629, 4.347057342529297, 4.527533054351807, 4.708008766174316, 4.888484477996826, 5.068960189819336, 5.249436378479004, 5.429912090301514, 5.610387802124023, 5.790863990783691, 5.971339702606201, 6.151815414428711, 6.332291126251221, 6.5127668380737305, 6.693243026733398, 6.873718738555908, 7.054194450378418, 7.234670639038086, 7.415146350860596, 7.5956220626831055, 7.776097774505615, 7.956573486328125, 8.137049674987793, 8.317525863647461, 8.498001098632812, 8.67847728729248, 8.858952522277832, 9.0394287109375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 6.0, 12.0, 36.0, 61.0, 98.0, 131.0, 148.0, 174.0, 139.0, 77.0, 66.0, 36.0, 12.0, 8.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7043089866638184, -3.5832324028015137, -3.462155818939209, -3.3410792350769043, -3.2200026512145996, -3.098926067352295, -2.9778494834899902, -2.8567731380462646, -2.73569655418396, -2.6146199703216553, -2.4935433864593506, -2.372466802597046, -2.251390218734741, -2.1303138732910156, -2.009237289428711, -1.8881607055664062, -1.767084002494812, -1.6460074186325073, -1.5249308347702026, -1.4038543701171875, -1.2827777862548828, -1.1617012023925781, -1.0406246185302734, -0.9195480942726135, -0.7984715104103088, -0.6773949265480042, -0.5563184022903442, -0.43524181842803955, -0.31416526436805725, -0.19308871030807495, -0.07201212644577026, 0.04906439781188965, 0.17014098167419434, 0.29121753573417664, 0.41229408979415894, 0.5333706736564636, 0.6544471979141235, 0.7755237817764282, 0.8966003656387329, 1.017676830291748, 1.1387534141540527, 1.2598299980163574, 1.380906581878662, 1.5019831657409668, 1.623059630393982, 1.7441362142562866, 1.8652127981185913, 1.9862892627716064, 2.1073660850524902, 2.228442668914795, 2.3495192527770996, 2.4705958366394043, 2.591672420501709, 2.7127490043640137, 2.8338255882263184, 2.954901933670044, 3.0759785175323486, 3.1970551013946533, 3.318131685256958, 3.4392082691192627, 3.5602848529815674, 3.681361198425293, 3.8024377822875977, 3.9235143661499023, 4.044590950012207]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 3.0, 4.0, 12.0, 14.0, 20.0, 26.0, 32.0, 54.0, 86.0, 95.0, 193.0, 356.0, 633.0, 1755.0, 9214.0, 147327.0, 832089.0, 49430.0, 4734.0, 1175.0, 511.0, 282.0, 158.0, 101.0, 66.0, 50.0, 42.0, 24.0, 14.0, 17.0, 12.0, 9.0, 6.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1572265625, -1.1262283325195312, -1.0952301025390625, -1.0642318725585938, -1.033233642578125, -1.0022354125976562, -0.9712371826171875, -0.9402389526367188, -0.90924072265625, -0.8782424926757812, -0.8472442626953125, -0.8162460327148438, -0.785247802734375, -0.7542495727539062, -0.7232513427734375, -0.6922531127929688, -0.6612548828125, -0.6302566528320312, -0.5992584228515625, -0.5682601928710938, -0.537261962890625, -0.5062637329101562, -0.4752655029296875, -0.44426727294921875, -0.41326904296875, -0.38227081298828125, -0.3512725830078125, -0.32027435302734375, -0.289276123046875, -0.25827789306640625, -0.2272796630859375, -0.19628143310546875, -0.165283203125, -0.13428497314453125, -0.1032867431640625, -0.07228851318359375, -0.041290283203125, -0.01029205322265625, 0.0207061767578125, 0.05170440673828125, 0.08270263671875, 0.11370086669921875, 0.1446990966796875, 0.17569732666015625, 0.206695556640625, 0.23769378662109375, 0.2686920166015625, 0.29969024658203125, 0.3306884765625, 0.36168670654296875, 0.3926849365234375, 0.42368316650390625, 0.454681396484375, 0.48567962646484375, 0.5166778564453125, 0.5476760864257812, 0.57867431640625, 0.6096725463867188, 0.6406707763671875, 0.6716690063476562, 0.702667236328125, 0.7336654663085938, 0.7646636962890625, 0.7956619262695312, 0.82666015625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 8.0, 16.0, 39.0, 72.0, 137.0, 164.0, 153.0, 158.0, 117.0, 76.0, 45.0, 17.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2000732421875, -0.19156455993652344, -0.18305587768554688, -0.1745471954345703, -0.16603851318359375, -0.1575298309326172, -0.14902114868164062, -0.14051246643066406, -0.1320037841796875, -0.12349510192871094, -0.11498641967773438, -0.10647773742675781, -0.09796905517578125, -0.08946037292480469, -0.08095169067382812, -0.07244300842285156, -0.063934326171875, -0.05542564392089844, -0.046916961669921875, -0.03840827941894531, -0.02989959716796875, -0.021390914916992188, -0.012882232666015625, -0.0043735504150390625, 0.0041351318359375, 0.012643814086914062, 0.021152496337890625, 0.029661178588867188, 0.03816986083984375, 0.04667854309082031, 0.055187225341796875, 0.06369590759277344, 0.07220458984375, 0.08071327209472656, 0.08922195434570312, 0.09773063659667969, 0.10623931884765625, 0.11474800109863281, 0.12325668334960938, 0.13176536560058594, 0.1402740478515625, 0.14878273010253906, 0.15729141235351562, 0.1658000946044922, 0.17430877685546875, 0.1828174591064453, 0.19132614135742188, 0.19983482360839844, 0.208343505859375, 0.21685218811035156, 0.22536087036132812, 0.2338695526123047, 0.24237823486328125, 0.2508869171142578, 0.2593955993652344, 0.26790428161621094, 0.2764129638671875, 0.28492164611816406, 0.2934303283691406, 0.3019390106201172, 0.31044769287109375, 0.3189563751220703, 0.3274650573730469, 0.33597373962402344, 0.344482421875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 5.0, 7.0, 7.0, 14.0, 12.0, 20.0, 29.0, 40.0, 77.0, 129.0, 256.0, 553.0, 1413.0, 4775.0, 20745.0, 151283.0, 701305.0, 140833.0, 19910.0, 4667.0, 1397.0, 510.0, 223.0, 134.0, 64.0, 44.0, 36.0, 19.0, 18.0, 9.0, 9.0, 7.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38330078125, -0.369354248046875, -0.35540771484375, -0.341461181640625, -0.3275146484375, -0.313568115234375, -0.29962158203125, -0.285675048828125, -0.271728515625, -0.257781982421875, -0.24383544921875, -0.229888916015625, -0.2159423828125, -0.201995849609375, -0.18804931640625, -0.174102783203125, -0.16015625, -0.146209716796875, -0.13226318359375, -0.118316650390625, -0.1043701171875, -0.090423583984375, -0.07647705078125, -0.062530517578125, -0.048583984375, -0.034637451171875, -0.02069091796875, -0.006744384765625, 0.0072021484375, 0.021148681640625, 0.03509521484375, 0.049041748046875, 0.06298828125, 0.076934814453125, 0.09088134765625, 0.104827880859375, 0.1187744140625, 0.132720947265625, 0.14666748046875, 0.160614013671875, 0.174560546875, 0.188507080078125, 0.20245361328125, 0.216400146484375, 0.2303466796875, 0.244293212890625, 0.25823974609375, 0.272186279296875, 0.2861328125, 0.300079345703125, 0.31402587890625, 0.327972412109375, 0.3419189453125, 0.355865478515625, 0.36981201171875, 0.383758544921875, 0.397705078125, 0.411651611328125, 0.42559814453125, 0.439544677734375, 0.4534912109375, 0.467437744140625, 0.48138427734375, 0.495330810546875, 0.50927734375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 7.0, 2.0, 2.0, 5.0, 7.0, 10.0, 6.0, 9.0, 15.0, 9.0, 21.0, 24.0, 31.0, 29.0, 41.0, 35.0, 51.0, 47.0, 41.0, 51.0, 50.0, 48.0, 59.0, 64.0, 55.0, 52.0, 46.0, 32.0, 39.0, 14.0, 28.0, 16.0, 11.0, 14.0, 11.0, 10.0, 5.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27880859375, -0.2684898376464844, -0.25817108154296875, -0.24785232543945312, -0.2375335693359375, -0.22721481323242188, -0.21689605712890625, -0.20657730102539062, -0.196258544921875, -0.18593978881835938, -0.17562103271484375, -0.16530227661132812, -0.1549835205078125, -0.14466476440429688, -0.13434600830078125, -0.12402725219726562, -0.11370849609375, -0.10338973999023438, -0.09307098388671875, -0.08275222778320312, -0.0724334716796875, -0.062114715576171875, -0.05179595947265625, -0.041477203369140625, -0.031158447265625, -0.020839691162109375, -0.01052093505859375, -0.000202178955078125, 0.0101165771484375, 0.020435333251953125, 0.03075408935546875, 0.041072845458984375, 0.0513916015625, 0.061710357666015625, 0.07202911376953125, 0.08234786987304688, 0.0926666259765625, 0.10298538208007812, 0.11330413818359375, 0.12362289428710938, 0.133941650390625, 0.14426040649414062, 0.15457916259765625, 0.16489791870117188, 0.1752166748046875, 0.18553543090820312, 0.19585418701171875, 0.20617294311523438, 0.21649169921875, 0.22681045532226562, 0.23712921142578125, 0.24744796752929688, 0.2577667236328125, 0.2680854797363281, 0.27840423583984375, 0.2887229919433594, 0.299041748046875, 0.3093605041503906, 0.31967926025390625, 0.3299980163574219, 0.3403167724609375, 0.3506355285644531, 0.36095428466796875, 0.3712730407714844, 0.381591796875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 8.0, 4.0, 10.0, 10.0, 16.0, 36.0, 63.0, 99.0, 194.0, 334.0, 739.0, 1841.0, 5987.0, 31854.0, 274944.0, 600614.0, 111402.0, 14493.0, 3461.0, 1262.0, 562.0, 279.0, 139.0, 81.0, 39.0, 30.0, 17.0, 10.0, 8.0, 8.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.15625, -0.15169334411621094, -0.14713668823242188, -0.1425800323486328, -0.13802337646484375, -0.1334667205810547, -0.12891006469726562, -0.12435340881347656, -0.1197967529296875, -0.11524009704589844, -0.11068344116210938, -0.10612678527832031, -0.10157012939453125, -0.09701347351074219, -0.09245681762695312, -0.08790016174316406, -0.083343505859375, -0.07878684997558594, -0.07423019409179688, -0.06967353820800781, -0.06511688232421875, -0.06056022644042969, -0.056003570556640625, -0.05144691467285156, -0.0468902587890625, -0.04233360290527344, -0.037776947021484375, -0.03322029113769531, -0.02866363525390625, -0.024106979370117188, -0.019550323486328125, -0.014993667602539062, -0.01043701171875, -0.0058803558349609375, -0.001323699951171875, 0.0032329559326171875, 0.00778961181640625, 0.012346267700195312, 0.016902923583984375, 0.021459579467773438, 0.0260162353515625, 0.030572891235351562, 0.035129547119140625, 0.03968620300292969, 0.04424285888671875, 0.04879951477050781, 0.053356170654296875, 0.05791282653808594, 0.062469482421875, 0.06702613830566406, 0.07158279418945312, 0.07613945007324219, 0.08069610595703125, 0.08525276184082031, 0.08980941772460938, 0.09436607360839844, 0.0989227294921875, 0.10347938537597656, 0.10803604125976562, 0.11259269714355469, 0.11714935302734375, 0.12170600891113281, 0.12626266479492188, 0.13081932067871094, 0.1353759765625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 3.0, 11.0, 13.0, 23.0, 38.0, 74.0, 139.0, 196.0, 173.0, 135.0, 90.0, 43.0, 32.0, 17.0, 8.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019407272338867188, -0.00018336623907089233, -0.0001726597547531128, -0.00016195327043533325, -0.0001512467861175537, -0.00014054030179977417, -0.00012983381748199463, -0.00011912733316421509, -0.00010842084884643555, -9.7714364528656e-05, -8.700788021087646e-05, -7.630139589309692e-05, -6.559491157531738e-05, -5.488842725753784e-05, -4.41819429397583e-05, -3.347545862197876e-05, -2.276897430419922e-05, -1.2062489986419678e-05, -1.3560056686401367e-06, 9.350478649139404e-06, 2.0056962966918945e-05, 3.0763447284698486e-05, 4.146993160247803e-05, 5.217641592025757e-05, 6.288290023803711e-05, 7.358938455581665e-05, 8.429586887359619e-05, 9.500235319137573e-05, 0.00010570883750915527, 0.00011641532182693481, 0.00012712180614471436, 0.0001378282904624939, 0.00014853477478027344, 0.00015924125909805298, 0.00016994774341583252, 0.00018065422773361206, 0.0001913607120513916, 0.00020206719636917114, 0.00021277368068695068, 0.00022348016500473022, 0.00023418664932250977, 0.0002448931336402893, 0.00025559961795806885, 0.0002663061022758484, 0.00027701258659362793, 0.00028771907091140747, 0.000298425555229187, 0.00030913203954696655, 0.0003198385238647461, 0.00033054500818252563, 0.0003412514925003052, 0.0003519579768180847, 0.00036266446113586426, 0.0003733709454536438, 0.00038407742977142334, 0.0003947839140892029, 0.0004054903984069824, 0.00041619688272476196, 0.0004269033670425415, 0.00043760985136032104, 0.0004483163356781006, 0.0004590228199958801, 0.00046972930431365967, 0.0004804357886314392, 0.0004911422729492188]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 5.0, 5.0, 6.0, 4.0, 11.0, 23.0, 26.0, 51.0, 87.0, 171.0, 351.0, 722.0, 2108.0, 7758.0, 44707.0, 397484.0, 515370.0, 65506.0, 9868.0, 2593.0, 859.0, 404.0, 188.0, 103.0, 45.0, 28.0, 16.0, 14.0, 10.0, 9.0, 10.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.152099609375, -0.14750289916992188, -0.14290618896484375, -0.13830947875976562, -0.1337127685546875, -0.12911605834960938, -0.12451934814453125, -0.11992263793945312, -0.115325927734375, -0.11072921752929688, -0.10613250732421875, -0.10153579711914062, -0.0969390869140625, -0.09234237670898438, -0.08774566650390625, -0.08314895629882812, -0.07855224609375, -0.07395553588867188, -0.06935882568359375, -0.06476211547851562, -0.0601654052734375, -0.055568695068359375, -0.05097198486328125, -0.046375274658203125, -0.041778564453125, -0.037181854248046875, -0.03258514404296875, -0.027988433837890625, -0.0233917236328125, -0.018795013427734375, -0.01419830322265625, -0.009601593017578125, -0.0050048828125, -0.000408172607421875, 0.00418853759765625, 0.008785247802734375, 0.0133819580078125, 0.017978668212890625, 0.02257537841796875, 0.027172088623046875, 0.031768798828125, 0.036365509033203125, 0.04096221923828125, 0.045558929443359375, 0.0501556396484375, 0.054752349853515625, 0.05934906005859375, 0.06394577026367188, 0.06854248046875, 0.07313919067382812, 0.07773590087890625, 0.08233261108398438, 0.0869293212890625, 0.09152603149414062, 0.09612274169921875, 0.10071945190429688, 0.105316162109375, 0.10991287231445312, 0.11450958251953125, 0.11910629272460938, 0.1237030029296875, 0.12829971313476562, 0.13289642333984375, 0.13749313354492188, 0.14208984375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 10.0, 10.0, 14.0, 26.0, 29.0, 41.0, 71.0, 97.0, 117.0, 113.0, 121.0, 104.0, 71.0, 48.0, 37.0, 39.0, 20.0, 7.0, 8.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1005859375, -0.09651374816894531, -0.09244155883789062, -0.08836936950683594, -0.08429718017578125, -0.08022499084472656, -0.07615280151367188, -0.07208061218261719, -0.0680084228515625, -0.06393623352050781, -0.059864044189453125, -0.05579185485839844, -0.05171966552734375, -0.04764747619628906, -0.043575286865234375, -0.03950309753417969, -0.035430908203125, -0.03135871887207031, -0.027286529541015625, -0.023214340209960938, -0.01914215087890625, -0.015069961547851562, -0.010997772216796875, -0.0069255828857421875, -0.0028533935546875, 0.0012187957763671875, 0.005290985107421875, 0.009363174438476562, 0.01343536376953125, 0.017507553100585938, 0.021579742431640625, 0.025651931762695312, 0.02972412109375, 0.03379631042480469, 0.037868499755859375, 0.04194068908691406, 0.04601287841796875, 0.05008506774902344, 0.054157257080078125, 0.05822944641113281, 0.0623016357421875, 0.06637382507324219, 0.07044601440429688, 0.07451820373535156, 0.07859039306640625, 0.08266258239746094, 0.08673477172851562, 0.09080696105957031, 0.094879150390625, 0.09895133972167969, 0.10302352905273438, 0.10709571838378906, 0.11116790771484375, 0.11524009704589844, 0.11931228637695312, 0.12338447570800781, 0.1274566650390625, 0.1315288543701172, 0.13560104370117188, 0.13967323303222656, 0.14374542236328125, 0.14781761169433594, 0.15188980102539062, 0.1559619903564453, 0.1600341796875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 3.0, 9.0, 13.0, 15.0, 25.0, 48.0, 87.0, 184.0, 222.0, 194.0, 98.0, 52.0, 23.0, 15.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.639617919921875, -2.558884859085083, -2.478151798248291, -2.397418737411499, -2.316685676574707, -2.235952615737915, -2.155219554901123, -2.074486255645752, -1.9937533140182495, -1.9130202531814575, -1.8322871923446655, -1.7515541315078735, -1.670820951461792, -1.590087890625, -1.509354829788208, -1.428621768951416, -1.347888708114624, -1.267155647277832, -1.18642258644104, -1.105689525604248, -1.024956464767456, -0.9442233443260193, -0.8634902238845825, -0.7827571630477905, -0.7020241022109985, -0.6212910413742065, -0.5405579805374146, -0.4598248600959778, -0.3790917992591858, -0.2983587384223938, -0.21762564778327942, -0.13689255714416504, -0.056159257888793945, 0.02457381784915924, 0.10530689358711243, 0.1860399693250656, 0.2667730450630188, 0.3475061058998108, 0.42823919653892517, 0.5089722871780396, 0.5897053480148315, 0.6704384088516235, 0.7511714696884155, 0.8319045901298523, 0.9126376509666443, 0.9933707118034363, 1.074103832244873, 1.154836893081665, 1.235569953918457, 1.316303014755249, 1.397036075592041, 1.477769136428833, 1.558502197265625, 1.639235258102417, 1.7199684381484985, 1.8007014989852905, 1.8814345598220825, 1.9621676206588745, 2.042900800704956, 2.123633861541748, 2.20436692237854, 2.285099983215332, 2.365833044052124, 2.446566104888916, 2.527299165725708]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 3.0, 10.0, 8.0, 9.0, 20.0, 22.0, 19.0, 28.0, 38.0, 41.0, 39.0, 54.0, 48.0, 61.0, 72.0, 65.0, 75.0, 55.0, 55.0, 56.0, 48.0, 37.0, 30.0, 22.0, 18.0, 15.0, 21.0, 15.0, 11.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.3562161922454834, -2.291783332824707, -2.2273507118225098, -2.1629178524017334, -2.098484992980957, -2.0340521335601807, -1.9696193933486938, -1.905186653137207, -1.8407537937164307, -1.7763209342956543, -1.7118881940841675, -1.6474554538726807, -1.5830225944519043, -1.518589735031128, -1.4541569948196411, -1.3897242546081543, -1.325291395187378, -1.2608585357666016, -1.1964257955551147, -1.131993055343628, -1.0675601959228516, -1.0031273365020752, -0.9386945962905884, -0.8742617964744568, -0.8098289966583252, -0.7453961968421936, -0.680963397026062, -0.6165305972099304, -0.5520977973937988, -0.48766499757766724, -0.42323219776153564, -0.35879939794540405, -0.29436659812927246, -0.22993379831314087, -0.16550099849700928, -0.10106819868087769, -0.036635398864746094, 0.027797400951385498, 0.09223020076751709, 0.15666300058364868, 0.22109580039978027, 0.28552860021591187, 0.34996140003204346, 0.41439419984817505, 0.47882699966430664, 0.5432597994804382, 0.6076925992965698, 0.6721253991127014, 0.736558198928833, 0.8009909987449646, 0.8654237985610962, 0.9298565983772278, 0.9942893981933594, 1.0587222576141357, 1.1231549978256226, 1.1875877380371094, 1.2520205974578857, 1.316453456878662, 1.380886197090149, 1.4453189373016357, 1.509751796722412, 1.5741846561431885, 1.6386173963546753, 1.703050136566162, 1.7674829959869385]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 4.0, 7.0, 12.0, 24.0, 43.0, 122.0, 297.0, 786.0, 4169.0, 197155.0, 3980725.0, 8616.0, 1326.0, 487.0, 227.0, 116.0, 61.0, 30.0, 23.0, 18.0, 18.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96240234375, -0.9121170043945312, -0.8618316650390625, -0.8115463256835938, -0.761260986328125, -0.7109756469726562, -0.6606903076171875, -0.6104049682617188, -0.56011962890625, -0.5098342895507812, -0.4595489501953125, -0.40926361083984375, -0.358978271484375, -0.30869293212890625, -0.2584075927734375, -0.20812225341796875, -0.1578369140625, -0.10755157470703125, -0.0572662353515625, -0.00698089599609375, 0.043304443359375, 0.09358978271484375, 0.1438751220703125, 0.19416046142578125, 0.24444580078125, 0.29473114013671875, 0.3450164794921875, 0.39530181884765625, 0.445587158203125, 0.49587249755859375, 0.5461578369140625, 0.5964431762695312, 0.646728515625, 0.6970138549804688, 0.7472991943359375, 0.7975845336914062, 0.847869873046875, 0.8981552124023438, 0.9484405517578125, 0.9987258911132812, 1.04901123046875, 1.0992965698242188, 1.1495819091796875, 1.1998672485351562, 1.250152587890625, 1.3004379272460938, 1.3507232666015625, 1.4010086059570312, 1.4512939453125, 1.5015792846679688, 1.5518646240234375, 1.6021499633789062, 1.652435302734375, 1.7027206420898438, 1.7530059814453125, 1.8032913208007812, 1.85357666015625, 1.9038619995117188, 1.9541473388671875, 2.0044326782226562, 2.054718017578125, 2.1050033569335938, 2.1552886962890625, 2.2055740356445312, 2.255859375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 17.0, 32.0, 67.0, 105.0, 144.0, 144.0, 140.0, 138.0, 102.0, 62.0, 31.0, 18.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.180419921875, -0.1722259521484375, -0.164031982421875, -0.1558380126953125, -0.14764404296875, -0.1394500732421875, -0.131256103515625, -0.1230621337890625, -0.1148681640625, -0.1066741943359375, -0.098480224609375, -0.0902862548828125, -0.08209228515625, -0.0738983154296875, -0.065704345703125, -0.0575103759765625, -0.04931640625, -0.0411224365234375, -0.032928466796875, -0.0247344970703125, -0.01654052734375, -0.0083465576171875, -0.000152587890625, 0.0080413818359375, 0.0162353515625, 0.0244293212890625, 0.032623291015625, 0.0408172607421875, 0.04901123046875, 0.0572052001953125, 0.065399169921875, 0.0735931396484375, 0.081787109375, 0.0899810791015625, 0.098175048828125, 0.1063690185546875, 0.11456298828125, 0.1227569580078125, 0.130950927734375, 0.1391448974609375, 0.1473388671875, 0.1555328369140625, 0.163726806640625, 0.1719207763671875, 0.18011474609375, 0.1883087158203125, 0.196502685546875, 0.2046966552734375, 0.212890625, 0.2210845947265625, 0.229278564453125, 0.2374725341796875, 0.24566650390625, 0.2538604736328125, 0.262054443359375, 0.2702484130859375, 0.2784423828125, 0.2866363525390625, 0.294830322265625, 0.3030242919921875, 0.31121826171875, 0.3194122314453125, 0.327606201171875, 0.3358001708984375, 0.343994140625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 1.0, 3.0, 8.0, 11.0, 18.0, 30.0, 29.0, 37.0, 45.0, 54.0, 79.0, 130.0, 438.0, 8088.0, 4179044.0, 5613.0, 301.0, 124.0, 72.0, 44.0, 34.0, 20.0, 24.0, 16.0, 7.0, 7.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.59375, -2.516265869140625, -2.43878173828125, -2.361297607421875, -2.2838134765625, -2.206329345703125, -2.12884521484375, -2.051361083984375, -1.973876953125, -1.896392822265625, -1.81890869140625, -1.741424560546875, -1.6639404296875, -1.586456298828125, -1.50897216796875, -1.431488037109375, -1.35400390625, -1.276519775390625, -1.19903564453125, -1.121551513671875, -1.0440673828125, -0.966583251953125, -0.88909912109375, -0.811614990234375, -0.734130859375, -0.656646728515625, -0.57916259765625, -0.501678466796875, -0.4241943359375, -0.346710205078125, -0.26922607421875, -0.191741943359375, -0.1142578125, -0.036773681640625, 0.04071044921875, 0.118194580078125, 0.1956787109375, 0.273162841796875, 0.35064697265625, 0.428131103515625, 0.505615234375, 0.583099365234375, 0.66058349609375, 0.738067626953125, 0.8155517578125, 0.893035888671875, 0.97052001953125, 1.048004150390625, 1.12548828125, 1.202972412109375, 1.28045654296875, 1.357940673828125, 1.4354248046875, 1.512908935546875, 1.59039306640625, 1.667877197265625, 1.745361328125, 1.822845458984375, 1.90032958984375, 1.977813720703125, 2.0552978515625, 2.132781982421875, 2.21026611328125, 2.287750244140625, 2.365234375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 8.0, 10.0, 32.0, 159.0, 3399.0, 407.0, 46.0, 14.0, 4.0, 4.0], "bins": [-1.076171875, -1.0578393936157227, -1.0395069122314453, -1.021174430847168, -1.0028419494628906, -0.9845094680786133, -0.9661769866943359, -0.9478445053100586, -0.9295120239257812, -0.9111795425415039, -0.8928470611572266, -0.8745145797729492, -0.8561820983886719, -0.8378496170043945, -0.8195171356201172, -0.8011846542358398, -0.7828521728515625, -0.7645196914672852, -0.7461872100830078, -0.7278547286987305, -0.7095222473144531, -0.6911897659301758, -0.6728572845458984, -0.6545248031616211, -0.6361923217773438, -0.6178598403930664, -0.5995273590087891, -0.5811948776245117, -0.5628623962402344, -0.544529914855957, -0.5261974334716797, -0.5078649520874023, -0.489532470703125, -0.47119998931884766, -0.4528675079345703, -0.43453502655029297, -0.4162025451660156, -0.3978700637817383, -0.37953758239746094, -0.3612051010131836, -0.34287261962890625, -0.3245401382446289, -0.30620765686035156, -0.2878751754760742, -0.2695426940917969, -0.25121021270751953, -0.2328777313232422, -0.21454524993896484, -0.1962127685546875, -0.17788028717041016, -0.1595478057861328, -0.14121532440185547, -0.12288284301757812, -0.10455036163330078, -0.08621788024902344, -0.0678853988647461, -0.04955291748046875, -0.031220436096191406, -0.012887954711914062, 0.005444526672363281, 0.023777008056640625, 0.04210948944091797, 0.06044197082519531, 0.07877445220947266, 0.09710693359375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 30.0, 823.0, 146.0, 11.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.311243057250977, -12.036275863647461, -11.761307716369629, -11.486340522766113, -11.211372375488281, -10.936405181884766, -10.66143798828125, -10.386469841003418, -10.111502647399902, -9.836535453796387, -9.561567306518555, -9.286600112915039, -9.011631965637207, -8.736664772033691, -8.46169662475586, -8.186729431152344, -7.91176176071167, -7.636794090270996, -7.361826419830322, -7.086858749389648, -6.811891555786133, -6.536923885345459, -6.261956214904785, -5.986988544464111, -5.7120208740234375, -5.437053203582764, -5.16208553314209, -4.887118339538574, -4.6121506690979, -4.337182998657227, -4.062215328216553, -3.787247657775879, -3.512279987335205, -3.2373123168945312, -2.9623448848724365, -2.6873772144317627, -2.412409782409668, -2.137442111968994, -1.8624744415283203, -1.587506890296936, -1.3125393390655518, -1.0375717878341675, -0.7626041769981384, -0.4876365661621094, -0.2126690149307251, 0.06229853630065918, 0.337266206741333, 0.6122337579727173, 0.8872013092041016, 1.1621688604354858, 1.4371364116668701, 1.712104082107544, 1.9870716333389282, 2.2620391845703125, 2.5370068550109863, 2.81197452545166, 3.086941957473755, 3.3619096279144287, 3.6368770599365234, 3.9118447303771973, 4.186812400817871, 4.461779594421387, 4.736747741699219, 5.011714935302734, 5.286682605743408]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 7.0, 9.0, 43.0, 83.0, 171.0, 241.0, 229.0, 139.0, 58.0, 22.0, 7.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.085524082183838, -2.99118709564209, -2.8968498706817627, -2.8025128841400146, -2.7081756591796875, -2.6138386726379395, -2.5195016860961914, -2.4251644611358643, -2.330827236175537, -2.236490249633789, -2.142153024673462, -2.047816038131714, -1.9534788131713867, -1.8591418266296387, -1.764804720878601, -1.6704676151275635, -1.5761306285858154, -1.4817935228347778, -1.3874564170837402, -1.2931194305419922, -1.198782205581665, -1.104445219039917, -1.0101081132888794, -0.9157710075378418, -0.8214339017868042, -0.7270967960357666, -0.632759690284729, -0.5384226441383362, -0.4440855383872986, -0.349748432636261, -0.25541138648986816, -0.16107428073883057, -0.06673693656921387, 0.027600154280662537, 0.12193724513053894, 0.21627432107925415, 0.31061142683029175, 0.40494853258132935, 0.49928557872772217, 0.5936226844787598, 0.6879597902297974, 0.782296895980835, 0.8766340017318726, 0.9709710478782654, 1.0653080940246582, 1.1596453189849854, 1.2539823055267334, 1.348319411277771, 1.4426565170288086, 1.5369936227798462, 1.6313307285308838, 1.7256677150726318, 1.820004940032959, 1.914341926574707, 2.008678913116455, 2.1030161380767822, 2.1973533630371094, 2.2916903495788574, 2.3860275745391846, 2.4803645610809326, 2.5747017860412598, 2.669038772583008, 2.763375759124756, 2.857712984085083, 2.952049970626831]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 8.0, 5.0, 7.0, 5.0, 9.0, 13.0, 23.0, 29.0, 33.0, 40.0, 72.0, 102.0, 132.0, 192.0, 309.0, 548.0, 1069.0, 2643.0, 8909.0, 47131.0, 394717.0, 513222.0, 62248.0, 11074.0, 3083.0, 1232.0, 633.0, 378.0, 189.0, 144.0, 98.0, 59.0, 55.0, 42.0, 34.0, 23.0, 9.0, 7.0, 11.0, 4.0, 9.0, 4.0, 4.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5302734375, -0.5137405395507812, -0.4972076416015625, -0.48067474365234375, -0.464141845703125, -0.44760894775390625, -0.4310760498046875, -0.41454315185546875, -0.39801025390625, -0.38147735595703125, -0.3649444580078125, -0.34841156005859375, -0.331878662109375, -0.31534576416015625, -0.2988128662109375, -0.28227996826171875, -0.2657470703125, -0.24921417236328125, -0.2326812744140625, -0.21614837646484375, -0.199615478515625, -0.18308258056640625, -0.1665496826171875, -0.15001678466796875, -0.13348388671875, -0.11695098876953125, -0.1004180908203125, -0.08388519287109375, -0.067352294921875, -0.05081939697265625, -0.0342864990234375, -0.01775360107421875, -0.001220703125, 0.01531219482421875, 0.0318450927734375, 0.04837799072265625, 0.064910888671875, 0.08144378662109375, 0.0979766845703125, 0.11450958251953125, 0.13104248046875, 0.14757537841796875, 0.1641082763671875, 0.18064117431640625, 0.197174072265625, 0.21370697021484375, 0.2302398681640625, 0.24677276611328125, 0.2633056640625, 0.27983856201171875, 0.2963714599609375, 0.31290435791015625, 0.329437255859375, 0.34597015380859375, 0.3625030517578125, 0.37903594970703125, 0.39556884765625, 0.41210174560546875, 0.4286346435546875, 0.44516754150390625, 0.461700439453125, 0.47823333740234375, 0.4947662353515625, 0.5112991333007812, 0.52783203125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 12.0, 13.0, 24.0, 51.0, 80.0, 75.0, 120.0, 114.0, 138.0, 121.0, 98.0, 79.0, 34.0, 24.0, 13.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1778564453125, -0.17172622680664062, -0.16559600830078125, -0.15946578979492188, -0.1533355712890625, -0.14720535278320312, -0.14107513427734375, -0.13494491577148438, -0.128814697265625, -0.12268447875976562, -0.11655426025390625, -0.11042404174804688, -0.1042938232421875, -0.09816360473632812, -0.09203338623046875, -0.08590316772460938, -0.07977294921875, -0.07364273071289062, -0.06751251220703125, -0.061382293701171875, -0.0552520751953125, -0.049121856689453125, -0.04299163818359375, -0.036861419677734375, -0.030731201171875, -0.024600982666015625, -0.01847076416015625, -0.012340545654296875, -0.0062103271484375, -8.0108642578125e-05, 0.00605010986328125, 0.012180328369140625, 0.018310546875, 0.024440765380859375, 0.03057098388671875, 0.036701202392578125, 0.0428314208984375, 0.048961639404296875, 0.05509185791015625, 0.061222076416015625, 0.067352294921875, 0.07348251342773438, 0.07961273193359375, 0.08574295043945312, 0.0918731689453125, 0.09800338745117188, 0.10413360595703125, 0.11026382446289062, 0.11639404296875, 0.12252426147460938, 0.12865447998046875, 0.13478469848632812, 0.1409149169921875, 0.14704513549804688, 0.15317535400390625, 0.15930557250976562, 0.165435791015625, 0.17156600952148438, 0.17769622802734375, 0.18382644653320312, 0.1899566650390625, 0.19608688354492188, 0.20221710205078125, 0.20834732055664062, 0.2144775390625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 3.0, 5.0, 7.0, 13.0, 18.0, 12.0, 22.0, 30.0, 48.0, 64.0, 78.0, 124.0, 185.0, 337.0, 536.0, 995.0, 2011.0, 4528.0, 11690.0, 33327.0, 114192.0, 420331.0, 332558.0, 84531.0, 25815.0, 9425.0, 3823.0, 1651.0, 861.0, 477.0, 291.0, 179.0, 109.0, 90.0, 55.0, 30.0, 33.0, 16.0, 13.0, 14.0, 8.0, 10.0, 1.0, 4.0, 7.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.258544921875, -0.2506828308105469, -0.24282073974609375, -0.23495864868164062, -0.2270965576171875, -0.21923446655273438, -0.21137237548828125, -0.20351028442382812, -0.195648193359375, -0.18778610229492188, -0.17992401123046875, -0.17206192016601562, -0.1641998291015625, -0.15633773803710938, -0.14847564697265625, -0.14061355590820312, -0.13275146484375, -0.12488937377929688, -0.11702728271484375, -0.10916519165039062, -0.1013031005859375, -0.09344100952148438, -0.08557891845703125, -0.07771682739257812, -0.069854736328125, -0.061992645263671875, -0.05413055419921875, -0.046268463134765625, -0.0384063720703125, -0.030544281005859375, -0.02268218994140625, -0.014820098876953125, -0.0069580078125, 0.000904083251953125, 0.00876617431640625, 0.016628265380859375, 0.0244903564453125, 0.032352447509765625, 0.04021453857421875, 0.048076629638671875, 0.055938720703125, 0.06380081176757812, 0.07166290283203125, 0.07952499389648438, 0.0873870849609375, 0.09524917602539062, 0.10311126708984375, 0.11097335815429688, 0.11883544921875, 0.12669754028320312, 0.13455963134765625, 0.14242172241210938, 0.1502838134765625, 0.15814590454101562, 0.16600799560546875, 0.17387008666992188, 0.181732177734375, 0.18959426879882812, 0.19745635986328125, 0.20531845092773438, 0.2131805419921875, 0.22104263305664062, 0.22890472412109375, 0.23676681518554688, 0.24462890625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 7.0, 4.0, 6.0, 8.0, 6.0, 6.0, 15.0, 14.0, 17.0, 21.0, 15.0, 29.0, 32.0, 27.0, 41.0, 45.0, 43.0, 33.0, 61.0, 50.0, 44.0, 35.0, 55.0, 42.0, 42.0, 36.0, 30.0, 29.0, 28.0, 30.0, 24.0, 22.0, 17.0, 21.0, 20.0, 7.0, 13.0, 8.0, 5.0, 6.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.306396484375, -0.2976531982421875, -0.288909912109375, -0.2801666259765625, -0.27142333984375, -0.2626800537109375, -0.253936767578125, -0.2451934814453125, -0.2364501953125, -0.2277069091796875, -0.218963623046875, -0.2102203369140625, -0.20147705078125, -0.1927337646484375, -0.183990478515625, -0.1752471923828125, -0.16650390625, -0.1577606201171875, -0.149017333984375, -0.1402740478515625, -0.13153076171875, -0.1227874755859375, -0.114044189453125, -0.1053009033203125, -0.0965576171875, -0.0878143310546875, -0.079071044921875, -0.0703277587890625, -0.06158447265625, -0.0528411865234375, -0.044097900390625, -0.0353546142578125, -0.026611328125, -0.0178680419921875, -0.009124755859375, -0.0003814697265625, 0.00836181640625, 0.0171051025390625, 0.025848388671875, 0.0345916748046875, 0.0433349609375, 0.0520782470703125, 0.060821533203125, 0.0695648193359375, 0.07830810546875, 0.0870513916015625, 0.095794677734375, 0.1045379638671875, 0.11328125, 0.1220245361328125, 0.130767822265625, 0.1395111083984375, 0.14825439453125, 0.1569976806640625, 0.165740966796875, 0.1744842529296875, 0.1832275390625, 0.1919708251953125, 0.200714111328125, 0.2094573974609375, 0.21820068359375, 0.2269439697265625, 0.235687255859375, 0.2444305419921875, 0.253173828125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 10.0, 7.0, 13.0, 20.0, 32.0, 81.0, 131.0, 327.0, 906.0, 3290.0, 23366.0, 405674.0, 572100.0, 36529.0, 4228.0, 1107.0, 398.0, 162.0, 79.0, 36.0, 19.0, 20.0, 6.0, 9.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.259521484375, -0.2537651062011719, -0.24800872802734375, -0.24225234985351562, -0.2364959716796875, -0.23073959350585938, -0.22498321533203125, -0.21922683715820312, -0.213470458984375, -0.20771408081054688, -0.20195770263671875, -0.19620132446289062, -0.1904449462890625, -0.18468856811523438, -0.17893218994140625, -0.17317581176757812, -0.16741943359375, -0.16166305541992188, -0.15590667724609375, -0.15015029907226562, -0.1443939208984375, -0.13863754272460938, -0.13288116455078125, -0.12712478637695312, -0.121368408203125, -0.11561203002929688, -0.10985565185546875, -0.10409927368164062, -0.0983428955078125, -0.09258651733398438, -0.08683013916015625, -0.08107376098632812, -0.0753173828125, -0.06956100463867188, -0.06380462646484375, -0.058048248291015625, -0.0522918701171875, -0.046535491943359375, -0.04077911376953125, -0.035022735595703125, -0.029266357421875, -0.023509979248046875, -0.01775360107421875, -0.011997222900390625, -0.0062408447265625, -0.000484466552734375, 0.00527191162109375, 0.011028289794921875, 0.01678466796875, 0.022541046142578125, 0.02829742431640625, 0.034053802490234375, 0.0398101806640625, 0.045566558837890625, 0.05132293701171875, 0.057079315185546875, 0.062835693359375, 0.06859207153320312, 0.07434844970703125, 0.08010482788085938, 0.0858612060546875, 0.09161758422851562, 0.09737396240234375, 0.10313034057617188, 0.10888671875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 3.0, 5.0, 9.0, 15.0, 13.0, 18.0, 27.0, 36.0, 34.0, 49.0, 85.0, 93.0, 102.0, 101.0, 98.0, 81.0, 51.0, 57.0, 30.0, 36.0, 16.0, 13.0, 12.0, 11.0, 6.0, 3.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00022554397583007812, -0.0002199411392211914, -0.0002143383026123047, -0.00020873546600341797, -0.00020313262939453125, -0.00019752979278564453, -0.0001919269561767578, -0.0001863241195678711, -0.00018072128295898438, -0.00017511844635009766, -0.00016951560974121094, -0.00016391277313232422, -0.0001583099365234375, -0.00015270709991455078, -0.00014710426330566406, -0.00014150142669677734, -0.00013589859008789062, -0.0001302957534790039, -0.0001246929168701172, -0.00011909008026123047, -0.00011348724365234375, -0.00010788440704345703, -0.00010228157043457031, -9.66787338256836e-05, -9.107589721679688e-05, -8.547306060791016e-05, -7.987022399902344e-05, -7.426738739013672e-05, -6.866455078125e-05, -6.306171417236328e-05, -5.745887756347656e-05, -5.1856040954589844e-05, -4.6253204345703125e-05, -4.0650367736816406e-05, -3.504753112792969e-05, -2.944469451904297e-05, -2.384185791015625e-05, -1.823902130126953e-05, -1.2636184692382812e-05, -7.033348083496094e-06, -1.430511474609375e-06, 4.172325134277344e-06, 9.775161743164062e-06, 1.537799835205078e-05, 2.09808349609375e-05, 2.658367156982422e-05, 3.218650817871094e-05, 3.7789344787597656e-05, 4.3392181396484375e-05, 4.8995018005371094e-05, 5.459785461425781e-05, 6.020069122314453e-05, 6.580352783203125e-05, 7.140636444091797e-05, 7.700920104980469e-05, 8.26120376586914e-05, 8.821487426757812e-05, 9.381771087646484e-05, 9.942054748535156e-05, 0.00010502338409423828, 0.000110626220703125, 0.00011622905731201172, 0.00012183189392089844, 0.00012743473052978516, 0.00013303756713867188]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 5.0, 11.0, 9.0, 18.0, 36.0, 76.0, 157.0, 334.0, 831.0, 2467.0, 11892.0, 145975.0, 752602.0, 119803.0, 10574.0, 2339.0, 826.0, 290.0, 130.0, 73.0, 46.0, 17.0, 13.0, 6.0, 8.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.19482421875, -0.1894817352294922, -0.18413925170898438, -0.17879676818847656, -0.17345428466796875, -0.16811180114746094, -0.16276931762695312, -0.1574268341064453, -0.1520843505859375, -0.1467418670654297, -0.14139938354492188, -0.13605690002441406, -0.13071441650390625, -0.12537193298339844, -0.12002944946289062, -0.11468696594238281, -0.109344482421875, -0.10400199890136719, -0.09865951538085938, -0.09331703186035156, -0.08797454833984375, -0.08263206481933594, -0.07728958129882812, -0.07194709777832031, -0.0666046142578125, -0.06126213073730469, -0.055919647216796875, -0.05057716369628906, -0.04523468017578125, -0.03989219665527344, -0.034549713134765625, -0.029207229614257812, -0.02386474609375, -0.018522262573242188, -0.013179779052734375, -0.007837295532226562, -0.00249481201171875, 0.0028476715087890625, 0.008190155029296875, 0.013532638549804688, 0.0188751220703125, 0.024217605590820312, 0.029560089111328125, 0.03490257263183594, 0.04024505615234375, 0.04558753967285156, 0.050930023193359375, 0.05627250671386719, 0.061614990234375, 0.06695747375488281, 0.07229995727539062, 0.07764244079589844, 0.08298492431640625, 0.08832740783691406, 0.09366989135742188, 0.09901237487792969, 0.1043548583984375, 0.10969734191894531, 0.11503982543945312, 0.12038230895996094, 0.12572479248046875, 0.13106727600097656, 0.13640975952148438, 0.1417522430419922, 0.1470947265625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 4.0, 8.0, 8.0, 16.0, 23.0, 44.0, 48.0, 78.0, 94.0, 108.0, 137.0, 107.0, 78.0, 82.0, 57.0, 38.0, 18.0, 22.0, 12.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0], "bins": [-0.1376953125, -0.1342153549194336, -0.1307353973388672, -0.12725543975830078, -0.12377548217773438, -0.12029552459716797, -0.11681556701660156, -0.11333560943603516, -0.10985565185546875, -0.10637569427490234, -0.10289573669433594, -0.09941577911376953, -0.09593582153320312, -0.09245586395263672, -0.08897590637207031, -0.0854959487915039, -0.0820159912109375, -0.0785360336303711, -0.07505607604980469, -0.07157611846923828, -0.06809616088867188, -0.06461620330810547, -0.06113624572753906, -0.057656288146972656, -0.05417633056640625, -0.050696372985839844, -0.04721641540527344, -0.04373645782470703, -0.040256500244140625, -0.03677654266357422, -0.03329658508300781, -0.029816627502441406, -0.026336669921875, -0.022856712341308594, -0.019376754760742188, -0.01589679718017578, -0.012416839599609375, -0.008936882019042969, -0.0054569244384765625, -0.0019769668579101562, 0.00150299072265625, 0.004982948303222656, 0.008462905883789062, 0.011942863464355469, 0.015422821044921875, 0.01890277862548828, 0.022382736206054688, 0.025862693786621094, 0.0293426513671875, 0.032822608947753906, 0.03630256652832031, 0.03978252410888672, 0.043262481689453125, 0.04674243927001953, 0.05022239685058594, 0.053702354431152344, 0.05718231201171875, 0.060662269592285156, 0.06414222717285156, 0.06762218475341797, 0.07110214233398438, 0.07458209991455078, 0.07806205749511719, 0.0815420150756836, 0.08502197265625]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 8.0, 18.0, 41.0, 96.0, 224.0, 334.0, 181.0, 59.0, 19.0, 12.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9431120157241821, -1.8247101306915283, -1.7063082456588745, -1.5879063606262207, -1.469504475593567, -1.351102590560913, -1.2327005863189697, -1.1142988204956055, -0.9958968758583069, -0.8774949908256531, -0.7590931057929993, -0.6406911611557007, -0.5222892761230469, -0.40388739109039307, -0.28548550605773926, -0.16708362102508545, -0.04868173599243164, 0.06972015649080276, 0.18812204897403717, 0.3065239489078522, 0.424925833940506, 0.5433277487754822, 0.661729633808136, 0.7801315188407898, 0.8985334038734436, 1.0169353485107422, 1.135337233543396, 1.2537391185760498, 1.3721410036087036, 1.4905428886413574, 1.6089447736740112, 1.727346658706665, 1.8457486629486084, 1.9641505479812622, 2.082552433013916, 2.2009544372558594, 2.3193562030792236, 2.437758207321167, 2.5561599731445312, 2.6745619773864746, 2.792963743209839, 2.9113657474517822, 3.0297675132751465, 3.14816951751709, 3.266571283340454, 3.3849732875823975, 3.5033750534057617, 3.621777057647705, 3.7401790618896484, 3.858581066131592, 3.976982831954956, 4.09538459777832, 4.213786602020264, 4.332188606262207, 4.45059061050415, 4.5689921379089355, 4.687394142150879, 4.805796146392822, 4.924198150634766, 5.042599678039551, 5.161001682281494, 5.2794036865234375, 5.397805690765381, 5.516207218170166, 5.634609222412109]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 4.0, 3.0, 4.0, 3.0, 4.0, 7.0, 8.0, 10.0, 11.0, 11.0, 17.0, 10.0, 24.0, 15.0, 26.0, 31.0, 31.0, 26.0, 38.0, 38.0, 42.0, 45.0, 62.0, 42.0, 42.0, 42.0, 50.0, 38.0, 29.0, 38.0, 30.0, 33.0, 23.0, 30.0, 23.0, 15.0, 16.0, 10.0, 17.0, 15.0, 11.0, 5.0, 5.0, 8.0, 4.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-1.556401014328003, -1.510414481163025, -1.4644279479980469, -1.4184414148330688, -1.3724548816680908, -1.3264684677124023, -1.2804818153381348, -1.2344954013824463, -1.1885088682174683, -1.1425223350524902, -1.0965358018875122, -1.0505492687225342, -1.0045627355575562, -0.9585762619972229, -0.9125897288322449, -0.8666032552719116, -0.8206166625022888, -0.7746301293373108, -0.7286435961723328, -0.6826571226119995, -0.6366705894470215, -0.5906840562820435, -0.5446975231170654, -0.4987110197544098, -0.45272448658943176, -0.40673795342445374, -0.3607514500617981, -0.31476491689682007, -0.26877838373184204, -0.2227918803691864, -0.17680534720420837, -0.13081884384155273, -0.08483231067657471, -0.038845788687467575, 0.007140733301639557, 0.05312725901603699, 0.09911377727985382, 0.14510029554367065, 0.19108682870864868, 0.23707333207130432, 0.28305986523628235, 0.3290463984012604, 0.375032901763916, 0.42101943492889404, 0.46700596809387207, 0.5129925012588501, 0.5589790344238281, 0.6049655079841614, 0.6509520411491394, 0.6969385743141174, 0.7429251074790955, 0.7889115810394287, 0.8348981142044067, 0.8808846473693848, 0.9268711805343628, 0.9728577136993408, 1.0188442468643188, 1.0648307800292969, 1.110817313194275, 1.156803846359253, 1.202790379524231, 1.248776912689209, 1.2947633266448975, 1.3407498598098755, 1.3867363929748535]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 7.0, 9.0, 18.0, 34.0, 57.0, 125.0, 335.0, 1072.0, 8690.0, 4060158.0, 119018.0, 3427.0, 786.0, 272.0, 130.0, 67.0, 40.0, 16.0, 10.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4189453125, -1.3639678955078125, -1.308990478515625, -1.2540130615234375, -1.19903564453125, -1.1440582275390625, -1.089080810546875, -1.0341033935546875, -0.9791259765625, -0.9241485595703125, -0.869171142578125, -0.8141937255859375, -0.75921630859375, -0.7042388916015625, -0.649261474609375, -0.5942840576171875, -0.539306640625, -0.4843292236328125, -0.429351806640625, -0.3743743896484375, -0.31939697265625, -0.2644195556640625, -0.209442138671875, -0.1544647216796875, -0.0994873046875, -0.0445098876953125, 0.010467529296875, 0.0654449462890625, 0.12042236328125, 0.1753997802734375, 0.230377197265625, 0.2853546142578125, 0.34033203125, 0.3953094482421875, 0.450286865234375, 0.5052642822265625, 0.56024169921875, 0.6152191162109375, 0.670196533203125, 0.7251739501953125, 0.7801513671875, 0.8351287841796875, 0.890106201171875, 0.9450836181640625, 1.00006103515625, 1.0550384521484375, 1.110015869140625, 1.1649932861328125, 1.219970703125, 1.2749481201171875, 1.329925537109375, 1.3849029541015625, 1.43988037109375, 1.4948577880859375, 1.549835205078125, 1.6048126220703125, 1.6597900390625, 1.7147674560546875, 1.769744873046875, 1.8247222900390625, 1.87969970703125, 1.9346771240234375, 1.989654541015625, 2.0446319580078125, 2.099609375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 18.0, 16.0, 35.0, 51.0, 76.0, 97.0, 111.0, 124.0, 107.0, 118.0, 92.0, 56.0, 42.0, 32.0, 13.0, 8.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.177978515625, -0.17180252075195312, -0.16562652587890625, -0.15945053100585938, -0.1532745361328125, -0.14709854125976562, -0.14092254638671875, -0.13474655151367188, -0.128570556640625, -0.12239456176757812, -0.11621856689453125, -0.11004257202148438, -0.1038665771484375, -0.09769058227539062, -0.09151458740234375, -0.08533859252929688, -0.07916259765625, -0.07298660278320312, -0.06681060791015625, -0.060634613037109375, -0.0544586181640625, -0.048282623291015625, -0.04210662841796875, -0.035930633544921875, -0.029754638671875, -0.023578643798828125, -0.01740264892578125, -0.011226654052734375, -0.0050506591796875, 0.001125335693359375, 0.00730133056640625, 0.013477325439453125, 0.0196533203125, 0.025829315185546875, 0.03200531005859375, 0.038181304931640625, 0.0443572998046875, 0.050533294677734375, 0.05670928955078125, 0.06288528442382812, 0.069061279296875, 0.07523727416992188, 0.08141326904296875, 0.08758926391601562, 0.0937652587890625, 0.09994125366210938, 0.10611724853515625, 0.11229324340820312, 0.11846923828125, 0.12464523315429688, 0.13082122802734375, 0.13699722290039062, 0.1431732177734375, 0.14934921264648438, 0.15552520751953125, 0.16170120239257812, 0.167877197265625, 0.17405319213867188, 0.18022918701171875, 0.18640518188476562, 0.1925811767578125, 0.19875717163085938, 0.20493316650390625, 0.21110916137695312, 0.21728515625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 6.0, 3.0, 6.0, 10.0, 27.0, 50.0, 81.0, 135.0, 261.0, 468.0, 999.0, 2248.0, 6915.0, 56262.0, 3847918.0, 259021.0, 14336.0, 3141.0, 1184.0, 549.0, 287.0, 148.0, 104.0, 55.0, 24.0, 21.0, 7.0, 8.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52685546875, -0.509124755859375, -0.49139404296875, -0.473663330078125, -0.4559326171875, -0.438201904296875, -0.42047119140625, -0.402740478515625, -0.385009765625, -0.367279052734375, -0.34954833984375, -0.331817626953125, -0.3140869140625, -0.296356201171875, -0.27862548828125, -0.260894775390625, -0.2431640625, -0.225433349609375, -0.20770263671875, -0.189971923828125, -0.1722412109375, -0.154510498046875, -0.13677978515625, -0.119049072265625, -0.101318359375, -0.083587646484375, -0.06585693359375, -0.048126220703125, -0.0303955078125, -0.012664794921875, 0.00506591796875, 0.022796630859375, 0.04052734375, 0.058258056640625, 0.07598876953125, 0.093719482421875, 0.1114501953125, 0.129180908203125, 0.14691162109375, 0.164642333984375, 0.182373046875, 0.200103759765625, 0.21783447265625, 0.235565185546875, 0.2532958984375, 0.271026611328125, 0.28875732421875, 0.306488037109375, 0.32421875, 0.341949462890625, 0.35968017578125, 0.377410888671875, 0.3951416015625, 0.412872314453125, 0.43060302734375, 0.448333740234375, 0.466064453125, 0.483795166015625, 0.50152587890625, 0.519256591796875, 0.5369873046875, 0.554718017578125, 0.57244873046875, 0.590179443359375, 0.60791015625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 4.0, 0.0, 4.0, 7.0, 6.0, 11.0, 19.0, 14.0, 55.0, 105.0, 340.0, 2152.0, 944.0, 228.0, 93.0, 42.0, 20.0, 10.0, 9.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.232666015625, -0.22510910034179688, -0.21755218505859375, -0.20999526977539062, -0.2024383544921875, -0.19488143920898438, -0.18732452392578125, -0.17976760864257812, -0.172210693359375, -0.16465377807617188, -0.15709686279296875, -0.14953994750976562, -0.1419830322265625, -0.13442611694335938, -0.12686920166015625, -0.11931228637695312, -0.11175537109375, -0.10419845581054688, -0.09664154052734375, -0.08908462524414062, -0.0815277099609375, -0.07397079467773438, -0.06641387939453125, -0.058856964111328125, -0.051300048828125, -0.043743133544921875, -0.03618621826171875, -0.028629302978515625, -0.0210723876953125, -0.013515472412109375, -0.00595855712890625, 0.001598358154296875, 0.0091552734375, 0.016712188720703125, 0.02426910400390625, 0.031826019287109375, 0.0393829345703125, 0.046939849853515625, 0.05449676513671875, 0.062053680419921875, 0.069610595703125, 0.07716751098632812, 0.08472442626953125, 0.09228134155273438, 0.0998382568359375, 0.10739517211914062, 0.11495208740234375, 0.12250900268554688, 0.13006591796875, 0.13762283325195312, 0.14517974853515625, 0.15273666381835938, 0.1602935791015625, 0.16785049438476562, 0.17540740966796875, 0.18296432495117188, 0.190521240234375, 0.19807815551757812, 0.20563507080078125, 0.21319198608398438, 0.2207489013671875, 0.22830581665039062, 0.23586273193359375, 0.24341964721679688, 0.2509765625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 23.0, 72.0, 290.0, 405.0, 138.0, 43.0, 16.0, 9.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.630551338195801, -3.556957960128784, -3.4833643436431885, -3.409770965576172, -3.336177349090576, -3.2625839710235596, -3.188990354537964, -3.1153969764709473, -3.0418033599853516, -2.968209981918335, -2.8946163654327393, -2.8210229873657227, -2.747429370880127, -2.6738359928131104, -2.6002423763275146, -2.526648998260498, -2.4530556201934814, -2.379462242126465, -2.305868625640869, -2.2322752475738525, -2.158681631088257, -2.0850882530212402, -2.0114946365356445, -1.937901258468628, -1.8643077611923218, -1.7907142639160156, -1.7171207666397095, -1.6435272693634033, -1.5699338912963867, -1.496340274810791, -1.4227468967437744, -1.3491533994674683, -1.275559902191162, -1.201966404914856, -1.1283729076385498, -1.0547794103622437, -0.9811859726905823, -0.9075924754142761, -0.8339990377426147, -0.7604055404663086, -0.6868120431900024, -0.6132185459136963, -0.5396250486373901, -0.46603161096572876, -0.3924381136894226, -0.31884461641311646, -0.2452511489391327, -0.17165768146514893, -0.09806418418884277, -0.024470701813697815, 0.049122780561447144, 0.1227162629365921, 0.19630974531173706, 0.2699032425880432, 0.343496710062027, 0.41709017753601074, 0.4906836748123169, 0.564277172088623, 0.6378706693649292, 0.7114641070365906, 0.7850576043128967, 0.8586511015892029, 0.9322445392608643, 1.0058380365371704, 1.0794315338134766]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 5.0, 5.0, 8.0, 15.0, 13.0, 17.0, 31.0, 31.0, 45.0, 49.0, 79.0, 85.0, 62.0, 65.0, 66.0, 67.0, 76.0, 54.0, 48.0, 66.0, 29.0, 28.0, 17.0, 15.0, 13.0, 10.0, 6.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9534122943878174, -0.9284040331840515, -0.9033958315849304, -0.8783875703811646, -0.8533793091773987, -0.8283711075782776, -0.8033628463745117, -0.7783546447753906, -0.7533463835716248, -0.7283381223678589, -0.7033299207687378, -0.6783216595649719, -0.653313398361206, -0.628305196762085, -0.6032969355583191, -0.5782886743545532, -0.5532804727554321, -0.5282722115516663, -0.5032640099525452, -0.4782557487487793, -0.4532475173473358, -0.42823928594589233, -0.40323102474212646, -0.378222793340683, -0.3532145023345947, -0.32820627093315125, -0.3031980097293854, -0.2781897783279419, -0.2531815469264984, -0.22817330062389374, -0.20316505432128906, -0.17815682291984558, -0.1531485915184021, -0.12814034521579742, -0.10313211381435394, -0.07812386751174927, -0.05311562865972519, -0.02810738980770111, -0.0030991435050964355, 0.021909087896347046, 0.04691733419895172, 0.0719255730509758, 0.09693381190299988, 0.12194205820560455, 0.14695030450820923, 0.1719585359096527, 0.19696678221225739, 0.22197501361370087, 0.24698325991630554, 0.271991491317749, 0.2969997525215149, 0.3220079839229584, 0.34701621532440186, 0.3720244765281677, 0.3970327079296112, 0.4220409393310547, 0.44704920053482056, 0.47205743193626404, 0.4970656931400299, 0.5220739245414734, 0.5470821857452393, 0.5720903873443604, 0.5970986485481262, 0.6221069097518921, 0.6471151113510132]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 6.0, 2.0, 7.0, 8.0, 17.0, 18.0, 33.0, 63.0, 105.0, 168.0, 423.0, 912.0, 2801.0, 13719.0, 295931.0, 703448.0, 24882.0, 3812.0, 1173.0, 498.0, 215.0, 141.0, 57.0, 39.0, 33.0, 11.0, 7.0, 10.0, 4.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.869140625, -0.8402938842773438, -0.8114471435546875, -0.7826004028320312, -0.753753662109375, -0.7249069213867188, -0.6960601806640625, -0.6672134399414062, -0.63836669921875, -0.6095199584960938, -0.5806732177734375, -0.5518264770507812, -0.522979736328125, -0.49413299560546875, -0.4652862548828125, -0.43643951416015625, -0.4075927734375, -0.37874603271484375, -0.3498992919921875, -0.32105255126953125, -0.292205810546875, -0.26335906982421875, -0.2345123291015625, -0.20566558837890625, -0.17681884765625, -0.14797210693359375, -0.1191253662109375, -0.09027862548828125, -0.061431884765625, -0.03258514404296875, -0.0037384033203125, 0.02510833740234375, 0.053955078125, 0.08280181884765625, 0.1116485595703125, 0.14049530029296875, 0.169342041015625, 0.19818878173828125, 0.2270355224609375, 0.25588226318359375, 0.28472900390625, 0.31357574462890625, 0.3424224853515625, 0.37126922607421875, 0.400115966796875, 0.42896270751953125, 0.4578094482421875, 0.48665618896484375, 0.5155029296875, 0.5443496704101562, 0.5731964111328125, 0.6020431518554688, 0.630889892578125, 0.6597366333007812, 0.6885833740234375, 0.7174301147460938, 0.74627685546875, 0.7751235961914062, 0.8039703369140625, 0.8328170776367188, 0.861663818359375, 0.8905105590820312, 0.9193572998046875, 0.9482040405273438, 0.97705078125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 11.0, 12.0, 14.0, 32.0, 47.0, 70.0, 87.0, 99.0, 94.0, 116.0, 110.0, 99.0, 70.0, 52.0, 36.0, 29.0, 9.0, 10.0, 3.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1767578125, -0.1710987091064453, -0.16543960571289062, -0.15978050231933594, -0.15412139892578125, -0.14846229553222656, -0.14280319213867188, -0.1371440887451172, -0.1314849853515625, -0.1258258819580078, -0.12016677856445312, -0.11450767517089844, -0.10884857177734375, -0.10318946838378906, -0.09753036499023438, -0.09187126159667969, -0.086212158203125, -0.08055305480957031, -0.07489395141601562, -0.06923484802246094, -0.06357574462890625, -0.05791664123535156, -0.052257537841796875, -0.04659843444824219, -0.0409393310546875, -0.03528022766113281, -0.029621124267578125, -0.023962020874023438, -0.01830291748046875, -0.012643814086914062, -0.006984710693359375, -0.0013256072998046875, 0.00433349609375, 0.009992599487304688, 0.015651702880859375, 0.021310806274414062, 0.02696990966796875, 0.03262901306152344, 0.038288116455078125, 0.04394721984863281, 0.0496063232421875, 0.05526542663574219, 0.060924530029296875, 0.06658363342285156, 0.07224273681640625, 0.07790184020996094, 0.08356094360351562, 0.08922004699707031, 0.094879150390625, 0.10053825378417969, 0.10619735717773438, 0.11185646057128906, 0.11751556396484375, 0.12317466735839844, 0.12883377075195312, 0.1344928741455078, 0.1401519775390625, 0.1458110809326172, 0.15147018432617188, 0.15712928771972656, 0.16278839111328125, 0.16844749450683594, 0.17410659790039062, 0.1797657012939453, 0.1854248046875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 7.0, 3.0, 5.0, 5.0, 12.0, 2.0, 15.0, 15.0, 18.0, 28.0, 45.0, 67.0, 108.0, 156.0, 293.0, 646.0, 1677.0, 5105.0, 20999.0, 158455.0, 730310.0, 107785.0, 16109.0, 4136.0, 1306.0, 525.0, 285.0, 165.0, 93.0, 53.0, 39.0, 23.0, 14.0, 9.0, 8.0, 11.0, 4.0, 4.0, 5.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.486572265625, -0.4728355407714844, -0.45909881591796875, -0.4453620910644531, -0.4316253662109375, -0.4178886413574219, -0.40415191650390625, -0.3904151916503906, -0.376678466796875, -0.3629417419433594, -0.34920501708984375, -0.3354682922363281, -0.3217315673828125, -0.3079948425292969, -0.29425811767578125, -0.2805213928222656, -0.26678466796875, -0.2530479431152344, -0.23931121826171875, -0.22557449340820312, -0.2118377685546875, -0.19810104370117188, -0.18436431884765625, -0.17062759399414062, -0.156890869140625, -0.14315414428710938, -0.12941741943359375, -0.11568069458007812, -0.1019439697265625, -0.08820724487304688, -0.07447052001953125, -0.060733795166015625, -0.0469970703125, -0.033260345458984375, -0.01952362060546875, -0.005786895751953125, 0.0079498291015625, 0.021686553955078125, 0.03542327880859375, 0.049160003662109375, 0.062896728515625, 0.07663345336914062, 0.09037017822265625, 0.10410690307617188, 0.1178436279296875, 0.13158035278320312, 0.14531707763671875, 0.15905380249023438, 0.17279052734375, 0.18652725219726562, 0.20026397705078125, 0.21400070190429688, 0.2277374267578125, 0.24147415161132812, 0.25521087646484375, 0.2689476013183594, 0.282684326171875, 0.2964210510253906, 0.31015777587890625, 0.3238945007324219, 0.3376312255859375, 0.3513679504394531, 0.36510467529296875, 0.3788414001464844, 0.392578125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 3.0, 8.0, 11.0, 4.0, 10.0, 15.0, 13.0, 6.0, 25.0, 19.0, 19.0, 37.0, 44.0, 36.0, 46.0, 43.0, 46.0, 59.0, 43.0, 58.0, 45.0, 49.0, 39.0, 50.0, 40.0, 40.0, 24.0, 23.0, 28.0, 19.0, 23.0, 18.0, 8.0, 8.0, 7.0, 9.0, 5.0, 6.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.32275390625, -0.31243896484375, -0.3021240234375, -0.29180908203125, -0.281494140625, -0.27117919921875, -0.2608642578125, -0.25054931640625, -0.240234375, -0.22991943359375, -0.2196044921875, -0.20928955078125, -0.198974609375, -0.18865966796875, -0.1783447265625, -0.16802978515625, -0.15771484375, -0.14739990234375, -0.1370849609375, -0.12677001953125, -0.116455078125, -0.10614013671875, -0.0958251953125, -0.08551025390625, -0.0751953125, -0.06488037109375, -0.0545654296875, -0.04425048828125, -0.033935546875, -0.02362060546875, -0.0133056640625, -0.00299072265625, 0.00732421875, 0.01763916015625, 0.0279541015625, 0.03826904296875, 0.048583984375, 0.05889892578125, 0.0692138671875, 0.07952880859375, 0.08984375, 0.10015869140625, 0.1104736328125, 0.12078857421875, 0.131103515625, 0.14141845703125, 0.1517333984375, 0.16204833984375, 0.17236328125, 0.18267822265625, 0.1929931640625, 0.20330810546875, 0.213623046875, 0.22393798828125, 0.2342529296875, 0.24456787109375, 0.2548828125, 0.26519775390625, 0.2755126953125, 0.28582763671875, 0.296142578125, 0.30645751953125, 0.3167724609375, 0.32708740234375, 0.33740234375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 12.0, 20.0, 62.0, 210.0, 947.0, 21864.0, 1017566.0, 7075.0, 559.0, 146.0, 48.0, 17.0, 11.0, 8.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65625, -0.6359786987304688, -0.6157073974609375, -0.5954360961914062, -0.575164794921875, -0.5548934936523438, -0.5346221923828125, -0.5143508911132812, -0.49407958984375, -0.47380828857421875, -0.4535369873046875, -0.43326568603515625, -0.412994384765625, -0.39272308349609375, -0.3724517822265625, -0.35218048095703125, -0.3319091796875, -0.31163787841796875, -0.2913665771484375, -0.27109527587890625, -0.250823974609375, -0.23055267333984375, -0.2102813720703125, -0.19001007080078125, -0.16973876953125, -0.14946746826171875, -0.1291961669921875, -0.10892486572265625, -0.088653564453125, -0.06838226318359375, -0.0481109619140625, -0.02783966064453125, -0.007568359375, 0.01270294189453125, 0.0329742431640625, 0.05324554443359375, 0.073516845703125, 0.09378814697265625, 0.1140594482421875, 0.13433074951171875, 0.15460205078125, 0.17487335205078125, 0.1951446533203125, 0.21541595458984375, 0.235687255859375, 0.25595855712890625, 0.2762298583984375, 0.29650115966796875, 0.3167724609375, 0.33704376220703125, 0.3573150634765625, 0.37758636474609375, 0.397857666015625, 0.41812896728515625, 0.4384002685546875, 0.45867156982421875, 0.47894287109375, 0.49921417236328125, 0.5194854736328125, 0.5397567749023438, 0.560028076171875, 0.5802993774414062, 0.6005706787109375, 0.6208419799804688, 0.64111328125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 9.0, 15.0, 46.0, 110.0, 212.0, 309.0, 171.0, 85.0, 30.0, 14.0, 7.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007557868957519531, -0.0007323622703552246, -0.0007089376449584961, -0.0006855130195617676, -0.0006620883941650391, -0.0006386637687683105, -0.000615239143371582, -0.0005918145179748535, -0.000568389892578125, -0.0005449652671813965, -0.000521540641784668, -0.0004981160163879395, -0.00047469139099121094, -0.0004512667655944824, -0.0004278421401977539, -0.0004044175148010254, -0.0003809928894042969, -0.00035756826400756836, -0.00033414363861083984, -0.00031071901321411133, -0.0002872943878173828, -0.0002638697624206543, -0.00024044513702392578, -0.00021702051162719727, -0.00019359588623046875, -0.00017017126083374023, -0.00014674663543701172, -0.0001233220100402832, -9.989738464355469e-05, -7.647275924682617e-05, -5.3048133850097656e-05, -2.962350845336914e-05, -6.198883056640625e-06, 1.722574234008789e-05, 4.0650367736816406e-05, 6.407499313354492e-05, 8.749961853027344e-05, 0.00011092424392700195, 0.00013434886932373047, 0.00015777349472045898, 0.0001811981201171875, 0.00020462274551391602, 0.00022804737091064453, 0.00025147199630737305, 0.00027489662170410156, 0.0002983212471008301, 0.0003217458724975586, 0.0003451704978942871, 0.0003685951232910156, 0.00039201974868774414, 0.00041544437408447266, 0.00043886899948120117, 0.0004622936248779297, 0.0004857182502746582, 0.0005091428756713867, 0.0005325675010681152, 0.0005559921264648438, 0.0005794167518615723, 0.0006028413772583008, 0.0006262660026550293, 0.0006496906280517578, 0.0006731152534484863, 0.0006965398788452148, 0.0007199645042419434, 0.0007433891296386719]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 12.0, 16.0, 35.0, 57.0, 103.0, 138.0, 297.0, 973.0, 24873.0, 1012579.0, 8239.0, 651.0, 244.0, 146.0, 78.0, 51.0, 25.0, 10.0, 8.0, 7.0, 4.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.65576171875, -0.6377372741699219, -0.6197128295898438, -0.6016883850097656, -0.5836639404296875, -0.5656394958496094, -0.5476150512695312, -0.5295906066894531, -0.511566162109375, -0.4935417175292969, -0.47551727294921875, -0.4574928283691406, -0.4394683837890625, -0.4214439392089844, -0.40341949462890625, -0.3853950500488281, -0.36737060546875, -0.3493461608886719, -0.33132171630859375, -0.3132972717285156, -0.2952728271484375, -0.2772483825683594, -0.25922393798828125, -0.24119949340820312, -0.223175048828125, -0.20515060424804688, -0.18712615966796875, -0.16910171508789062, -0.1510772705078125, -0.13305282592773438, -0.11502838134765625, -0.09700393676757812, -0.0789794921875, -0.060955047607421875, -0.04293060302734375, -0.024906158447265625, -0.0068817138671875, 0.011142730712890625, 0.02916717529296875, 0.047191619873046875, 0.065216064453125, 0.08324050903320312, 0.10126495361328125, 0.11928939819335938, 0.1373138427734375, 0.15533828735351562, 0.17336273193359375, 0.19138717651367188, 0.20941162109375, 0.22743606567382812, 0.24546051025390625, 0.2634849548339844, 0.2815093994140625, 0.2995338439941406, 0.31755828857421875, 0.3355827331542969, 0.353607177734375, 0.3716316223144531, 0.38965606689453125, 0.4076805114746094, 0.4257049560546875, 0.4437294006347656, 0.46175384521484375, 0.4797782897949219, 0.497802734375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 14.0, 24.0, 135.0, 455.0, 301.0, 57.0, 14.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53125, -0.5134124755859375, -0.495574951171875, -0.4777374267578125, -0.45989990234375, -0.4420623779296875, -0.424224853515625, -0.4063873291015625, -0.3885498046875, -0.3707122802734375, -0.352874755859375, -0.3350372314453125, -0.31719970703125, -0.2993621826171875, -0.281524658203125, -0.2636871337890625, -0.245849609375, -0.2280120849609375, -0.210174560546875, -0.1923370361328125, -0.17449951171875, -0.1566619873046875, -0.138824462890625, -0.1209869384765625, -0.1031494140625, -0.0853118896484375, -0.067474365234375, -0.0496368408203125, -0.03179931640625, -0.0139617919921875, 0.003875732421875, 0.0217132568359375, 0.03955078125, 0.0573883056640625, 0.075225830078125, 0.0930633544921875, 0.11090087890625, 0.1287384033203125, 0.146575927734375, 0.1644134521484375, 0.1822509765625, 0.2000885009765625, 0.217926025390625, 0.2357635498046875, 0.25360107421875, 0.2714385986328125, 0.289276123046875, 0.3071136474609375, 0.324951171875, 0.3427886962890625, 0.360626220703125, 0.3784637451171875, 0.39630126953125, 0.4141387939453125, 0.431976318359375, 0.4498138427734375, 0.4676513671875, 0.4854888916015625, 0.503326416015625, 0.5211639404296875, 0.53900146484375, 0.5568389892578125, 0.574676513671875, 0.5925140380859375, 0.6103515625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 7.0, 16.0, 46.0, 121.0, 320.0, 338.0, 117.0, 28.0, 7.0, 2.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.74886417388916, -4.591914176940918, -4.434964656829834, -4.278014659881592, -4.121065139770508, -3.9641153812408447, -3.8071656227111816, -3.6502156257629395, -3.4932661056518555, -3.3363163471221924, -3.1793665885925293, -3.022416830062866, -2.865467071533203, -2.70851731300354, -2.551567554473877, -2.3946175575256348, -2.2376677989959717, -2.0807180404663086, -1.9237682819366455, -1.7668185234069824, -1.6098687648773193, -1.4529190063476562, -1.2959691286087036, -1.1390193700790405, -0.9820696115493774, -0.8251198530197144, -0.6681700944900513, -0.5112202763557434, -0.3542705178260803, -0.19732075929641724, -0.040370941162109375, 0.11657881736755371, 0.2735285758972168, 0.4304783344268799, 0.587428092956543, 0.7443779110908508, 0.9013276696205139, 1.0582773685455322, 1.2152272462844849, 1.372177004814148, 1.529126763343811, 1.6860765218734741, 1.8430262804031372, 1.9999761581420898, 2.156925916671753, 2.313875675201416, 2.470825433731079, 2.627775192260742, 2.7847249507904053, 2.9416747093200684, 3.0986244678497314, 3.2555742263793945, 3.4125239849090576, 3.5694737434387207, 3.726423740386963, 3.883373260498047, 4.040323257446289, 4.197273254394531, 4.354222774505615, 4.511172771453857, 4.668122291564941, 4.825072288513184, 4.982021808624268, 5.13897180557251, 5.295921325683594]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 4.0, 8.0, 8.0, 6.0, 7.0, 7.0, 11.0, 11.0, 18.0, 25.0, 14.0, 27.0, 31.0, 31.0, 31.0, 38.0, 40.0, 47.0, 49.0, 48.0, 40.0, 42.0, 35.0, 48.0, 47.0, 32.0, 40.0, 39.0, 32.0, 34.0, 24.0, 15.0, 15.0, 11.0, 11.0, 14.0, 12.0, 9.0, 4.0, 5.0, 5.0, 5.0, 4.0, 5.0, 5.0, 6.0, 4.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.5518990755081177, -1.5057920217514038, -1.4596848487854004, -1.4135777950286865, -1.367470622062683, -1.3213635683059692, -1.2752563953399658, -1.229149341583252, -1.183042287826538, -1.1369352340698242, -1.0908280611038208, -1.044721007347107, -0.9986138343811035, -0.9525067806243896, -0.906399667263031, -0.8602925539016724, -0.814185380935669, -0.7680782675743103, -0.7219711542129517, -0.6758641004562378, -0.6297569274902344, -0.5836498737335205, -0.5375427603721619, -0.4914356470108032, -0.4453285336494446, -0.39922142028808594, -0.3531143069267273, -0.30700722336769104, -0.2609001100063324, -0.21479299664497375, -0.1686859130859375, -0.12257879972457886, -0.07647180557250977, -0.03036469966173172, 0.015742406249046326, 0.061849504709243774, 0.10795661807060242, 0.15406373143196106, 0.20017081499099731, 0.24627792835235596, 0.2923850417137146, 0.33849215507507324, 0.3845992684364319, 0.43070635199546814, 0.4768134653568268, 0.5229206085205078, 0.5690276622772217, 0.6151347756385803, 0.661241888999939, 0.7073490023612976, 0.7534561157226562, 0.7995631694793701, 0.8456703424453735, 0.8917773962020874, 0.937884509563446, 0.9839916229248047, 1.0300986766815186, 1.0762057304382324, 1.1223129034042358, 1.1684199571609497, 1.2145271301269531, 1.260634183883667, 1.3067412376403809, 1.3528484106063843, 1.3989555835723877]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 2.0, 5.0, 18.0, 12.0, 29.0, 41.0, 71.0, 175.0, 337.0, 902.0, 3066.0, 23734.0, 4068376.0, 89445.0, 5676.0, 1284.0, 541.0, 243.0, 137.0, 84.0, 40.0, 24.0, 12.0, 15.0, 5.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.10546875, -1.0736007690429688, -1.0417327880859375, -1.0098648071289062, -0.977996826171875, -0.9461288452148438, -0.9142608642578125, -0.8823928833007812, -0.85052490234375, -0.8186569213867188, -0.7867889404296875, -0.7549209594726562, -0.723052978515625, -0.6911849975585938, -0.6593170166015625, -0.6274490356445312, -0.5955810546875, -0.5637130737304688, -0.5318450927734375, -0.49997711181640625, -0.468109130859375, -0.43624114990234375, -0.4043731689453125, -0.37250518798828125, -0.34063720703125, -0.30876922607421875, -0.2769012451171875, -0.24503326416015625, -0.213165283203125, -0.18129730224609375, -0.1494293212890625, -0.11756134033203125, -0.085693359375, -0.05382537841796875, -0.0219573974609375, 0.00991058349609375, 0.041778564453125, 0.07364654541015625, 0.1055145263671875, 0.13738250732421875, 0.16925048828125, 0.20111846923828125, 0.2329864501953125, 0.26485443115234375, 0.296722412109375, 0.32859039306640625, 0.3604583740234375, 0.39232635498046875, 0.4241943359375, 0.45606231689453125, 0.4879302978515625, 0.5197982788085938, 0.551666259765625, 0.5835342407226562, 0.6154022216796875, 0.6472702026367188, 0.67913818359375, 0.7110061645507812, 0.7428741455078125, 0.7747421264648438, 0.806610107421875, 0.8384780883789062, 0.8703460693359375, 0.9022140502929688, 0.93408203125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 5.0, 7.0, 17.0, 23.0, 34.0, 62.0, 74.0, 87.0, 99.0, 106.0, 95.0, 94.0, 90.0, 68.0, 54.0, 36.0, 22.0, 11.0, 11.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1773681640625, -0.171630859375, -0.1658935546875, -0.16015625, -0.1544189453125, -0.148681640625, -0.1429443359375, -0.13720703125, -0.1314697265625, -0.125732421875, -0.1199951171875, -0.1142578125, -0.1085205078125, -0.102783203125, -0.0970458984375, -0.09130859375, -0.0855712890625, -0.079833984375, -0.0740966796875, -0.068359375, -0.0626220703125, -0.056884765625, -0.0511474609375, -0.04541015625, -0.0396728515625, -0.033935546875, -0.0281982421875, -0.0224609375, -0.0167236328125, -0.010986328125, -0.0052490234375, 0.00048828125, 0.0062255859375, 0.011962890625, 0.0177001953125, 0.0234375, 0.0291748046875, 0.034912109375, 0.0406494140625, 0.04638671875, 0.0521240234375, 0.057861328125, 0.0635986328125, 0.0693359375, 0.0750732421875, 0.080810546875, 0.0865478515625, 0.09228515625, 0.0980224609375, 0.103759765625, 0.1094970703125, 0.115234375, 0.1209716796875, 0.126708984375, 0.1324462890625, 0.13818359375, 0.1439208984375, 0.149658203125, 0.1553955078125, 0.1611328125, 0.1668701171875, 0.172607421875, 0.1783447265625, 0.18408203125, 0.1898193359375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 8.0, 17.0, 19.0, 32.0, 50.0, 87.0, 134.0, 239.0, 530.0, 1250.0, 4948.0, 54928.0, 4090656.0, 35265.0, 4023.0, 1100.0, 439.0, 237.0, 143.0, 65.0, 43.0, 26.0, 14.0, 18.0, 7.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8916015625, -0.8623123168945312, -0.8330230712890625, -0.8037338256835938, -0.774444580078125, -0.7451553344726562, -0.7158660888671875, -0.6865768432617188, -0.65728759765625, -0.6279983520507812, -0.5987091064453125, -0.5694198608398438, -0.540130615234375, -0.5108413696289062, -0.4815521240234375, -0.45226287841796875, -0.4229736328125, -0.39368438720703125, -0.3643951416015625, -0.33510589599609375, -0.305816650390625, -0.27652740478515625, -0.2472381591796875, -0.21794891357421875, -0.18865966796875, -0.15937042236328125, -0.1300811767578125, -0.10079193115234375, -0.071502685546875, -0.04221343994140625, -0.0129241943359375, 0.01636505126953125, 0.045654296875, 0.07494354248046875, 0.1042327880859375, 0.13352203369140625, 0.162811279296875, 0.19210052490234375, 0.2213897705078125, 0.25067901611328125, 0.27996826171875, 0.30925750732421875, 0.3385467529296875, 0.36783599853515625, 0.397125244140625, 0.42641448974609375, 0.4557037353515625, 0.48499298095703125, 0.5142822265625, 0.5435714721679688, 0.5728607177734375, 0.6021499633789062, 0.631439208984375, 0.6607284545898438, 0.6900177001953125, 0.7193069458007812, 0.74859619140625, 0.7778854370117188, 0.8071746826171875, 0.8364639282226562, 0.865753173828125, 0.8950424194335938, 0.9243316650390625, 0.9536209106445312, 0.98291015625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 4.0, 10.0, 9.0, 10.0, 22.0, 49.0, 168.0, 1484.0, 2027.0, 182.0, 62.0, 22.0, 11.0, 8.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30224609375, -0.2930946350097656, -0.28394317626953125, -0.2747917175292969, -0.2656402587890625, -0.2564888000488281, -0.24733734130859375, -0.23818588256835938, -0.229034423828125, -0.21988296508789062, -0.21073150634765625, -0.20158004760742188, -0.1924285888671875, -0.18327713012695312, -0.17412567138671875, -0.16497421264648438, -0.15582275390625, -0.14667129516601562, -0.13751983642578125, -0.12836837768554688, -0.1192169189453125, -0.11006546020507812, -0.10091400146484375, -0.09176254272460938, -0.082611083984375, -0.07345962524414062, -0.06430816650390625, -0.055156707763671875, -0.0460052490234375, -0.036853790283203125, -0.02770233154296875, -0.018550872802734375, -0.0093994140625, -0.000247955322265625, 0.00890350341796875, 0.018054962158203125, 0.0272064208984375, 0.036357879638671875, 0.04550933837890625, 0.054660797119140625, 0.063812255859375, 0.07296371459960938, 0.08211517333984375, 0.09126663208007812, 0.1004180908203125, 0.10956954956054688, 0.11872100830078125, 0.12787246704101562, 0.13702392578125, 0.14617538452148438, 0.15532684326171875, 0.16447830200195312, 0.1736297607421875, 0.18278121948242188, 0.19193267822265625, 0.20108413696289062, 0.210235595703125, 0.21938705444335938, 0.22853851318359375, 0.23768997192382812, 0.2468414306640625, 0.2559928894042969, 0.26514434814453125, 0.2742958068847656, 0.283447265625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 15.0, 55.0, 231.0, 422.0, 198.0, 47.0, 20.0, 2.0, 3.0, 1.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0669002532958984, -2.0030205249786377, -1.939140796661377, -1.8752609491348267, -1.811381220817566, -1.7475014925003052, -1.6836216449737549, -1.6197419166564941, -1.5558621883392334, -1.4919824600219727, -1.428102731704712, -1.3642228841781616, -1.3003431558609009, -1.2364634275436401, -1.1725835800170898, -1.108703851699829, -1.0448241233825684, -0.9809443950653076, -0.9170646071434021, -0.8531848192214966, -0.7893050909042358, -0.7254253625869751, -0.6615455746650696, -0.5976657867431641, -0.5337860584259033, -0.4699063003063202, -0.40602654218673706, -0.34214678406715393, -0.2782670259475708, -0.21438726782798767, -0.15050750970840454, -0.08662775158882141, -0.022748231887817383, 0.04113152623176575, 0.10501128435134888, 0.168891042470932, 0.23277080059051514, 0.29665055871009827, 0.3605303168296814, 0.4244100749492645, 0.48828983306884766, 0.5521695613861084, 0.6160493493080139, 0.6799291372299194, 0.7438088655471802, 0.8076885938644409, 0.8715683817863464, 0.935448169708252, 0.9993278980255127, 1.0632076263427734, 1.1270873546600342, 1.1909672021865845, 1.2548469305038452, 1.318726658821106, 1.3826065063476562, 1.446486234664917, 1.5103659629821777, 1.5742456912994385, 1.6381254196166992, 1.7020052671432495, 1.7658849954605103, 1.829764723777771, 1.8936445713043213, 1.957524299621582, 2.0214040279388428]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 14.0, 16.0, 23.0, 30.0, 43.0, 67.0, 70.0, 90.0, 96.0, 92.0, 96.0, 82.0, 68.0, 67.0, 45.0, 28.0, 29.0, 14.0, 11.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6373637914657593, -0.6132196187973022, -0.5890754461288452, -0.5649312734603882, -0.5407871007919312, -0.5166428685188293, -0.4924986958503723, -0.4683545231819153, -0.44421035051345825, -0.4200661778450012, -0.3959220051765442, -0.37177780270576477, -0.34763363003730774, -0.3234894573688507, -0.2993452548980713, -0.27520108222961426, -0.2510569095611572, -0.2269127368927002, -0.20276854932308197, -0.17862436175346375, -0.1544801890850067, -0.13033601641654968, -0.10619182884693146, -0.08204764127731323, -0.0579034686088562, -0.03375928848981857, -0.009615108370780945, 0.014529071748256683, 0.03867325186729431, 0.06281743198633194, 0.08696161210536957, 0.11110579967498779, 0.13524991273880005, 0.15939408540725708, 0.1835382729768753, 0.20768246054649353, 0.23182663321495056, 0.2559708058834076, 0.280115008354187, 0.30425918102264404, 0.3284033536911011, 0.3525475263595581, 0.37669169902801514, 0.40083590149879456, 0.4249800741672516, 0.4491242468357086, 0.47326844930648804, 0.49741262197494507, 0.5215567946434021, 0.5457009673118591, 0.5698451399803162, 0.5939893126487732, 0.618133544921875, 0.642277717590332, 0.6664218902587891, 0.6905660629272461, 0.7147102355957031, 0.7388544082641602, 0.7629985809326172, 0.7871427536010742, 0.8112869262695312, 0.8354311585426331, 0.8595753312110901, 0.8837195038795471, 0.9078636765480042]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 6.0, 12.0, 20.0, 25.0, 39.0, 78.0, 126.0, 231.0, 480.0, 1251.0, 4620.0, 34030.0, 664377.0, 320260.0, 18063.0, 3109.0, 936.0, 413.0, 196.0, 112.0, 71.0, 28.0, 30.0, 12.0, 7.0, 12.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.79296875, -0.7695541381835938, -0.7461395263671875, -0.7227249145507812, -0.699310302734375, -0.6758956909179688, -0.6524810791015625, -0.6290664672851562, -0.60565185546875, -0.5822372436523438, -0.5588226318359375, -0.5354080200195312, -0.511993408203125, -0.48857879638671875, -0.4651641845703125, -0.44174957275390625, -0.4183349609375, -0.39492034912109375, -0.3715057373046875, -0.34809112548828125, -0.324676513671875, -0.30126190185546875, -0.2778472900390625, -0.25443267822265625, -0.23101806640625, -0.20760345458984375, -0.1841888427734375, -0.16077423095703125, -0.137359619140625, -0.11394500732421875, -0.0905303955078125, -0.06711578369140625, -0.043701171875, -0.02028656005859375, 0.0031280517578125, 0.02654266357421875, 0.049957275390625, 0.07337188720703125, 0.0967864990234375, 0.12020111083984375, 0.14361572265625, 0.16703033447265625, 0.1904449462890625, 0.21385955810546875, 0.237274169921875, 0.26068878173828125, 0.2841033935546875, 0.30751800537109375, 0.3309326171875, 0.35434722900390625, 0.3777618408203125, 0.40117645263671875, 0.424591064453125, 0.44800567626953125, 0.4714202880859375, 0.49483489990234375, 0.51824951171875, 0.5416641235351562, 0.5650787353515625, 0.5884933471679688, 0.611907958984375, 0.6353225708007812, 0.6587371826171875, 0.6821517944335938, 0.70556640625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 2.0, 9.0, 17.0, 30.0, 39.0, 67.0, 73.0, 114.0, 87.0, 104.0, 112.0, 107.0, 83.0, 57.0, 49.0, 20.0, 15.0, 7.0, 6.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1917724609375, -0.18567848205566406, -0.17958450317382812, -0.1734905242919922, -0.16739654541015625, -0.1613025665283203, -0.15520858764648438, -0.14911460876464844, -0.1430206298828125, -0.13692665100097656, -0.13083267211914062, -0.12473869323730469, -0.11864471435546875, -0.11255073547363281, -0.10645675659179688, -0.10036277770996094, -0.094268798828125, -0.08817481994628906, -0.08208084106445312, -0.07598686218261719, -0.06989288330078125, -0.06379890441894531, -0.057704925537109375, -0.05161094665527344, -0.0455169677734375, -0.03942298889160156, -0.033329010009765625, -0.027235031127929688, -0.02114105224609375, -0.015047073364257812, -0.008953094482421875, -0.0028591156005859375, 0.00323486328125, 0.009328842163085938, 0.015422821044921875, 0.021516799926757812, 0.02761077880859375, 0.03370475769042969, 0.039798736572265625, 0.04589271545410156, 0.0519866943359375, 0.05808067321777344, 0.06417465209960938, 0.07026863098144531, 0.07636260986328125, 0.08245658874511719, 0.08855056762695312, 0.09464454650878906, 0.100738525390625, 0.10683250427246094, 0.11292648315429688, 0.11902046203613281, 0.12511444091796875, 0.1312084197998047, 0.13730239868164062, 0.14339637756347656, 0.1494903564453125, 0.15558433532714844, 0.16167831420898438, 0.1677722930908203, 0.17386627197265625, 0.1799602508544922, 0.18605422973632812, 0.19214820861816406, 0.1982421875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 6.0, 4.0, 8.0, 8.0, 19.0, 13.0, 17.0, 38.0, 35.0, 58.0, 79.0, 135.0, 258.0, 536.0, 1709.0, 5982.0, 28431.0, 201684.0, 650360.0, 132125.0, 20249.0, 4433.0, 1307.0, 497.0, 215.0, 112.0, 58.0, 54.0, 30.0, 19.0, 19.0, 16.0, 15.0, 4.0, 7.0, 4.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.322265625, -0.3116645812988281, -0.30106353759765625, -0.2904624938964844, -0.2798614501953125, -0.2692604064941406, -0.25865936279296875, -0.24805831909179688, -0.237457275390625, -0.22685623168945312, -0.21625518798828125, -0.20565414428710938, -0.1950531005859375, -0.18445205688476562, -0.17385101318359375, -0.16324996948242188, -0.15264892578125, -0.14204788208007812, -0.13144683837890625, -0.12084579467773438, -0.1102447509765625, -0.09964370727539062, -0.08904266357421875, -0.07844161987304688, -0.067840576171875, -0.057239532470703125, -0.04663848876953125, -0.036037445068359375, -0.0254364013671875, -0.014835357666015625, -0.00423431396484375, 0.006366729736328125, 0.0169677734375, 0.027568817138671875, 0.03816986083984375, 0.048770904541015625, 0.0593719482421875, 0.06997299194335938, 0.08057403564453125, 0.09117507934570312, 0.101776123046875, 0.11237716674804688, 0.12297821044921875, 0.13357925415039062, 0.1441802978515625, 0.15478134155273438, 0.16538238525390625, 0.17598342895507812, 0.18658447265625, 0.19718551635742188, 0.20778656005859375, 0.21838760375976562, 0.2289886474609375, 0.23958969116210938, 0.25019073486328125, 0.2607917785644531, 0.271392822265625, 0.2819938659667969, 0.29259490966796875, 0.3031959533691406, 0.3137969970703125, 0.3243980407714844, 0.33499908447265625, 0.3456001281738281, 0.356201171875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 2.0, 2.0, 12.0, 8.0, 9.0, 11.0, 14.0, 13.0, 13.0, 14.0, 25.0, 32.0, 32.0, 29.0, 30.0, 43.0, 48.0, 41.0, 34.0, 57.0, 47.0, 49.0, 35.0, 48.0, 40.0, 45.0, 33.0, 34.0, 28.0, 24.0, 27.0, 19.0, 32.0, 20.0, 7.0, 11.0, 10.0, 3.0, 5.0, 7.0, 2.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.273681640625, -0.2647056579589844, -0.25572967529296875, -0.24675369262695312, -0.2377777099609375, -0.22880172729492188, -0.21982574462890625, -0.21084976196289062, -0.201873779296875, -0.19289779663085938, -0.18392181396484375, -0.17494583129882812, -0.1659698486328125, -0.15699386596679688, -0.14801788330078125, -0.13904190063476562, -0.13006591796875, -0.12108993530273438, -0.11211395263671875, -0.10313796997070312, -0.0941619873046875, -0.08518600463867188, -0.07621002197265625, -0.06723403930664062, -0.058258056640625, -0.049282073974609375, -0.04030609130859375, -0.031330108642578125, -0.0223541259765625, -0.013378143310546875, -0.00440216064453125, 0.004573822021484375, 0.0135498046875, 0.022525787353515625, 0.03150177001953125, 0.040477752685546875, 0.0494537353515625, 0.058429718017578125, 0.06740570068359375, 0.07638168334960938, 0.085357666015625, 0.09433364868164062, 0.10330963134765625, 0.11228561401367188, 0.1212615966796875, 0.13023757934570312, 0.13921356201171875, 0.14818954467773438, 0.15716552734375, 0.16614151000976562, 0.17511749267578125, 0.18409347534179688, 0.1930694580078125, 0.20204544067382812, 0.21102142333984375, 0.21999740600585938, 0.228973388671875, 0.23794937133789062, 0.24692535400390625, 0.2559013366699219, 0.2648773193359375, 0.2738533020019531, 0.28282928466796875, 0.2918052673339844, 0.30078125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 2.0, 9.0, 3.0, 6.0, 22.0, 19.0, 34.0, 60.0, 76.0, 123.0, 210.0, 373.0, 839.0, 2303.0, 9453.0, 78605.0, 648914.0, 275873.0, 24622.0, 4485.0, 1281.0, 498.0, 274.0, 158.0, 95.0, 61.0, 47.0, 30.0, 25.0, 18.0, 14.0, 7.0, 5.0, 1.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1539306640625, -0.14908218383789062, -0.14423370361328125, -0.13938522338867188, -0.1345367431640625, -0.12968826293945312, -0.12483978271484375, -0.11999130249023438, -0.115142822265625, -0.11029434204101562, -0.10544586181640625, -0.10059738159179688, -0.0957489013671875, -0.09090042114257812, -0.08605194091796875, -0.08120346069335938, -0.07635498046875, -0.07150650024414062, -0.06665802001953125, -0.061809539794921875, -0.0569610595703125, -0.052112579345703125, -0.04726409912109375, -0.042415618896484375, -0.037567138671875, -0.032718658447265625, -0.02787017822265625, -0.023021697998046875, -0.0181732177734375, -0.013324737548828125, -0.00847625732421875, -0.003627777099609375, 0.001220703125, 0.006069183349609375, 0.01091766357421875, 0.015766143798828125, 0.0206146240234375, 0.025463104248046875, 0.03031158447265625, 0.035160064697265625, 0.040008544921875, 0.044857025146484375, 0.04970550537109375, 0.054553985595703125, 0.0594024658203125, 0.06425094604492188, 0.06909942626953125, 0.07394790649414062, 0.07879638671875, 0.08364486694335938, 0.08849334716796875, 0.09334182739257812, 0.0981903076171875, 0.10303878784179688, 0.10788726806640625, 0.11273574829101562, 0.117584228515625, 0.12243270874023438, 0.12728118896484375, 0.13212966918945312, 0.1369781494140625, 0.14182662963867188, 0.14667510986328125, 0.15152359008789062, 0.1563720703125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 3.0, 13.0, 24.0, 41.0, 75.0, 121.0, 182.0, 183.0, 151.0, 93.0, 53.0, 28.0, 13.0, 17.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004470348358154297, -0.00043696723878383636, -0.00042689964175224304, -0.0004168320447206497, -0.0004067644476890564, -0.0003966968506574631, -0.00038662925362586975, -0.00037656165659427643, -0.0003664940595626831, -0.0003564264625310898, -0.00034635886549949646, -0.00033629126846790314, -0.0003262236714363098, -0.0003161560744047165, -0.00030608847737312317, -0.00029602088034152985, -0.0002859532833099365, -0.0002758856862783432, -0.0002658180892467499, -0.00025575049221515656, -0.00024568289518356323, -0.0002356152981519699, -0.0002255477011203766, -0.00021548010408878326, -0.00020541250705718994, -0.00019534491002559662, -0.0001852773129940033, -0.00017520971596240997, -0.00016514211893081665, -0.00015507452189922333, -0.00014500692486763, -0.00013493932783603668, -0.00012487173080444336, -0.00011480413377285004, -0.00010473653674125671, -9.466893970966339e-05, -8.460134267807007e-05, -7.453374564647675e-05, -6.446614861488342e-05, -5.43985515832901e-05, -4.433095455169678e-05, -3.4263357520103455e-05, -2.4195760488510132e-05, -1.4128163456916809e-05, -4.060566425323486e-06, 6.0070306062698364e-06, 1.607462763786316e-05, 2.6142224669456482e-05, 3.6209821701049805e-05, 4.627741873264313e-05, 5.634501576423645e-05, 6.641261279582977e-05, 7.64802098274231e-05, 8.654780685901642e-05, 9.661540389060974e-05, 0.00010668300092220306, 0.00011675059795379639, 0.0001268181949853897, 0.00013688579201698303, 0.00014695338904857635, 0.00015702098608016968, 0.000167088583111763, 0.00017715618014335632, 0.00018722377717494965, 0.00019729137420654297]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 11.0, 9.0, 20.0, 29.0, 59.0, 144.0, 286.0, 815.0, 4432.0, 71730.0, 870650.0, 93860.0, 4921.0, 972.0, 319.0, 142.0, 67.0, 31.0, 18.0, 17.0, 6.0, 8.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1976318359375, -0.19045448303222656, -0.18327713012695312, -0.1760997772216797, -0.16892242431640625, -0.1617450714111328, -0.15456771850585938, -0.14739036560058594, -0.1402130126953125, -0.13303565979003906, -0.12585830688476562, -0.11868095397949219, -0.11150360107421875, -0.10432624816894531, -0.09714889526367188, -0.08997154235839844, -0.082794189453125, -0.07561683654785156, -0.06843948364257812, -0.06126213073730469, -0.05408477783203125, -0.04690742492675781, -0.039730072021484375, -0.03255271911621094, -0.0253753662109375, -0.018198013305664062, -0.011020660400390625, -0.0038433074951171875, 0.00333404541015625, 0.010511398315429688, 0.017688751220703125, 0.024866104125976562, 0.03204345703125, 0.03922080993652344, 0.046398162841796875, 0.05357551574707031, 0.06075286865234375, 0.06793022155761719, 0.07510757446289062, 0.08228492736816406, 0.0894622802734375, 0.09663963317871094, 0.10381698608398438, 0.11099433898925781, 0.11817169189453125, 0.1253490447998047, 0.13252639770507812, 0.13970375061035156, 0.146881103515625, 0.15405845642089844, 0.16123580932617188, 0.1684131622314453, 0.17559051513671875, 0.1827678680419922, 0.18994522094726562, 0.19712257385253906, 0.2042999267578125, 0.21147727966308594, 0.21865463256835938, 0.2258319854736328, 0.23300933837890625, 0.2401866912841797, 0.24736404418945312, 0.25454139709472656, 0.26171875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 15.0, 24.0, 30.0, 84.0, 131.0, 195.0, 202.0, 146.0, 90.0, 50.0, 17.0, 10.0, 6.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.178466796875, -0.17106246948242188, -0.16365814208984375, -0.15625381469726562, -0.1488494873046875, -0.14144515991210938, -0.13404083251953125, -0.12663650512695312, -0.119232177734375, -0.11182785034179688, -0.10442352294921875, -0.09701919555664062, -0.0896148681640625, -0.08221054077148438, -0.07480621337890625, -0.06740188598632812, -0.05999755859375, -0.052593231201171875, -0.04518890380859375, -0.037784576416015625, -0.0303802490234375, -0.022975921630859375, -0.01557159423828125, -0.008167266845703125, -0.000762939453125, 0.006641387939453125, 0.01404571533203125, 0.021450042724609375, 0.0288543701171875, 0.036258697509765625, 0.04366302490234375, 0.051067352294921875, 0.0584716796875, 0.06587600708007812, 0.07328033447265625, 0.08068466186523438, 0.0880889892578125, 0.09549331665039062, 0.10289764404296875, 0.11030197143554688, 0.117706298828125, 0.12511062622070312, 0.13251495361328125, 0.13991928100585938, 0.1473236083984375, 0.15472793579101562, 0.16213226318359375, 0.16953659057617188, 0.17694091796875, 0.18434524536132812, 0.19174957275390625, 0.19915390014648438, 0.2065582275390625, 0.21396255493164062, 0.22136688232421875, 0.22877120971679688, 0.236175537109375, 0.24357986450195312, 0.25098419189453125, 0.2583885192871094, 0.2657928466796875, 0.2731971740722656, 0.28060150146484375, 0.2880058288574219, 0.29541015625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 11.0, 31.0, 77.0, 251.0, 360.0, 204.0, 51.0, 17.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.137864589691162, -2.9975500106811523, -2.8572354316711426, -2.716920852661133, -2.576606273651123, -2.4362916946411133, -2.2959768772125244, -2.1556622982025146, -2.015347719192505, -1.8750331401824951, -1.7347185611724854, -1.594403862953186, -1.4540892839431763, -1.3137747049331665, -1.1734600067138672, -1.0331454277038574, -0.8928308486938477, -0.7525162696838379, -0.6122016310691833, -0.4718870222568512, -0.33157241344451904, -0.19125783443450928, -0.050943195819854736, 0.0893714427947998, 0.22968602180480957, 0.3700006306171417, 0.5103152394294739, 0.6506298780441284, 0.7909444570541382, 0.931259036064148, 1.0715737342834473, 1.211888313293457, 1.352203369140625, 1.4925179481506348, 1.6328325271606445, 1.7731472253799438, 1.9134618043899536, 2.053776264190674, 2.1940910816192627, 2.3344056606292725, 2.4747202396392822, 2.615034818649292, 2.7553493976593018, 2.8956639766693115, 3.0359787940979004, 3.17629337310791, 3.31660795211792, 3.4569225311279297, 3.5972371101379395, 3.737551689147949, 3.877866268157959, 4.018180847167969, 4.1584954261779785, 4.298810005187988, 4.439124584197998, 4.579439163208008, 4.719754219055176, 4.8600687980651855, 5.000383377075195, 5.140697956085205, 5.281012535095215, 5.421327114105225, 5.561641693115234, 5.701956748962402, 5.842270851135254]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 14.0, 13.0, 13.0, 18.0, 22.0, 26.0, 27.0, 30.0, 38.0, 39.0, 38.0, 40.0, 51.0, 55.0, 44.0, 70.0, 51.0, 40.0, 51.0, 51.0, 32.0, 43.0, 30.0, 31.0, 25.0, 24.0, 16.0, 16.0, 8.0, 11.0, 11.0, 7.0, 9.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.80057692527771, -1.7496801614761353, -1.6987833976745605, -1.6478866338729858, -1.5969898700714111, -1.5460931062698364, -1.4951963424682617, -1.444299578666687, -1.3934028148651123, -1.3425060510635376, -1.291609287261963, -1.2407125234603882, -1.1898157596588135, -1.1389189958572388, -1.088022232055664, -1.0371254682540894, -0.9862286448478699, -0.9353318810462952, -0.8844351172447205, -0.8335383534431458, -0.782641589641571, -0.7317447662353516, -0.6808480024337769, -0.6299512386322021, -0.5790544748306274, -0.5281577110290527, -0.477260947227478, -0.4263641834259033, -0.3754674196243286, -0.3245706260204315, -0.2736738622188568, -0.2227770984172821, -0.17188036441802979, -0.12098360061645508, -0.07008682936429977, -0.01919005811214447, 0.03170670568943024, 0.08260348439216614, 0.13350024819374084, 0.18439701199531555, 0.23529377579689026, 0.28619053959846497, 0.3370873034000397, 0.38798409700393677, 0.4388808608055115, 0.4897776246070862, 0.5406743884086609, 0.5915711522102356, 0.6424679160118103, 0.693364679813385, 0.7442614436149597, 0.7951582074165344, 0.8460549712181091, 0.8969517946243286, 0.9478485584259033, 0.998745322227478, 1.0496420860290527, 1.1005388498306274, 1.1514356136322021, 1.2023323774337769, 1.2532291412353516, 1.3041259050369263, 1.355022668838501, 1.4059194326400757, 1.4568161964416504]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 6.0, 7.0, 11.0, 12.0, 26.0, 45.0, 71.0, 127.0, 245.0, 504.0, 1353.0, 4897.0, 35421.0, 4087816.0, 54870.0, 5985.0, 1537.0, 625.0, 301.0, 176.0, 98.0, 57.0, 31.0, 17.0, 10.0, 13.0, 7.0, 2.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.3095703125, -1.27056884765625, -1.2315673828125, -1.19256591796875, -1.153564453125, -1.11456298828125, -1.0755615234375, -1.03656005859375, -0.99755859375, -0.95855712890625, -0.9195556640625, -0.88055419921875, -0.841552734375, -0.80255126953125, -0.7635498046875, -0.72454833984375, -0.685546875, -0.64654541015625, -0.6075439453125, -0.56854248046875, -0.529541015625, -0.49053955078125, -0.4515380859375, -0.41253662109375, -0.37353515625, -0.33453369140625, -0.2955322265625, -0.25653076171875, -0.217529296875, -0.17852783203125, -0.1395263671875, -0.10052490234375, -0.0615234375, -0.02252197265625, 0.0164794921875, 0.05548095703125, 0.094482421875, 0.13348388671875, 0.1724853515625, 0.21148681640625, 0.25048828125, 0.28948974609375, 0.3284912109375, 0.36749267578125, 0.406494140625, 0.44549560546875, 0.4844970703125, 0.52349853515625, 0.5625, 0.60150146484375, 0.6405029296875, 0.67950439453125, 0.718505859375, 0.75750732421875, 0.7965087890625, 0.83551025390625, 0.87451171875, 0.91351318359375, 0.9525146484375, 0.99151611328125, 1.030517578125, 1.06951904296875, 1.1085205078125, 1.14752197265625, 1.1865234375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 6.0, 2.0, 12.0, 13.0, 27.0, 34.0, 58.0, 70.0, 85.0, 84.0, 91.0, 110.0, 83.0, 90.0, 74.0, 52.0, 41.0, 28.0, 19.0, 13.0, 8.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1939697265625, -0.1882762908935547, -0.18258285522460938, -0.17688941955566406, -0.17119598388671875, -0.16550254821777344, -0.15980911254882812, -0.1541156768798828, -0.1484222412109375, -0.1427288055419922, -0.13703536987304688, -0.13134193420410156, -0.12564849853515625, -0.11995506286621094, -0.11426162719726562, -0.10856819152832031, -0.102874755859375, -0.09718132019042969, -0.09148788452148438, -0.08579444885253906, -0.08010101318359375, -0.07440757751464844, -0.06871414184570312, -0.06302070617675781, -0.0573272705078125, -0.05163383483886719, -0.045940399169921875, -0.04024696350097656, -0.03455352783203125, -0.028860092163085938, -0.023166656494140625, -0.017473220825195312, -0.01177978515625, -0.0060863494873046875, -0.000392913818359375, 0.0053005218505859375, 0.01099395751953125, 0.016687393188476562, 0.022380828857421875, 0.028074264526367188, 0.0337677001953125, 0.03946113586425781, 0.045154571533203125, 0.05084800720214844, 0.05654144287109375, 0.06223487854003906, 0.06792831420898438, 0.07362174987792969, 0.079315185546875, 0.08500862121582031, 0.09070205688476562, 0.09639549255371094, 0.10208892822265625, 0.10778236389160156, 0.11347579956054688, 0.11916923522949219, 0.1248626708984375, 0.1305561065673828, 0.13624954223632812, 0.14194297790527344, 0.14763641357421875, 0.15332984924316406, 0.15902328491210938, 0.1647167205810547, 0.17041015625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 8.0, 1.0, 5.0, 3.0, 5.0, 8.0, 9.0, 14.0, 22.0, 28.0, 44.0, 58.0, 77.0, 84.0, 134.0, 221.0, 301.0, 537.0, 882.0, 1666.0, 3922.0, 15350.0, 150819.0, 3929683.0, 74154.0, 9875.0, 2942.0, 1350.0, 747.0, 418.0, 302.0, 178.0, 126.0, 75.0, 61.0, 56.0, 39.0, 24.0, 17.0, 9.0, 5.0, 8.0, 8.0, 5.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.517578125, -0.5005416870117188, -0.4835052490234375, -0.46646881103515625, -0.449432373046875, -0.43239593505859375, -0.4153594970703125, -0.39832305908203125, -0.38128662109375, -0.36425018310546875, -0.3472137451171875, -0.33017730712890625, -0.313140869140625, -0.29610443115234375, -0.2790679931640625, -0.26203155517578125, -0.2449951171875, -0.22795867919921875, -0.2109222412109375, -0.19388580322265625, -0.176849365234375, -0.15981292724609375, -0.1427764892578125, -0.12574005126953125, -0.10870361328125, -0.09166717529296875, -0.0746307373046875, -0.05759429931640625, -0.040557861328125, -0.02352142333984375, -0.0064849853515625, 0.01055145263671875, 0.027587890625, 0.04462432861328125, 0.0616607666015625, 0.07869720458984375, 0.095733642578125, 0.11277008056640625, 0.1298065185546875, 0.14684295654296875, 0.16387939453125, 0.18091583251953125, 0.1979522705078125, 0.21498870849609375, 0.232025146484375, 0.24906158447265625, 0.2660980224609375, 0.28313446044921875, 0.3001708984375, 0.31720733642578125, 0.3342437744140625, 0.35128021240234375, 0.368316650390625, 0.38535308837890625, 0.4023895263671875, 0.41942596435546875, 0.43646240234375, 0.45349884033203125, 0.4705352783203125, 0.48757171630859375, 0.504608154296875, 0.5216445922851562, 0.5386810302734375, 0.5557174682617188, 0.57275390625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 1.0, 5.0, 9.0, 12.0, 31.0, 74.0, 210.0, 2981.0, 562.0, 121.0, 36.0, 12.0, 5.0, 5.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.417236328125, -0.4072399139404297, -0.3972434997558594, -0.38724708557128906, -0.37725067138671875, -0.36725425720214844, -0.3572578430175781, -0.3472614288330078, -0.3372650146484375, -0.3272686004638672, -0.3172721862792969, -0.30727577209472656, -0.29727935791015625, -0.28728294372558594, -0.2772865295410156, -0.2672901153564453, -0.257293701171875, -0.2472972869873047, -0.23730087280273438, -0.22730445861816406, -0.21730804443359375, -0.20731163024902344, -0.19731521606445312, -0.1873188018798828, -0.1773223876953125, -0.1673259735107422, -0.15732955932617188, -0.14733314514160156, -0.13733673095703125, -0.12734031677246094, -0.11734390258789062, -0.10734748840332031, -0.09735107421875, -0.08735466003417969, -0.07735824584960938, -0.06736183166503906, -0.05736541748046875, -0.04736900329589844, -0.037372589111328125, -0.027376174926757812, -0.0173797607421875, -0.0073833465576171875, 0.002613067626953125, 0.012609481811523438, 0.02260589599609375, 0.03260231018066406, 0.042598724365234375, 0.05259513854980469, 0.062591552734375, 0.07258796691894531, 0.08258438110351562, 0.09258079528808594, 0.10257720947265625, 0.11257362365722656, 0.12257003784179688, 0.1325664520263672, 0.1425628662109375, 0.1525592803955078, 0.16255569458007812, 0.17255210876464844, 0.18254852294921875, 0.19254493713378906, 0.20254135131835938, 0.2125377655029297, 0.2225341796875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 10.0, 27.0, 131.0, 399.0, 332.0, 68.0, 11.0, 6.0, 5.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9986463785171509, -1.931889295578003, -1.8651320934295654, -1.7983750104904175, -1.7316179275512695, -1.6648608446121216, -1.5981037616729736, -1.5313465595245361, -1.4645894765853882, -1.3978323936462402, -1.3310751914978027, -1.2643181085586548, -1.1975610256195068, -1.1308039426803589, -1.064046859741211, -0.9972896575927734, -0.9305325746536255, -0.8637754917144775, -0.7970183491706848, -0.7302612066268921, -0.6635041236877441, -0.5967470407485962, -0.5299898982048035, -0.46323278546333313, -0.3964756727218628, -0.32971855998039246, -0.2629614472389221, -0.19620433449745178, -0.12944722175598145, -0.06269010901451111, 0.0040670037269592285, 0.07082411646842957, 0.13758111000061035, 0.2043382227420807, 0.271095335483551, 0.33785244822502136, 0.4046095609664917, 0.47136667370796204, 0.5381237864494324, 0.6048809289932251, 0.671638011932373, 0.738395094871521, 0.8051522374153137, 0.8719093799591064, 0.9386664628982544, 1.0054235458374023, 1.0721807479858398, 1.1389378309249878, 1.2056949138641357, 1.2724519968032837, 1.3392090797424316, 1.4059662818908691, 1.472723364830017, 1.539480447769165, 1.6062376499176025, 1.6729947328567505, 1.7397518157958984, 1.8065088987350464, 1.8732659816741943, 1.9400231838226318, 2.0067801475524902, 2.0735373497009277, 2.1402945518493652, 2.2070515155792236, 2.273808717727661]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 5.0, 3.0, 6.0, 6.0, 12.0, 19.0, 24.0, 35.0, 38.0, 48.0, 67.0, 80.0, 98.0, 78.0, 92.0, 67.0, 70.0, 63.0, 37.0, 41.0, 30.0, 26.0, 17.0, 15.0, 11.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5990517735481262, -0.5756936073303223, -0.5523354411125183, -0.5289772748947144, -0.5056191086769104, -0.48226094245910645, -0.4589027762413025, -0.43554461002349854, -0.4121864438056946, -0.3888282775878906, -0.36547011137008667, -0.3421119451522827, -0.31875377893447876, -0.2953956127166748, -0.27203744649887085, -0.2486792653799057, -0.22532108426094055, -0.2019629180431366, -0.17860475182533264, -0.1552465856075287, -0.13188841938972473, -0.10853024572134018, -0.08517207205295563, -0.06181390583515167, -0.03845573961734772, -0.015097571536898613, 0.008260596543550491, 0.031618766486644745, 0.0549769327044487, 0.07833509892225266, 0.10169327259063721, 0.12505143880844116, 0.14840960502624512, 0.17176777124404907, 0.19512593746185303, 0.21848410367965698, 0.24184226989746094, 0.2652004361152649, 0.28855860233306885, 0.3119167685508728, 0.33527493476867676, 0.3586331009864807, 0.38199126720428467, 0.4053494334220886, 0.4287075996398926, 0.45206576585769653, 0.4754239320755005, 0.49878209829330444, 0.5221402645111084, 0.5454984307289124, 0.5688565969467163, 0.5922147631645203, 0.6155729293823242, 0.6389310956001282, 0.6622892618179321, 0.6856474280357361, 0.7090056538581848, 0.7323638200759888, 0.7557219862937927, 0.7790801525115967, 0.8024383187294006, 0.8257964849472046, 0.8491546511650085, 0.8725128173828125, 0.8958709836006165]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 3.0, 6.0, 6.0, 5.0, 7.0, 13.0, 25.0, 15.0, 23.0, 39.0, 59.0, 74.0, 120.0, 154.0, 256.0, 412.0, 670.0, 1316.0, 2903.0, 8057.0, 26664.0, 113082.0, 480292.0, 319815.0, 66865.0, 17218.0, 5661.0, 2168.0, 1056.0, 547.0, 307.0, 192.0, 133.0, 110.0, 79.0, 57.0, 40.0, 22.0, 26.0, 17.0, 9.0, 7.0, 7.0, 5.0, 6.0, 2.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.372802734375, -0.3617820739746094, -0.35076141357421875, -0.3397407531738281, -0.3287200927734375, -0.3176994323730469, -0.30667877197265625, -0.2956581115722656, -0.284637451171875, -0.2736167907714844, -0.26259613037109375, -0.2515754699707031, -0.2405548095703125, -0.22953414916992188, -0.21851348876953125, -0.20749282836914062, -0.19647216796875, -0.18545150756835938, -0.17443084716796875, -0.16341018676757812, -0.1523895263671875, -0.14136886596679688, -0.13034820556640625, -0.11932754516601562, -0.108306884765625, -0.09728622436523438, -0.08626556396484375, -0.07524490356445312, -0.0642242431640625, -0.053203582763671875, -0.04218292236328125, -0.031162261962890625, -0.0201416015625, -0.009120941162109375, 0.00189971923828125, 0.012920379638671875, 0.0239410400390625, 0.034961700439453125, 0.04598236083984375, 0.057003021240234375, 0.068023681640625, 0.07904434204101562, 0.09006500244140625, 0.10108566284179688, 0.1121063232421875, 0.12312698364257812, 0.13414764404296875, 0.14516830444335938, 0.15618896484375, 0.16720962524414062, 0.17823028564453125, 0.18925094604492188, 0.2002716064453125, 0.21129226684570312, 0.22231292724609375, 0.23333358764648438, 0.244354248046875, 0.2553749084472656, 0.26639556884765625, 0.2774162292480469, 0.2884368896484375, 0.2994575500488281, 0.31047821044921875, 0.3214988708496094, 0.33251953125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 2.0, 1.0, 8.0, 17.0, 23.0, 31.0, 39.0, 62.0, 67.0, 86.0, 98.0, 99.0, 101.0, 77.0, 72.0, 75.0, 53.0, 24.0, 30.0, 15.0, 8.0, 8.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2081298828125, -0.2022876739501953, -0.19644546508789062, -0.19060325622558594, -0.18476104736328125, -0.17891883850097656, -0.17307662963867188, -0.1672344207763672, -0.1613922119140625, -0.1555500030517578, -0.14970779418945312, -0.14386558532714844, -0.13802337646484375, -0.13218116760253906, -0.12633895874023438, -0.12049674987792969, -0.114654541015625, -0.10881233215332031, -0.10297012329101562, -0.09712791442871094, -0.09128570556640625, -0.08544349670410156, -0.07960128784179688, -0.07375907897949219, -0.0679168701171875, -0.06207466125488281, -0.056232452392578125, -0.05039024353027344, -0.04454803466796875, -0.03870582580566406, -0.032863616943359375, -0.027021408081054688, -0.02117919921875, -0.015336990356445312, -0.009494781494140625, -0.0036525726318359375, 0.00218963623046875, 0.008031845092773438, 0.013874053955078125, 0.019716262817382812, 0.0255584716796875, 0.03140068054199219, 0.037242889404296875, 0.04308509826660156, 0.04892730712890625, 0.05476951599121094, 0.060611724853515625, 0.06645393371582031, 0.072296142578125, 0.07813835144042969, 0.08398056030273438, 0.08982276916503906, 0.09566497802734375, 0.10150718688964844, 0.10734939575195312, 0.11319160461425781, 0.1190338134765625, 0.12487602233886719, 0.13071823120117188, 0.13656044006347656, 0.14240264892578125, 0.14824485778808594, 0.15408706665039062, 0.1599292755126953, 0.165771484375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 5.0, 3.0, 8.0, 14.0, 12.0, 16.0, 22.0, 39.0, 27.0, 58.0, 82.0, 106.0, 193.0, 261.0, 449.0, 772.0, 1434.0, 3392.0, 9689.0, 36643.0, 172237.0, 541195.0, 218324.0, 44475.0, 11483.0, 3875.0, 1645.0, 808.0, 408.0, 242.0, 183.0, 145.0, 82.0, 53.0, 50.0, 36.0, 25.0, 25.0, 13.0, 9.0, 7.0, 6.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2442626953125, -0.23627281188964844, -0.22828292846679688, -0.2202930450439453, -0.21230316162109375, -0.2043132781982422, -0.19632339477539062, -0.18833351135253906, -0.1803436279296875, -0.17235374450683594, -0.16436386108398438, -0.1563739776611328, -0.14838409423828125, -0.1403942108154297, -0.13240432739257812, -0.12441444396972656, -0.116424560546875, -0.10843467712402344, -0.10044479370117188, -0.09245491027832031, -0.08446502685546875, -0.07647514343261719, -0.06848526000976562, -0.06049537658691406, -0.0525054931640625, -0.04451560974121094, -0.036525726318359375, -0.028535842895507812, -0.02054595947265625, -0.012556076049804688, -0.004566192626953125, 0.0034236907958984375, 0.01141357421875, 0.019403457641601562, 0.027393341064453125, 0.03538322448730469, 0.04337310791015625, 0.05136299133300781, 0.059352874755859375, 0.06734275817871094, 0.0753326416015625, 0.08332252502441406, 0.09131240844726562, 0.09930229187011719, 0.10729217529296875, 0.11528205871582031, 0.12327194213867188, 0.13126182556152344, 0.139251708984375, 0.14724159240722656, 0.15523147583007812, 0.1632213592529297, 0.17121124267578125, 0.1792011260986328, 0.18719100952148438, 0.19518089294433594, 0.2031707763671875, 0.21116065979003906, 0.21915054321289062, 0.2271404266357422, 0.23513031005859375, 0.2431201934814453, 0.2511100769042969, 0.25909996032714844, 0.26708984375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 2.0, 4.0, 8.0, 8.0, 11.0, 14.0, 22.0, 22.0, 25.0, 26.0, 27.0, 34.0, 32.0, 29.0, 38.0, 36.0, 40.0, 39.0, 42.0, 59.0, 41.0, 44.0, 45.0, 42.0, 45.0, 37.0, 32.0, 35.0, 15.0, 21.0, 26.0, 15.0, 16.0, 13.0, 12.0, 12.0, 7.0, 4.0, 5.0, 5.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.433837890625, -0.42200469970703125, -0.4101715087890625, -0.39833831787109375, -0.386505126953125, -0.37467193603515625, -0.3628387451171875, -0.35100555419921875, -0.33917236328125, -0.32733917236328125, -0.3155059814453125, -0.30367279052734375, -0.291839599609375, -0.28000640869140625, -0.2681732177734375, -0.25634002685546875, -0.2445068359375, -0.23267364501953125, -0.2208404541015625, -0.20900726318359375, -0.197174072265625, -0.18534088134765625, -0.1735076904296875, -0.16167449951171875, -0.14984130859375, -0.13800811767578125, -0.1261749267578125, -0.11434173583984375, -0.102508544921875, -0.09067535400390625, -0.0788421630859375, -0.06700897216796875, -0.05517578125, -0.04334259033203125, -0.0315093994140625, -0.01967620849609375, -0.007843017578125, 0.00399017333984375, 0.0158233642578125, 0.02765655517578125, 0.03948974609375, 0.05132293701171875, 0.0631561279296875, 0.07498931884765625, 0.086822509765625, 0.09865570068359375, 0.1104888916015625, 0.12232208251953125, 0.1341552734375, 0.14598846435546875, 0.1578216552734375, 0.16965484619140625, 0.181488037109375, 0.19332122802734375, 0.2051544189453125, 0.21698760986328125, 0.22882080078125, 0.24065399169921875, 0.2524871826171875, 0.26432037353515625, 0.276153564453125, 0.28798675537109375, 0.2998199462890625, 0.31165313720703125, 0.323486328125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 8.0, 11.0, 36.0, 102.0, 415.0, 5786.0, 924535.0, 115932.0, 1462.0, 199.0, 40.0, 20.0, 9.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52197265625, -0.50738525390625, -0.4927978515625, -0.47821044921875, -0.463623046875, -0.44903564453125, -0.4344482421875, -0.41986083984375, -0.4052734375, -0.39068603515625, -0.3760986328125, -0.36151123046875, -0.346923828125, -0.33233642578125, -0.3177490234375, -0.30316162109375, -0.28857421875, -0.27398681640625, -0.2593994140625, -0.24481201171875, -0.230224609375, -0.21563720703125, -0.2010498046875, -0.18646240234375, -0.171875, -0.15728759765625, -0.1427001953125, -0.12811279296875, -0.113525390625, -0.09893798828125, -0.0843505859375, -0.06976318359375, -0.05517578125, -0.04058837890625, -0.0260009765625, -0.01141357421875, 0.003173828125, 0.01776123046875, 0.0323486328125, 0.04693603515625, 0.0615234375, 0.07611083984375, 0.0906982421875, 0.10528564453125, 0.119873046875, 0.13446044921875, 0.1490478515625, 0.16363525390625, 0.17822265625, 0.19281005859375, 0.2073974609375, 0.22198486328125, 0.236572265625, 0.25115966796875, 0.2657470703125, 0.28033447265625, 0.294921875, 0.30950927734375, 0.3240966796875, 0.33868408203125, 0.353271484375, 0.36785888671875, 0.3824462890625, 0.39703369140625, 0.41162109375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 6.0, 10.0, 27.0, 32.0, 53.0, 93.0, 109.0, 220.0, 176.0, 100.0, 65.0, 47.0, 34.0, 16.0, 9.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002999305725097656, -0.00028908252716064453, -0.00027823448181152344, -0.00026738643646240234, -0.00025653839111328125, -0.00024569034576416016, -0.00023484230041503906, -0.00022399425506591797, -0.00021314620971679688, -0.00020229816436767578, -0.0001914501190185547, -0.0001806020736694336, -0.0001697540283203125, -0.0001589059829711914, -0.0001480579376220703, -0.00013720989227294922, -0.00012636184692382812, -0.00011551380157470703, -0.00010466575622558594, -9.381771087646484e-05, -8.296966552734375e-05, -7.212162017822266e-05, -6.127357482910156e-05, -5.042552947998047e-05, -3.9577484130859375e-05, -2.872943878173828e-05, -1.7881393432617188e-05, -7.033348083496094e-06, 3.814697265625e-06, 1.4662742614746094e-05, 2.5510787963867188e-05, 3.635883331298828e-05, 4.7206878662109375e-05, 5.805492401123047e-05, 6.890296936035156e-05, 7.975101470947266e-05, 9.059906005859375e-05, 0.00010144710540771484, 0.00011229515075683594, 0.00012314319610595703, 0.00013399124145507812, 0.00014483928680419922, 0.0001556873321533203, 0.0001665353775024414, 0.0001773834228515625, 0.0001882314682006836, 0.0001990795135498047, 0.00020992755889892578, 0.00022077560424804688, 0.00023162364959716797, 0.00024247169494628906, 0.00025331974029541016, 0.00026416778564453125, 0.00027501583099365234, 0.00028586387634277344, 0.00029671192169189453, 0.0003075599670410156, 0.0003184080123901367, 0.0003292560577392578, 0.0003401041030883789, 0.0003509521484375, 0.0003618001937866211, 0.0003726482391357422, 0.0003834962844848633, 0.0003943443298339844]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 5.0, 3.0, 6.0, 9.0, 20.0, 29.0, 56.0, 111.0, 200.0, 553.0, 2651.0, 41972.0, 873104.0, 123915.0, 4685.0, 766.0, 221.0, 105.0, 64.0, 38.0, 15.0, 15.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3017578125, -0.29278564453125, -0.2838134765625, -0.27484130859375, -0.265869140625, -0.25689697265625, -0.2479248046875, -0.23895263671875, -0.22998046875, -0.22100830078125, -0.2120361328125, -0.20306396484375, -0.194091796875, -0.18511962890625, -0.1761474609375, -0.16717529296875, -0.158203125, -0.14923095703125, -0.1402587890625, -0.13128662109375, -0.122314453125, -0.11334228515625, -0.1043701171875, -0.09539794921875, -0.08642578125, -0.07745361328125, -0.0684814453125, -0.05950927734375, -0.050537109375, -0.04156494140625, -0.0325927734375, -0.02362060546875, -0.0146484375, -0.00567626953125, 0.0032958984375, 0.01226806640625, 0.021240234375, 0.03021240234375, 0.0391845703125, 0.04815673828125, 0.05712890625, 0.06610107421875, 0.0750732421875, 0.08404541015625, 0.093017578125, 0.10198974609375, 0.1109619140625, 0.11993408203125, 0.12890625, 0.13787841796875, 0.1468505859375, 0.15582275390625, 0.164794921875, 0.17376708984375, 0.1827392578125, 0.19171142578125, 0.20068359375, 0.20965576171875, 0.2186279296875, 0.22760009765625, 0.236572265625, 0.24554443359375, 0.2545166015625, 0.26348876953125, 0.2724609375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 4.0, 4.0, 17.0, 50.0, 106.0, 186.0, 244.0, 204.0, 119.0, 50.0, 12.0, 9.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.56689453125, -0.5556869506835938, -0.5444793701171875, -0.5332717895507812, -0.522064208984375, -0.5108566284179688, -0.4996490478515625, -0.48844146728515625, -0.47723388671875, -0.46602630615234375, -0.4548187255859375, -0.44361114501953125, -0.432403564453125, -0.42119598388671875, -0.4099884033203125, -0.39878082275390625, -0.3875732421875, -0.37636566162109375, -0.3651580810546875, -0.35395050048828125, -0.342742919921875, -0.33153533935546875, -0.3203277587890625, -0.30912017822265625, -0.29791259765625, -0.28670501708984375, -0.2754974365234375, -0.26428985595703125, -0.253082275390625, -0.24187469482421875, -0.2306671142578125, -0.21945953369140625, -0.208251953125, -0.19704437255859375, -0.1858367919921875, -0.17462921142578125, -0.163421630859375, -0.15221405029296875, -0.1410064697265625, -0.12979888916015625, -0.11859130859375, -0.10738372802734375, -0.0961761474609375, -0.08496856689453125, -0.073760986328125, -0.06255340576171875, -0.0513458251953125, -0.04013824462890625, -0.0289306640625, -0.01772308349609375, -0.0065155029296875, 0.00469207763671875, 0.015899658203125, 0.02710723876953125, 0.0383148193359375, 0.04952239990234375, 0.06072998046875, 0.07193756103515625, 0.0831451416015625, 0.09435272216796875, 0.105560302734375, 0.11676788330078125, 0.1279754638671875, 0.13918304443359375, 0.150390625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 8.0, 21.0, 31.0, 103.0, 245.0, 277.0, 187.0, 79.0, 30.0, 9.0, 4.0, 2.0, 3.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.837831020355225, -5.712147235870361, -5.586463451385498, -5.460780143737793, -5.33509635925293, -5.209412574768066, -5.083728790283203, -4.95804500579834, -4.832361221313477, -4.706677436828613, -4.58099365234375, -4.455310344696045, -4.329626560211182, -4.203942775726318, -4.078258991241455, -3.952575206756592, -3.8268918991088867, -3.7012081146240234, -3.5755245685577393, -3.449840784072876, -3.324157238006592, -3.1984734535217285, -3.0727896690368652, -2.947105884552002, -2.8214223384857178, -2.6957385540008545, -2.5700550079345703, -2.444371223449707, -2.3186874389648438, -2.1930038928985596, -2.0673201084136963, -1.9416364431381226, -1.815953254699707, -1.6902695894241333, -1.5645859241485596, -1.4389021396636963, -1.3132184743881226, -1.1875348091125488, -1.0618510246276855, -0.9361673593521118, -0.8104836940765381, -0.6848000288009644, -0.5591163039207458, -0.43343260884284973, -0.3077489137649536, -0.18206524848937988, -0.05638152360916138, 0.06930220127105713, 0.19498586654663086, 0.320669561624527, 0.4463532567024231, 0.5720369815826416, 0.6977206468582153, 0.8234043121337891, 0.9490880370140076, 1.074771761894226, 1.2004554271697998, 1.3261390924453735, 1.4518227577209473, 1.5775065422058105, 1.7031902074813843, 1.828873872756958, 1.9545576572418213, 2.0802412033081055, 2.2059249877929688]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 11.0, 6.0, 7.0, 11.0, 15.0, 13.0, 13.0, 18.0, 20.0, 21.0, 25.0, 28.0, 35.0, 32.0, 41.0, 41.0, 40.0, 27.0, 31.0, 42.0, 45.0, 40.0, 43.0, 43.0, 41.0, 30.0, 26.0, 31.0, 38.0, 28.0, 17.0, 21.0, 20.0, 13.0, 22.0, 12.0, 9.0, 12.0, 8.0, 11.0, 9.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.745201587677002, -1.6897183656692505, -1.6342350244522095, -1.578751802444458, -1.523268461227417, -1.4677852392196655, -1.412302017211914, -1.356818675994873, -1.3013354539871216, -1.2458522319793701, -1.190368890762329, -1.1348856687545776, -1.0794024467468262, -1.0239191055297852, -0.9684358835220337, -0.9129526019096375, -0.8574693202972412, -0.801986038684845, -0.7465027570724487, -0.6910195350646973, -0.635536253452301, -0.5800529718399048, -0.5245697498321533, -0.4690864682197571, -0.41360318660736084, -0.3581199049949646, -0.30263665318489075, -0.2471533864736557, -0.19167011976242065, -0.13618683815002441, -0.08070358633995056, -0.02522033452987671, 0.03026282787322998, 0.08574609458446503, 0.14122936129570007, 0.19671262800693512, 0.25219589471817017, 0.3076791763305664, 0.36316242814064026, 0.4186456799507141, 0.47412896156311035, 0.5296122431755066, 0.5850955247879028, 0.6405787467956543, 0.6960620284080505, 0.7515453100204468, 0.8070285320281982, 0.8625118136405945, 0.9179950952529907, 0.973478376865387, 1.0289616584777832, 1.0844448804855347, 1.1399281024932861, 1.1954114437103271, 1.2508946657180786, 1.30637788772583, 1.361861228942871, 1.4173444509506226, 1.4728277921676636, 1.528311014175415, 1.583794355392456, 1.6392775774002075, 1.694760799407959, 1.750244140625, 1.8057273626327515]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 8.0, 7.0, 5.0, 9.0, 4.0, 13.0, 20.0, 14.0, 33.0, 58.0, 58.0, 141.0, 270.0, 485.0, 965.0, 2115.0, 5613.0, 18651.0, 155817.0, 3941878.0, 50926.0, 10419.0, 3612.0, 1532.0, 708.0, 356.0, 193.0, 99.0, 87.0, 58.0, 33.0, 30.0, 19.0, 15.0, 9.0, 13.0, 4.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.74267578125, -0.7216339111328125, -0.700592041015625, -0.6795501708984375, -0.65850830078125, -0.6374664306640625, -0.616424560546875, -0.5953826904296875, -0.5743408203125, -0.5532989501953125, -0.532257080078125, -0.5112152099609375, -0.49017333984375, -0.4691314697265625, -0.448089599609375, -0.4270477294921875, -0.406005859375, -0.3849639892578125, -0.363922119140625, -0.3428802490234375, -0.32183837890625, -0.3007965087890625, -0.279754638671875, -0.2587127685546875, -0.2376708984375, -0.2166290283203125, -0.195587158203125, -0.1745452880859375, -0.15350341796875, -0.1324615478515625, -0.111419677734375, -0.0903778076171875, -0.0693359375, -0.0482940673828125, -0.027252197265625, -0.0062103271484375, 0.01483154296875, 0.0358734130859375, 0.056915283203125, 0.0779571533203125, 0.0989990234375, 0.1200408935546875, 0.141082763671875, 0.1621246337890625, 0.18316650390625, 0.2042083740234375, 0.225250244140625, 0.2462921142578125, 0.267333984375, 0.2883758544921875, 0.309417724609375, 0.3304595947265625, 0.35150146484375, 0.3725433349609375, 0.393585205078125, 0.4146270751953125, 0.4356689453125, 0.4567108154296875, 0.477752685546875, 0.4987945556640625, 0.51983642578125, 0.5408782958984375, 0.561920166015625, 0.5829620361328125, 0.60400390625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 2.0, 3.0, 8.0, 9.0, 18.0, 23.0, 42.0, 44.0, 60.0, 70.0, 71.0, 83.0, 88.0, 75.0, 75.0, 70.0, 74.0, 61.0, 34.0, 27.0, 26.0, 18.0, 11.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2109375, -0.205047607421875, -0.19915771484375, -0.193267822265625, -0.1873779296875, -0.181488037109375, -0.17559814453125, -0.169708251953125, -0.163818359375, -0.157928466796875, -0.15203857421875, -0.146148681640625, -0.1402587890625, -0.134368896484375, -0.12847900390625, -0.122589111328125, -0.11669921875, -0.110809326171875, -0.10491943359375, -0.099029541015625, -0.0931396484375, -0.087249755859375, -0.08135986328125, -0.075469970703125, -0.069580078125, -0.063690185546875, -0.05780029296875, -0.051910400390625, -0.0460205078125, -0.040130615234375, -0.03424072265625, -0.028350830078125, -0.0224609375, -0.016571044921875, -0.01068115234375, -0.004791259765625, 0.0010986328125, 0.006988525390625, 0.01287841796875, 0.018768310546875, 0.024658203125, 0.030548095703125, 0.03643798828125, 0.042327880859375, 0.0482177734375, 0.054107666015625, 0.05999755859375, 0.065887451171875, 0.07177734375, 0.077667236328125, 0.08355712890625, 0.089447021484375, 0.0953369140625, 0.101226806640625, 0.10711669921875, 0.113006591796875, 0.118896484375, 0.124786376953125, 0.13067626953125, 0.136566162109375, 0.1424560546875, 0.148345947265625, 0.15423583984375, 0.160125732421875, 0.166015625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 7.0, 6.0, 4.0, 10.0, 21.0, 22.0, 55.0, 60.0, 96.0, 157.0, 270.0, 430.0, 831.0, 1732.0, 4578.0, 20253.0, 389999.0, 3727023.0, 37437.0, 6777.0, 2179.0, 995.0, 523.0, 296.0, 171.0, 130.0, 81.0, 48.0, 36.0, 20.0, 19.0, 6.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5810546875, -0.5624008178710938, -0.5437469482421875, -0.5250930786132812, -0.506439208984375, -0.48778533935546875, -0.4691314697265625, -0.45047760009765625, -0.43182373046875, -0.41316986083984375, -0.3945159912109375, -0.37586212158203125, -0.357208251953125, -0.33855438232421875, -0.3199005126953125, -0.30124664306640625, -0.2825927734375, -0.26393890380859375, -0.2452850341796875, -0.22663116455078125, -0.207977294921875, -0.18932342529296875, -0.1706695556640625, -0.15201568603515625, -0.13336181640625, -0.11470794677734375, -0.0960540771484375, -0.07740020751953125, -0.058746337890625, -0.04009246826171875, -0.0214385986328125, -0.00278472900390625, 0.015869140625, 0.03452301025390625, 0.0531768798828125, 0.07183074951171875, 0.090484619140625, 0.10913848876953125, 0.1277923583984375, 0.14644622802734375, 0.16510009765625, 0.18375396728515625, 0.2024078369140625, 0.22106170654296875, 0.239715576171875, 0.25836944580078125, 0.2770233154296875, 0.29567718505859375, 0.3143310546875, 0.33298492431640625, 0.3516387939453125, 0.37029266357421875, 0.388946533203125, 0.40760040283203125, 0.4262542724609375, 0.44490814208984375, 0.46356201171875, 0.48221588134765625, 0.5008697509765625, 0.5195236206054688, 0.538177490234375, 0.5568313598632812, 0.5754852294921875, 0.5941390991210938, 0.61279296875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 11.0, 8.0, 14.0, 16.0, 45.0, 86.0, 506.0, 3039.0, 225.0, 66.0, 24.0, 12.0, 8.0, 6.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.54541015625, -0.5318679809570312, -0.5183258056640625, -0.5047836303710938, -0.491241455078125, -0.47769927978515625, -0.4641571044921875, -0.45061492919921875, -0.43707275390625, -0.42353057861328125, -0.4099884033203125, -0.39644622802734375, -0.382904052734375, -0.36936187744140625, -0.3558197021484375, -0.34227752685546875, -0.3287353515625, -0.31519317626953125, -0.3016510009765625, -0.28810882568359375, -0.274566650390625, -0.26102447509765625, -0.2474822998046875, -0.23394012451171875, -0.22039794921875, -0.20685577392578125, -0.1933135986328125, -0.17977142333984375, -0.166229248046875, -0.15268707275390625, -0.1391448974609375, -0.12560272216796875, -0.112060546875, -0.09851837158203125, -0.0849761962890625, -0.07143402099609375, -0.057891845703125, -0.04434967041015625, -0.0308074951171875, -0.01726531982421875, -0.00372314453125, 0.00981903076171875, 0.0233612060546875, 0.03690338134765625, 0.050445556640625, 0.06398773193359375, 0.0775299072265625, 0.09107208251953125, 0.1046142578125, 0.11815643310546875, 0.1316986083984375, 0.14524078369140625, 0.158782958984375, 0.17232513427734375, 0.1858673095703125, 0.19940948486328125, 0.21295166015625, 0.22649383544921875, 0.2400360107421875, 0.25357818603515625, 0.267120361328125, 0.28066253662109375, 0.2942047119140625, 0.30774688720703125, 0.3212890625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 6.0, 14.0, 36.0, 170.0, 467.0, 232.0, 49.0, 7.0, 10.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.968031883239746, -3.87689208984375, -3.785752296447754, -3.694612503051758, -3.6034727096557617, -3.5123326778411865, -3.4211928844451904, -3.3300530910491943, -3.2389132976531982, -3.147773504257202, -3.056633710861206, -2.96549391746521, -2.8743538856506348, -2.7832140922546387, -2.6920742988586426, -2.6009345054626465, -2.5097947120666504, -2.4186549186706543, -2.327515125274658, -2.236375331878662, -2.145235538482666, -2.054095506668091, -1.9629557132720947, -1.8718159198760986, -1.7806761264801025, -1.6895363330841064, -1.5983965396881104, -1.5072566270828247, -1.4161168336868286, -1.3249770402908325, -1.2338371276855469, -1.1426973342895508, -1.0515577793121338, -0.9604179859161377, -0.8692781329154968, -0.778138279914856, -0.6869984865188599, -0.5958586931228638, -0.5047188401222229, -0.41357898712158203, -0.32243919372558594, -0.23129937052726746, -0.14015954732894897, -0.04901972413063049, 0.04212009906768799, 0.13325992226600647, 0.22439974546432495, 0.3155395984649658, 0.4066793918609619, 0.4978192150592804, 0.5889590382575989, 0.6800988912582397, 0.7712386846542358, 0.8623784780502319, 0.9535183310508728, 1.0446581840515137, 1.1357979774475098, 1.2269377708435059, 1.318077564239502, 1.4092174768447876, 1.5003572702407837, 1.5914970636367798, 1.6826369762420654, 1.7737767696380615, 1.8649165630340576]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 6.0, 4.0, 5.0, 9.0, 10.0, 15.0, 17.0, 16.0, 31.0, 31.0, 36.0, 42.0, 50.0, 54.0, 49.0, 68.0, 59.0, 54.0, 59.0, 40.0, 46.0, 57.0, 39.0, 33.0, 30.0, 27.0, 31.0, 25.0, 18.0, 13.0, 5.0, 9.0, 7.0, 3.0, 1.0, 0.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6551198363304138, -0.6312218904495239, -0.6073240041732788, -0.5834261178970337, -0.5595281720161438, -0.5356302261352539, -0.5117323398590088, -0.4878344237804413, -0.4639365077018738, -0.4400385916233063, -0.41614067554473877, -0.39224275946617126, -0.36834484338760376, -0.34444692730903625, -0.32054901123046875, -0.29665109515190125, -0.27275317907333374, -0.24885526299476624, -0.22495734691619873, -0.20105943083763123, -0.17716151475906372, -0.15326359868049622, -0.1293656826019287, -0.1054677665233612, -0.0815698504447937, -0.057671934366226196, -0.03377401828765869, -0.009876102209091187, 0.014021813869476318, 0.03791972994804382, 0.06181764602661133, 0.08571556210517883, 0.10961341857910156, 0.13351133465766907, 0.15740925073623657, 0.18130716681480408, 0.20520508289337158, 0.2291029989719391, 0.2530009150505066, 0.2768988311290741, 0.3007967472076416, 0.3246946632862091, 0.3485925793647766, 0.3724904954433441, 0.3963884115219116, 0.4202863276004791, 0.44418424367904663, 0.46808215975761414, 0.49198007583618164, 0.5158779621124268, 0.5397759079933167, 0.5636738538742065, 0.5875717401504517, 0.6114696264266968, 0.6353675723075867, 0.6592655181884766, 0.6831634044647217, 0.7070612907409668, 0.7309592366218567, 0.7548571825027466, 0.7787550687789917, 0.8026529550552368, 0.8265509009361267, 0.8504488468170166, 0.8743467330932617]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 9.0, 13.0, 21.0, 25.0, 44.0, 90.0, 195.0, 371.0, 995.0, 3540.0, 28818.0, 684001.0, 312748.0, 14004.0, 2321.0, 719.0, 309.0, 157.0, 90.0, 31.0, 20.0, 13.0, 12.0, 5.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85888671875, -0.8335189819335938, -0.8081512451171875, -0.7827835083007812, -0.757415771484375, -0.7320480346679688, -0.7066802978515625, -0.6813125610351562, -0.65594482421875, -0.6305770874023438, -0.6052093505859375, -0.5798416137695312, -0.554473876953125, -0.5291061401367188, -0.5037384033203125, -0.47837066650390625, -0.4530029296875, -0.42763519287109375, -0.4022674560546875, -0.37689971923828125, -0.351531982421875, -0.32616424560546875, -0.3007965087890625, -0.27542877197265625, -0.25006103515625, -0.22469329833984375, -0.1993255615234375, -0.17395782470703125, -0.148590087890625, -0.12322235107421875, -0.0978546142578125, -0.07248687744140625, -0.047119140625, -0.02175140380859375, 0.0036163330078125, 0.02898406982421875, 0.054351806640625, 0.07971954345703125, 0.1050872802734375, 0.13045501708984375, 0.15582275390625, 0.18119049072265625, 0.2065582275390625, 0.23192596435546875, 0.257293701171875, 0.28266143798828125, 0.3080291748046875, 0.33339691162109375, 0.3587646484375, 0.38413238525390625, 0.4095001220703125, 0.43486785888671875, 0.460235595703125, 0.48560333251953125, 0.5109710693359375, 0.5363388061523438, 0.56170654296875, 0.5870742797851562, 0.6124420166015625, 0.6378097534179688, 0.663177490234375, 0.6885452270507812, 0.7139129638671875, 0.7392807006835938, 0.7646484375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 6.0, 7.0, 6.0, 11.0, 17.0, 34.0, 44.0, 57.0, 74.0, 64.0, 72.0, 73.0, 91.0, 87.0, 88.0, 53.0, 66.0, 56.0, 29.0, 24.0, 12.0, 17.0, 10.0, 0.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.221435546875, -0.21514892578125, -0.2088623046875, -0.20257568359375, -0.1962890625, -0.19000244140625, -0.1837158203125, -0.17742919921875, -0.171142578125, -0.16485595703125, -0.1585693359375, -0.15228271484375, -0.14599609375, -0.13970947265625, -0.1334228515625, -0.12713623046875, -0.120849609375, -0.11456298828125, -0.1082763671875, -0.10198974609375, -0.095703125, -0.08941650390625, -0.0831298828125, -0.07684326171875, -0.070556640625, -0.06427001953125, -0.0579833984375, -0.05169677734375, -0.04541015625, -0.03912353515625, -0.0328369140625, -0.02655029296875, -0.020263671875, -0.01397705078125, -0.0076904296875, -0.00140380859375, 0.0048828125, 0.01116943359375, 0.0174560546875, 0.02374267578125, 0.030029296875, 0.03631591796875, 0.0426025390625, 0.04888916015625, 0.05517578125, 0.06146240234375, 0.0677490234375, 0.07403564453125, 0.080322265625, 0.08660888671875, 0.0928955078125, 0.09918212890625, 0.10546875, 0.11175537109375, 0.1180419921875, 0.12432861328125, 0.130615234375, 0.13690185546875, 0.1431884765625, 0.14947509765625, 0.15576171875, 0.16204833984375, 0.1683349609375, 0.17462158203125, 0.180908203125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 6.0, 3.0, 3.0, 26.0, 18.0, 25.0, 48.0, 84.0, 137.0, 214.0, 388.0, 825.0, 2079.0, 7520.0, 49578.0, 583976.0, 364060.0, 30900.0, 5451.0, 1672.0, 716.0, 356.0, 181.0, 95.0, 64.0, 41.0, 34.0, 20.0, 15.0, 11.0, 4.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.450927734375, -0.43721771240234375, -0.4235076904296875, -0.40979766845703125, -0.396087646484375, -0.38237762451171875, -0.3686676025390625, -0.35495758056640625, -0.34124755859375, -0.32753753662109375, -0.3138275146484375, -0.30011749267578125, -0.286407470703125, -0.27269744873046875, -0.2589874267578125, -0.24527740478515625, -0.2315673828125, -0.21785736083984375, -0.2041473388671875, -0.19043731689453125, -0.176727294921875, -0.16301727294921875, -0.1493072509765625, -0.13559722900390625, -0.12188720703125, -0.10817718505859375, -0.0944671630859375, -0.08075714111328125, -0.067047119140625, -0.05333709716796875, -0.0396270751953125, -0.02591705322265625, -0.01220703125, 0.00150299072265625, 0.0152130126953125, 0.02892303466796875, 0.042633056640625, 0.05634307861328125, 0.0700531005859375, 0.08376312255859375, 0.09747314453125, 0.11118316650390625, 0.1248931884765625, 0.13860321044921875, 0.152313232421875, 0.16602325439453125, 0.1797332763671875, 0.19344329833984375, 0.2071533203125, 0.22086334228515625, 0.2345733642578125, 0.24828338623046875, 0.261993408203125, 0.27570343017578125, 0.2894134521484375, 0.30312347412109375, 0.31683349609375, 0.33054351806640625, 0.3442535400390625, 0.35796356201171875, 0.371673583984375, 0.38538360595703125, 0.3990936279296875, 0.41280364990234375, 0.426513671875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 7.0, 4.0, 11.0, 12.0, 11.0, 12.0, 18.0, 33.0, 29.0, 36.0, 39.0, 58.0, 48.0, 47.0, 47.0, 64.0, 51.0, 56.0, 62.0, 49.0, 53.0, 44.0, 40.0, 26.0, 36.0, 25.0, 24.0, 23.0, 12.0, 4.0, 8.0, 8.0, 3.0, 8.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.478271484375, -0.4603157043457031, -0.44235992431640625, -0.4244041442871094, -0.4064483642578125, -0.3884925842285156, -0.37053680419921875, -0.3525810241699219, -0.334625244140625, -0.3166694641113281, -0.29871368408203125, -0.2807579040527344, -0.2628021240234375, -0.24484634399414062, -0.22689056396484375, -0.20893478393554688, -0.19097900390625, -0.17302322387695312, -0.15506744384765625, -0.13711166381835938, -0.1191558837890625, -0.10120010375976562, -0.08324432373046875, -0.06528854370117188, -0.047332763671875, -0.029376983642578125, -0.01142120361328125, 0.006534576416015625, 0.0244903564453125, 0.042446136474609375, 0.06040191650390625, 0.07835769653320312, 0.0963134765625, 0.11426925659179688, 0.13222503662109375, 0.15018081665039062, 0.1681365966796875, 0.18609237670898438, 0.20404815673828125, 0.22200393676757812, 0.239959716796875, 0.2579154968261719, 0.27587127685546875, 0.2938270568847656, 0.3117828369140625, 0.3297386169433594, 0.34769439697265625, 0.3656501770019531, 0.38360595703125, 0.4015617370605469, 0.41951751708984375, 0.4374732971191406, 0.4554290771484375, 0.4733848571777344, 0.49134063720703125, 0.5092964172363281, 0.527252197265625, 0.5452079772949219, 0.5631637573242188, 0.5811195373535156, 0.5990753173828125, 0.6170310974121094, 0.6349868774414062, 0.6529426574707031, 0.6708984375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 7.0, 8.0, 20.0, 49.0, 90.0, 225.0, 667.0, 3176.0, 38517.0, 849630.0, 147948.0, 6530.0, 1113.0, 343.0, 118.0, 54.0, 26.0, 12.0, 6.0, 7.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.322021484375, -0.31324195861816406, -0.3044624328613281, -0.2956829071044922, -0.28690338134765625, -0.2781238555908203, -0.2693443298339844, -0.26056480407714844, -0.2517852783203125, -0.24300575256347656, -0.23422622680664062, -0.2254467010498047, -0.21666717529296875, -0.2078876495361328, -0.19910812377929688, -0.19032859802246094, -0.181549072265625, -0.17276954650878906, -0.16399002075195312, -0.1552104949951172, -0.14643096923828125, -0.1376514434814453, -0.12887191772460938, -0.12009239196777344, -0.1113128662109375, -0.10253334045410156, -0.09375381469726562, -0.08497428894042969, -0.07619476318359375, -0.06741523742675781, -0.058635711669921875, -0.04985618591308594, -0.04107666015625, -0.03229713439941406, -0.023517608642578125, -0.014738082885742188, -0.00595855712890625, 0.0028209686279296875, 0.011600494384765625, 0.020380020141601562, 0.0291595458984375, 0.03793907165527344, 0.046718597412109375, 0.05549812316894531, 0.06427764892578125, 0.07305717468261719, 0.08183670043945312, 0.09061622619628906, 0.099395751953125, 0.10817527770996094, 0.11695480346679688, 0.1257343292236328, 0.13451385498046875, 0.1432933807373047, 0.15207290649414062, 0.16085243225097656, 0.1696319580078125, 0.17841148376464844, 0.18719100952148438, 0.1959705352783203, 0.20475006103515625, 0.2135295867919922, 0.22230911254882812, 0.23108863830566406, 0.2398681640625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 2.0, 5.0, 4.0, 6.0, 5.0, 12.0, 10.0, 15.0, 17.0, 21.0, 27.0, 33.0, 54.0, 63.0, 70.0, 101.0, 104.0, 93.0, 75.0, 58.0, 50.0, 36.0, 22.0, 27.0, 25.0, 15.0, 7.0, 16.0, 5.0, 7.0, 7.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00014388561248779297, -0.0001390315592288971, -0.00013417750597000122, -0.00012932345271110535, -0.00012446939945220947, -0.0001196153461933136, -0.00011476129293441772, -0.00010990723967552185, -0.00010505318641662598, -0.0001001991331577301, -9.534507989883423e-05, -9.049102663993835e-05, -8.563697338104248e-05, -8.07829201221466e-05, -7.592886686325073e-05, -7.107481360435486e-05, -6.622076034545898e-05, -6.136670708656311e-05, -5.6512653827667236e-05, -5.165860056877136e-05, -4.680454730987549e-05, -4.1950494050979614e-05, -3.709644079208374e-05, -3.2242387533187866e-05, -2.7388334274291992e-05, -2.2534281015396118e-05, -1.7680227756500244e-05, -1.282617449760437e-05, -7.972121238708496e-06, -3.118067979812622e-06, 1.735985279083252e-06, 6.590038537979126e-06, 1.1444091796875e-05, 1.6298145055770874e-05, 2.1152198314666748e-05, 2.6006251573562622e-05, 3.0860304832458496e-05, 3.571435809135437e-05, 4.0568411350250244e-05, 4.542246460914612e-05, 5.027651786804199e-05, 5.5130571126937866e-05, 5.998462438583374e-05, 6.483867764472961e-05, 6.969273090362549e-05, 7.454678416252136e-05, 7.940083742141724e-05, 8.425489068031311e-05, 8.910894393920898e-05, 9.396299719810486e-05, 9.881705045700073e-05, 0.0001036711037158966, 0.00010852515697479248, 0.00011337921023368835, 0.00011823326349258423, 0.0001230873167514801, 0.00012794137001037598, 0.00013279542326927185, 0.00013764947652816772, 0.0001425035297870636, 0.00014735758304595947, 0.00015221163630485535, 0.00015706568956375122, 0.0001619197428226471, 0.00016677379608154297]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 6.0, 16.0, 17.0, 49.0, 88.0, 229.0, 715.0, 3580.0, 77920.0, 920452.0, 41801.0, 2787.0, 512.0, 223.0, 76.0, 41.0, 19.0, 13.0, 6.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.292236328125, -0.2819557189941406, -0.27167510986328125, -0.2613945007324219, -0.2511138916015625, -0.24083328247070312, -0.23055267333984375, -0.22027206420898438, -0.209991455078125, -0.19971084594726562, -0.18943023681640625, -0.17914962768554688, -0.1688690185546875, -0.15858840942382812, -0.14830780029296875, -0.13802719116210938, -0.12774658203125, -0.11746597290039062, -0.10718536376953125, -0.09690475463867188, -0.0866241455078125, -0.07634353637695312, -0.06606292724609375, -0.055782318115234375, -0.045501708984375, -0.035221099853515625, -0.02494049072265625, -0.014659881591796875, -0.0043792724609375, 0.005901336669921875, 0.01618194580078125, 0.026462554931640625, 0.0367431640625, 0.047023773193359375, 0.05730438232421875, 0.06758499145507812, 0.0778656005859375, 0.08814620971679688, 0.09842681884765625, 0.10870742797851562, 0.118988037109375, 0.12926864624023438, 0.13954925537109375, 0.14982986450195312, 0.1601104736328125, 0.17039108276367188, 0.18067169189453125, 0.19095230102539062, 0.20123291015625, 0.21151351928710938, 0.22179412841796875, 0.23207473754882812, 0.2423553466796875, 0.2526359558105469, 0.26291656494140625, 0.2731971740722656, 0.283477783203125, 0.2937583923339844, 0.30403900146484375, 0.3143196105957031, 0.3246002197265625, 0.3348808288574219, 0.34516143798828125, 0.3554420471191406, 0.36572265625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 1.0, 4.0, 11.0, 8.0, 18.0, 47.0, 62.0, 130.0, 153.0, 187.0, 138.0, 93.0, 73.0, 36.0, 13.0, 11.0, 7.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1502685546875, -0.14160728454589844, -0.13294601440429688, -0.12428474426269531, -0.11562347412109375, -0.10696220397949219, -0.09830093383789062, -0.08963966369628906, -0.0809783935546875, -0.07231712341308594, -0.06365585327148438, -0.05499458312988281, -0.04633331298828125, -0.03767204284667969, -0.029010772705078125, -0.020349502563476562, -0.011688232421875, -0.0030269622802734375, 0.005634307861328125, 0.014295578002929688, 0.02295684814453125, 0.03161811828613281, 0.040279388427734375, 0.04894065856933594, 0.0576019287109375, 0.06626319885253906, 0.07492446899414062, 0.08358573913574219, 0.09224700927734375, 0.10090827941894531, 0.10956954956054688, 0.11823081970214844, 0.12689208984375, 0.13555335998535156, 0.14421463012695312, 0.1528759002685547, 0.16153717041015625, 0.1701984405517578, 0.17885971069335938, 0.18752098083496094, 0.1961822509765625, 0.20484352111816406, 0.21350479125976562, 0.2221660614013672, 0.23082733154296875, 0.2394886016845703, 0.24814987182617188, 0.25681114196777344, 0.265472412109375, 0.27413368225097656, 0.2827949523925781, 0.2914562225341797, 0.30011749267578125, 0.3087787628173828, 0.3174400329589844, 0.32610130310058594, 0.3347625732421875, 0.34342384338378906, 0.3520851135253906, 0.3607463836669922, 0.36940765380859375, 0.3780689239501953, 0.3867301940917969, 0.39539146423339844, 0.404052734375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 7.0, 28.0, 54.0, 112.0, 204.0, 240.0, 179.0, 94.0, 38.0, 13.0, 14.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6615819931030273, -3.5490167140960693, -3.4364516735076904, -3.3238863945007324, -3.2113211154937744, -3.0987558364868164, -2.9861907958984375, -2.8736255168914795, -2.7610602378845215, -2.6484949588775635, -2.5359299182891846, -2.4233646392822266, -2.3107993602752686, -2.1982340812683105, -2.0856690406799316, -1.9731037616729736, -1.8605386018753052, -1.7479734420776367, -1.6354081630706787, -1.5228430032730103, -1.4102777242660522, -1.2977125644683838, -1.1851472854614258, -1.0725821256637573, -0.9600169062614441, -0.8474516868591309, -0.7348864674568176, -0.6223212480545044, -0.5097560882568359, -0.3971908688545227, -0.2846256494522095, -0.17206043004989624, -0.05949521064758301, 0.05307000130414963, 0.16563521325588226, 0.2782004177570343, 0.39076563715934753, 0.5033308267593384, 0.6158960461616516, 0.7284612655639648, 0.8410264849662781, 0.9535917043685913, 1.0661568641662598, 1.1787221431732178, 1.2912873029708862, 1.4038524627685547, 1.5164177417755127, 1.6289830207824707, 1.7415481805801392, 1.8541133403778076, 1.9666786193847656, 2.0792438983917236, 2.1918089389801025, 2.3043742179870605, 2.4169394969940186, 2.5295047760009766, 2.6420698165893555, 2.7546350955963135, 2.8672001361846924, 2.9797654151916504, 3.0923306941986084, 3.2048959732055664, 3.3174610137939453, 3.4300262928009033, 3.5425915718078613]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 8.0, 2.0, 7.0, 8.0, 13.0, 13.0, 17.0, 11.0, 19.0, 16.0, 24.0, 27.0, 23.0, 40.0, 38.0, 37.0, 38.0, 44.0, 43.0, 51.0, 42.0, 34.0, 37.0, 49.0, 45.0, 48.0, 36.0, 36.0, 16.0, 26.0, 26.0, 18.0, 20.0, 22.0, 12.0, 13.0, 7.0, 7.0, 7.0, 7.0, 0.0, 5.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.4537458419799805, -2.3853323459625244, -2.3169188499450684, -2.2485053539276123, -2.1800918579101562, -2.111678123474121, -2.043264627456665, -1.974851131439209, -1.906437635421753, -1.8380241394042969, -1.7696106433868408, -1.7011970281600952, -1.6327835321426392, -1.564370036125183, -1.4959564208984375, -1.4275429248809814, -1.3591294288635254, -1.2907159328460693, -1.2223024368286133, -1.1538888216018677, -1.0854753255844116, -1.0170618295669556, -0.9486482739448547, -0.8802347183227539, -0.8118212223052979, -0.7434077262878418, -0.674994170665741, -0.6065806150436401, -0.5381671190261841, -0.46975359320640564, -0.4013400673866272, -0.33292654156684875, -0.2645127773284912, -0.19609925150871277, -0.12768572568893433, -0.059272199869155884, 0.009141325950622559, 0.077554851770401, 0.14596837759017944, 0.21438190340995789, 0.28279542922973633, 0.35120895504951477, 0.4196224808692932, 0.48803600668907166, 0.5564495325088501, 0.6248630285263062, 0.693276584148407, 0.7616901397705078, 0.8301036357879639, 0.8985171318054199, 0.9669306874275208, 1.0353442430496216, 1.1037577390670776, 1.1721712350845337, 1.2405848503112793, 1.3089983463287354, 1.3774118423461914, 1.4458253383636475, 1.5142388343811035, 1.5826524496078491, 1.6510659456253052, 1.7194794416427612, 1.7878930568695068, 1.856306552886963, 1.924720048904419]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 9.0, 4.0, 13.0, 14.0, 25.0, 45.0, 43.0, 100.0, 134.0, 201.0, 413.0, 1472.0, 39169.0, 4148656.0, 2715.0, 552.0, 290.0, 156.0, 88.0, 58.0, 43.0, 25.0, 16.0, 8.0, 11.0, 6.0, 4.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6708984375, -1.6204986572265625, -1.570098876953125, -1.5196990966796875, -1.46929931640625, -1.4188995361328125, -1.368499755859375, -1.3180999755859375, -1.2677001953125, -1.2173004150390625, -1.166900634765625, -1.1165008544921875, -1.06610107421875, -1.0157012939453125, -0.965301513671875, -0.9149017333984375, -0.864501953125, -0.8141021728515625, -0.763702392578125, -0.7133026123046875, -0.66290283203125, -0.6125030517578125, -0.562103271484375, -0.5117034912109375, -0.4613037109375, -0.4109039306640625, -0.360504150390625, -0.3101043701171875, -0.25970458984375, -0.2093048095703125, -0.158905029296875, -0.1085052490234375, -0.05810546875, -0.0077056884765625, 0.042694091796875, 0.0930938720703125, 0.14349365234375, 0.1938934326171875, 0.244293212890625, 0.2946929931640625, 0.3450927734375, 0.3954925537109375, 0.445892333984375, 0.4962921142578125, 0.54669189453125, 0.5970916748046875, 0.647491455078125, 0.6978912353515625, 0.748291015625, 0.7986907958984375, 0.849090576171875, 0.8994903564453125, 0.94989013671875, 1.0002899169921875, 1.050689697265625, 1.1010894775390625, 1.1514892578125, 1.2018890380859375, 1.252288818359375, 1.3026885986328125, 1.35308837890625, 1.4034881591796875, 1.453887939453125, 1.5042877197265625, 1.5546875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 7.0, 2.0, 5.0, 5.0, 14.0, 16.0, 31.0, 28.0, 34.0, 37.0, 53.0, 68.0, 57.0, 63.0, 79.0, 76.0, 66.0, 72.0, 68.0, 56.0, 44.0, 31.0, 23.0, 15.0, 20.0, 10.0, 8.0, 6.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.221923828125, -0.2158985137939453, -0.20987319946289062, -0.20384788513183594, -0.19782257080078125, -0.19179725646972656, -0.18577194213867188, -0.1797466278076172, -0.1737213134765625, -0.1676959991455078, -0.16167068481445312, -0.15564537048339844, -0.14962005615234375, -0.14359474182128906, -0.13756942749023438, -0.1315441131591797, -0.125518798828125, -0.11949348449707031, -0.11346817016601562, -0.10744285583496094, -0.10141754150390625, -0.09539222717285156, -0.08936691284179688, -0.08334159851074219, -0.0773162841796875, -0.07129096984863281, -0.06526565551757812, -0.05924034118652344, -0.05321502685546875, -0.04718971252441406, -0.041164398193359375, -0.03513908386230469, -0.02911376953125, -0.023088455200195312, -0.017063140869140625, -0.011037826538085938, -0.00501251220703125, 0.0010128021240234375, 0.007038116455078125, 0.013063430786132812, 0.0190887451171875, 0.025114059448242188, 0.031139373779296875, 0.03716468811035156, 0.04319000244140625, 0.04921531677246094, 0.055240631103515625, 0.06126594543457031, 0.067291259765625, 0.07331657409667969, 0.07934188842773438, 0.08536720275878906, 0.09139251708984375, 0.09741783142089844, 0.10344314575195312, 0.10946846008300781, 0.1154937744140625, 0.12151908874511719, 0.12754440307617188, 0.13356971740722656, 0.13959503173828125, 0.14562034606933594, 0.15164566040039062, 0.1576709747314453, 0.1636962890625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 6.0, 3.0, 4.0, 9.0, 5.0, 18.0, 22.0, 28.0, 39.0, 48.0, 80.0, 79.0, 115.0, 168.0, 248.0, 322.0, 526.0, 852.0, 1684.0, 3561.0, 9771.0, 52785.0, 4059514.0, 47402.0, 9372.0, 3562.0, 1592.0, 877.0, 495.0, 341.0, 231.0, 149.0, 124.0, 85.0, 44.0, 45.0, 19.0, 20.0, 12.0, 8.0, 10.0, 5.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.35693359375, -0.3459434509277344, -0.33495330810546875, -0.3239631652832031, -0.3129730224609375, -0.3019828796386719, -0.29099273681640625, -0.2800025939941406, -0.269012451171875, -0.2580223083496094, -0.24703216552734375, -0.23604202270507812, -0.2250518798828125, -0.21406173706054688, -0.20307159423828125, -0.19208145141601562, -0.18109130859375, -0.17010116577148438, -0.15911102294921875, -0.14812088012695312, -0.1371307373046875, -0.12614059448242188, -0.11515045166015625, -0.10416030883789062, -0.093170166015625, -0.08218002319335938, -0.07118988037109375, -0.060199737548828125, -0.0492095947265625, -0.038219451904296875, -0.02722930908203125, -0.016239166259765625, -0.0052490234375, 0.005741119384765625, 0.01673126220703125, 0.027721405029296875, 0.0387115478515625, 0.049701690673828125, 0.06069183349609375, 0.07168197631835938, 0.082672119140625, 0.09366226196289062, 0.10465240478515625, 0.11564254760742188, 0.1266326904296875, 0.13762283325195312, 0.14861297607421875, 0.15960311889648438, 0.17059326171875, 0.18158340454101562, 0.19257354736328125, 0.20356369018554688, 0.2145538330078125, 0.22554397583007812, 0.23653411865234375, 0.24752426147460938, 0.258514404296875, 0.2695045471191406, 0.28049468994140625, 0.2914848327636719, 0.3024749755859375, 0.3134651184082031, 0.32445526123046875, 0.3354454040527344, 0.346435546875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 3.0, 7.0, 14.0, 23.0, 120.0, 3665.0, 164.0, 33.0, 18.0, 11.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.163818359375, -0.15996646881103516, -0.1561145782470703, -0.15226268768310547, -0.14841079711914062, -0.14455890655517578, -0.14070701599121094, -0.1368551254272461, -0.13300323486328125, -0.1291513442993164, -0.12529945373535156, -0.12144756317138672, -0.11759567260742188, -0.11374378204345703, -0.10989189147949219, -0.10604000091552734, -0.1021881103515625, -0.09833621978759766, -0.09448432922363281, -0.09063243865966797, -0.08678054809570312, -0.08292865753173828, -0.07907676696777344, -0.0752248764038086, -0.07137298583984375, -0.0675210952758789, -0.06366920471191406, -0.05981731414794922, -0.055965423583984375, -0.05211353302001953, -0.04826164245605469, -0.044409751892089844, -0.040557861328125, -0.036705970764160156, -0.03285408020019531, -0.02900218963623047, -0.025150299072265625, -0.02129840850830078, -0.017446517944335938, -0.013594627380371094, -0.00974273681640625, -0.005890846252441406, -0.0020389556884765625, 0.0018129348754882812, 0.005664825439453125, 0.009516716003417969, 0.013368606567382812, 0.017220497131347656, 0.0210723876953125, 0.024924278259277344, 0.028776168823242188, 0.03262805938720703, 0.036479949951171875, 0.04033184051513672, 0.04418373107910156, 0.048035621643066406, 0.05188751220703125, 0.055739402770996094, 0.05959129333496094, 0.06344318389892578, 0.06729507446289062, 0.07114696502685547, 0.07499885559082031, 0.07885074615478516, 0.08270263671875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 7.0, 13.0, 21.0, 61.0, 105.0, 168.0, 239.0, 186.0, 102.0, 61.0, 21.0, 8.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35893046855926514, -0.3456893265247345, -0.33244821429252625, -0.3192070722579956, -0.30596593022346497, -0.2927247881889343, -0.2794836759567261, -0.26624253392219543, -0.2530013918876648, -0.23976026475429535, -0.2265191227197647, -0.21327799558639526, -0.20003685355186462, -0.18679572641849518, -0.17355459928512573, -0.1603134572505951, -0.14707234501838684, -0.1338312178850174, -0.12059007585048676, -0.10734894871711731, -0.09410781413316727, -0.08086667954921722, -0.06762555241584778, -0.054384417831897736, -0.04114328324794769, -0.0279021505266428, -0.014661017805337906, -0.0014198869466781616, 0.011821247637271881, 0.025062382221221924, 0.03830350935459137, 0.05154464393854141, 0.06478574872016907, 0.07802688330411911, 0.09126801788806915, 0.1045091450214386, 0.11775027960538864, 0.13099141418933868, 0.14423254132270813, 0.15747368335723877, 0.17071481049060822, 0.18395593762397766, 0.1971970796585083, 0.21043820679187775, 0.2236793339252472, 0.23692047595977783, 0.2501615881919861, 0.2634027302265167, 0.27664387226104736, 0.289885014295578, 0.30312612652778625, 0.3163672685623169, 0.32960841059684753, 0.3428495526313782, 0.3560906648635864, 0.36933180689811707, 0.3825729489326477, 0.39581409096717834, 0.4090552031993866, 0.42229634523391724, 0.4355374872684479, 0.4487786293029785, 0.46201974153518677, 0.4752608835697174, 0.48850199580192566]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 6.0, 9.0, 10.0, 8.0, 10.0, 8.0, 8.0, 25.0, 20.0, 16.0, 14.0, 28.0, 28.0, 33.0, 41.0, 29.0, 28.0, 34.0, 36.0, 43.0, 47.0, 35.0, 48.0, 49.0, 30.0, 32.0, 35.0, 33.0, 31.0, 35.0, 31.0, 32.0, 23.0, 21.0, 17.0, 15.0, 8.0, 7.0, 9.0, 7.0, 8.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15804731845855713, -0.15313029289245605, -0.1482132524251938, -0.1432962268590927, -0.13837918639183044, -0.13346216082572937, -0.1285451203584671, -0.12362809479236603, -0.11871106177568436, -0.11379402875900269, -0.10887699574232101, -0.10395996272563934, -0.09904293715953827, -0.094125896692276, -0.08920887112617493, -0.08429183810949326, -0.07937480509281158, -0.07445777207612991, -0.06954073905944824, -0.06462370604276657, -0.0597066767513752, -0.05478964373469353, -0.049872614443302155, -0.04495558142662048, -0.04003854840993881, -0.03512151539325714, -0.03020448423922062, -0.025287453085184097, -0.020370420068502426, -0.015453387051820755, -0.010536355897784233, -0.005619324743747711, -0.00070229172706604, 0.0042147403582930565, 0.009131772443652153, 0.01404880452901125, 0.018965836614370346, 0.023882869631052017, 0.02879990078508854, 0.03371693193912506, 0.03863396495580673, 0.0435509979724884, 0.048468030989170074, 0.05338506028056145, 0.05830209329724312, 0.06321913003921509, 0.06813615560531616, 0.07305318862199783, 0.0779702216386795, 0.08288725465536118, 0.08780428767204285, 0.09272132068872452, 0.09763835370540619, 0.10255537927150726, 0.10747241228818893, 0.1123894453048706, 0.11730647832155228, 0.12222351133823395, 0.12714053690433502, 0.1320575773715973, 0.13697460293769836, 0.14189164340496063, 0.1468086689710617, 0.15172570943832397, 0.15664273500442505]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 8.0, 9.0, 14.0, 20.0, 32.0, 42.0, 63.0, 97.0, 123.0, 184.0, 265.0, 400.0, 608.0, 1187.0, 2294.0, 5076.0, 12257.0, 35721.0, 121031.0, 371742.0, 340346.0, 104746.0, 31591.0, 11169.0, 4576.0, 2085.0, 1105.0, 594.0, 370.0, 224.0, 172.0, 115.0, 89.0, 53.0, 38.0, 32.0, 13.0, 18.0, 15.0, 7.0, 6.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.306884765625, -0.29784393310546875, -0.2888031005859375, -0.27976226806640625, -0.270721435546875, -0.26168060302734375, -0.2526397705078125, -0.24359893798828125, -0.23455810546875, -0.22551727294921875, -0.2164764404296875, -0.20743560791015625, -0.198394775390625, -0.18935394287109375, -0.1803131103515625, -0.17127227783203125, -0.1622314453125, -0.15319061279296875, -0.1441497802734375, -0.13510894775390625, -0.126068115234375, -0.11702728271484375, -0.1079864501953125, -0.09894561767578125, -0.08990478515625, -0.08086395263671875, -0.0718231201171875, -0.06278228759765625, -0.053741455078125, -0.04470062255859375, -0.0356597900390625, -0.02661895751953125, -0.017578125, -0.00853729248046875, 0.0005035400390625, 0.00954437255859375, 0.018585205078125, 0.02762603759765625, 0.0366668701171875, 0.04570770263671875, 0.05474853515625, 0.06378936767578125, 0.0728302001953125, 0.08187103271484375, 0.090911865234375, 0.09995269775390625, 0.1089935302734375, 0.11803436279296875, 0.1270751953125, 0.13611602783203125, 0.1451568603515625, 0.15419769287109375, 0.163238525390625, 0.17227935791015625, 0.1813201904296875, 0.19036102294921875, 0.19940185546875, 0.20844268798828125, 0.2174835205078125, 0.22652435302734375, 0.235565185546875, 0.24460601806640625, 0.2536468505859375, 0.26268768310546875, 0.271728515625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 4.0, 13.0, 6.0, 28.0, 21.0, 24.0, 26.0, 35.0, 43.0, 50.0, 68.0, 69.0, 65.0, 60.0, 65.0, 73.0, 66.0, 67.0, 46.0, 41.0, 33.0, 24.0, 23.0, 13.0, 8.0, 13.0, 6.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2242431640625, -0.2181072235107422, -0.21197128295898438, -0.20583534240722656, -0.19969940185546875, -0.19356346130371094, -0.18742752075195312, -0.1812915802001953, -0.1751556396484375, -0.1690196990966797, -0.16288375854492188, -0.15674781799316406, -0.15061187744140625, -0.14447593688964844, -0.13833999633789062, -0.1322040557861328, -0.126068115234375, -0.11993217468261719, -0.11379623413085938, -0.10766029357910156, -0.10152435302734375, -0.09538841247558594, -0.08925247192382812, -0.08311653137207031, -0.0769805908203125, -0.07084465026855469, -0.06470870971679688, -0.05857276916503906, -0.05243682861328125, -0.04630088806152344, -0.040164947509765625, -0.03402900695800781, -0.02789306640625, -0.021757125854492188, -0.015621185302734375, -0.009485244750976562, -0.00334930419921875, 0.0027866363525390625, 0.008922576904296875, 0.015058517456054688, 0.0211944580078125, 0.027330398559570312, 0.033466339111328125, 0.03960227966308594, 0.04573822021484375, 0.05187416076660156, 0.058010101318359375, 0.06414604187011719, 0.070281982421875, 0.07641792297363281, 0.08255386352539062, 0.08868980407714844, 0.09482574462890625, 0.10096168518066406, 0.10709762573242188, 0.11323356628417969, 0.1193695068359375, 0.1255054473876953, 0.13164138793945312, 0.13777732849121094, 0.14391326904296875, 0.15004920959472656, 0.15618515014648438, 0.1623210906982422, 0.16845703125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 6.0, 4.0, 9.0, 14.0, 21.0, 29.0, 33.0, 61.0, 74.0, 121.0, 224.0, 326.0, 565.0, 1117.0, 2897.0, 10526.0, 59533.0, 459226.0, 440968.0, 57024.0, 10346.0, 2898.0, 1118.0, 558.0, 330.0, 190.0, 131.0, 65.0, 54.0, 36.0, 23.0, 14.0, 6.0, 7.0, 3.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.363037109375, -0.3516883850097656, -0.34033966064453125, -0.3289909362792969, -0.3176422119140625, -0.3062934875488281, -0.29494476318359375, -0.2835960388183594, -0.272247314453125, -0.2608985900878906, -0.24954986572265625, -0.23820114135742188, -0.2268524169921875, -0.21550369262695312, -0.20415496826171875, -0.19280624389648438, -0.18145751953125, -0.17010879516601562, -0.15876007080078125, -0.14741134643554688, -0.1360626220703125, -0.12471389770507812, -0.11336517333984375, -0.10201644897460938, -0.090667724609375, -0.07931900024414062, -0.06797027587890625, -0.056621551513671875, -0.0452728271484375, -0.033924102783203125, -0.02257537841796875, -0.011226654052734375, 0.0001220703125, 0.011470794677734375, 0.02281951904296875, 0.034168243408203125, 0.0455169677734375, 0.056865692138671875, 0.06821441650390625, 0.07956314086914062, 0.090911865234375, 0.10226058959960938, 0.11360931396484375, 0.12495803833007812, 0.1363067626953125, 0.14765548706054688, 0.15900421142578125, 0.17035293579101562, 0.18170166015625, 0.19305038452148438, 0.20439910888671875, 0.21574783325195312, 0.2270965576171875, 0.23844528198242188, 0.24979400634765625, 0.2611427307128906, 0.272491455078125, 0.2838401794433594, 0.29518890380859375, 0.3065376281738281, 0.3178863525390625, 0.3292350769042969, 0.34058380126953125, 0.3519325256347656, 0.36328125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 3.0, 11.0, 5.0, 10.0, 9.0, 8.0, 14.0, 17.0, 23.0, 27.0, 27.0, 32.0, 50.0, 40.0, 48.0, 61.0, 39.0, 41.0, 65.0, 50.0, 41.0, 50.0, 43.0, 39.0, 44.0, 37.0, 30.0, 33.0, 27.0, 21.0, 17.0, 7.0, 13.0, 5.0, 7.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.69970703125, -0.67938232421875, -0.6590576171875, -0.63873291015625, -0.618408203125, -0.59808349609375, -0.5777587890625, -0.55743408203125, -0.537109375, -0.51678466796875, -0.4964599609375, -0.47613525390625, -0.455810546875, -0.43548583984375, -0.4151611328125, -0.39483642578125, -0.37451171875, -0.35418701171875, -0.3338623046875, -0.31353759765625, -0.293212890625, -0.27288818359375, -0.2525634765625, -0.23223876953125, -0.2119140625, -0.19158935546875, -0.1712646484375, -0.15093994140625, -0.130615234375, -0.11029052734375, -0.0899658203125, -0.06964111328125, -0.04931640625, -0.02899169921875, -0.0086669921875, 0.01165771484375, 0.031982421875, 0.05230712890625, 0.0726318359375, 0.09295654296875, 0.11328125, 0.13360595703125, 0.1539306640625, 0.17425537109375, 0.194580078125, 0.21490478515625, 0.2352294921875, 0.25555419921875, 0.27587890625, 0.29620361328125, 0.3165283203125, 0.33685302734375, 0.357177734375, 0.37750244140625, 0.3978271484375, 0.41815185546875, 0.4384765625, 0.45880126953125, 0.4791259765625, 0.49945068359375, 0.519775390625, 0.54010009765625, 0.5604248046875, 0.58074951171875, 0.60107421875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 7.0, 10.0, 16.0, 31.0, 54.0, 120.0, 209.0, 651.0, 1980.0, 8954.0, 115927.0, 850253.0, 61387.0, 6341.0, 1576.0, 576.0, 236.0, 110.0, 51.0, 24.0, 13.0, 6.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2440185546875, -0.2357196807861328, -0.22742080688476562, -0.21912193298339844, -0.21082305908203125, -0.20252418518066406, -0.19422531127929688, -0.1859264373779297, -0.1776275634765625, -0.1693286895751953, -0.16102981567382812, -0.15273094177246094, -0.14443206787109375, -0.13613319396972656, -0.12783432006835938, -0.11953544616699219, -0.111236572265625, -0.10293769836425781, -0.09463882446289062, -0.08633995056152344, -0.07804107666015625, -0.06974220275878906, -0.061443328857421875, -0.05314445495605469, -0.0448455810546875, -0.03654670715332031, -0.028247833251953125, -0.019948959350585938, -0.01165008544921875, -0.0033512115478515625, 0.004947662353515625, 0.013246536254882812, 0.02154541015625, 0.029844284057617188, 0.038143157958984375, 0.04644203186035156, 0.05474090576171875, 0.06303977966308594, 0.07133865356445312, 0.07963752746582031, 0.0879364013671875, 0.09623527526855469, 0.10453414916992188, 0.11283302307128906, 0.12113189697265625, 0.12943077087402344, 0.13772964477539062, 0.1460285186767578, 0.154327392578125, 0.1626262664794922, 0.17092514038085938, 0.17922401428222656, 0.18752288818359375, 0.19582176208496094, 0.20412063598632812, 0.2124195098876953, 0.2207183837890625, 0.2290172576904297, 0.23731613159179688, 0.24561500549316406, 0.25391387939453125, 0.26221275329589844, 0.2705116271972656, 0.2788105010986328, 0.287109375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 1.0, 4.0, 7.0, 3.0, 4.0, 5.0, 7.0, 17.0, 11.0, 11.0, 16.0, 23.0, 32.0, 38.0, 47.0, 66.0, 73.0, 85.0, 108.0, 88.0, 61.0, 65.0, 53.0, 48.0, 35.0, 13.0, 12.0, 14.0, 18.0, 6.0, 7.0, 2.0, 6.0, 3.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.554624557495117e-05, -9.220093488693237e-05, -8.885562419891357e-05, -8.551031351089478e-05, -8.216500282287598e-05, -7.881969213485718e-05, -7.547438144683838e-05, -7.212907075881958e-05, -6.878376007080078e-05, -6.543844938278198e-05, -6.209313869476318e-05, -5.8747828006744385e-05, -5.5402517318725586e-05, -5.205720663070679e-05, -4.871189594268799e-05, -4.536658525466919e-05, -4.202127456665039e-05, -3.867596387863159e-05, -3.533065319061279e-05, -3.1985342502593994e-05, -2.8640031814575195e-05, -2.5294721126556396e-05, -2.1949410438537598e-05, -1.86040997505188e-05, -1.52587890625e-05, -1.1913478374481201e-05, -8.568167686462402e-06, -5.2228569984436035e-06, -1.8775463104248047e-06, 1.4677643775939941e-06, 4.813075065612793e-06, 8.158385753631592e-06, 1.150369644165039e-05, 1.484900712966919e-05, 1.8194317817687988e-05, 2.1539628505706787e-05, 2.4884939193725586e-05, 2.8230249881744385e-05, 3.1575560569763184e-05, 3.492087125778198e-05, 3.826618194580078e-05, 4.161149263381958e-05, 4.495680332183838e-05, 4.830211400985718e-05, 5.1647424697875977e-05, 5.4992735385894775e-05, 5.8338046073913574e-05, 6.168335676193237e-05, 6.502866744995117e-05, 6.837397813796997e-05, 7.171928882598877e-05, 7.506459951400757e-05, 7.840991020202637e-05, 8.175522089004517e-05, 8.510053157806396e-05, 8.844584226608276e-05, 9.179115295410156e-05, 9.513646364212036e-05, 9.848177433013916e-05, 0.00010182708501815796, 0.00010517239570617676, 0.00010851770639419556, 0.00011186301708221436, 0.00011520832777023315, 0.00011855363845825195]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 10.0, 11.0, 11.0, 18.0, 16.0, 30.0, 64.0, 78.0, 168.0, 333.0, 690.0, 1480.0, 4217.0, 16725.0, 162014.0, 745978.0, 98455.0, 12289.0, 3427.0, 1312.0, 516.0, 283.0, 159.0, 94.0, 51.0, 38.0, 29.0, 17.0, 11.0, 9.0, 4.0, 8.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.177978515625, -0.17192649841308594, -0.16587448120117188, -0.1598224639892578, -0.15377044677734375, -0.1477184295654297, -0.14166641235351562, -0.13561439514160156, -0.1295623779296875, -0.12351036071777344, -0.11745834350585938, -0.11140632629394531, -0.10535430908203125, -0.09930229187011719, -0.09325027465820312, -0.08719825744628906, -0.081146240234375, -0.07509422302246094, -0.06904220581054688, -0.06299018859863281, -0.05693817138671875, -0.05088615417480469, -0.044834136962890625, -0.03878211975097656, -0.0327301025390625, -0.026678085327148438, -0.020626068115234375, -0.014574050903320312, -0.00852203369140625, -0.0024700164794921875, 0.003582000732421875, 0.009634017944335938, 0.01568603515625, 0.021738052368164062, 0.027790069580078125, 0.03384208679199219, 0.03989410400390625, 0.04594612121582031, 0.051998138427734375, 0.05805015563964844, 0.0641021728515625, 0.07015419006347656, 0.07620620727539062, 0.08225822448730469, 0.08831024169921875, 0.09436225891113281, 0.10041427612304688, 0.10646629333496094, 0.112518310546875, 0.11857032775878906, 0.12462234497070312, 0.1306743621826172, 0.13672637939453125, 0.1427783966064453, 0.14883041381835938, 0.15488243103027344, 0.1609344482421875, 0.16698646545410156, 0.17303848266601562, 0.1790904998779297, 0.18514251708984375, 0.1911945343017578, 0.19724655151367188, 0.20329856872558594, 0.2093505859375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 6.0, 4.0, 15.0, 29.0, 41.0, 89.0, 121.0, 170.0, 171.0, 155.0, 89.0, 50.0, 21.0, 16.0, 4.0, 7.0, 6.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19970703125, -0.18926239013671875, -0.1788177490234375, -0.16837310791015625, -0.157928466796875, -0.14748382568359375, -0.1370391845703125, -0.12659454345703125, -0.11614990234375, -0.10570526123046875, -0.0952606201171875, -0.08481597900390625, -0.074371337890625, -0.06392669677734375, -0.0534820556640625, -0.04303741455078125, -0.0325927734375, -0.02214813232421875, -0.0117034912109375, -0.00125885009765625, 0.009185791015625, 0.01963043212890625, 0.0300750732421875, 0.04051971435546875, 0.05096435546875, 0.06140899658203125, 0.0718536376953125, 0.08229827880859375, 0.092742919921875, 0.10318756103515625, 0.1136322021484375, 0.12407684326171875, 0.134521484375, 0.14496612548828125, 0.1554107666015625, 0.16585540771484375, 0.176300048828125, 0.18674468994140625, 0.1971893310546875, 0.20763397216796875, 0.21807861328125, 0.22852325439453125, 0.2389678955078125, 0.24941253662109375, 0.259857177734375, 0.27030181884765625, 0.2807464599609375, 0.29119110107421875, 0.3016357421875, 0.31208038330078125, 0.3225250244140625, 0.33296966552734375, 0.343414306640625, 0.35385894775390625, 0.3643035888671875, 0.37474822998046875, 0.38519287109375, 0.39563751220703125, 0.4060821533203125, 0.41652679443359375, 0.426971435546875, 0.43741607666015625, 0.4478607177734375, 0.45830535888671875, 0.46875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 13.0, 20.0, 15.0, 27.0, 42.0, 60.0, 98.0, 138.0, 164.0, 150.0, 116.0, 63.0, 43.0, 19.0, 11.0, 9.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9455392360687256, -1.8637481927871704, -1.7819571495056152, -1.7001662254333496, -1.6183751821517944, -1.5365841388702393, -1.4547932147979736, -1.3730021715164185, -1.2912111282348633, -1.209420084953308, -1.127629041671753, -1.0458381175994873, -0.9640470743179321, -0.882256031036377, -0.8004650473594666, -0.7186740636825562, -0.636883020401001, -0.5550919771194458, -0.4733009934425354, -0.3915099799633026, -0.3097189664840698, -0.22792795300483704, -0.14613693952560425, -0.06434595584869385, 0.017445087432861328, 0.09923610091209412, 0.1810271143913269, 0.2628181278705597, 0.3446091413497925, 0.42640015482902527, 0.5081911683082581, 0.5899821519851685, 0.6717734336853027, 0.7535644769668579, 0.8353554606437683, 0.9171464443206787, 0.9989374876022339, 1.080728530883789, 1.1625194549560547, 1.2443104982376099, 1.326101541519165, 1.4078925848007202, 1.4896836280822754, 1.571474552154541, 1.6532655954360962, 1.7350566387176514, 1.816847562789917, 1.8986386060714722, 1.9804296493530273, 2.062220573425293, 2.1440117359161377, 2.2258026599884033, 2.307593822479248, 2.3893847465515137, 2.4711756706237793, 2.552966594696045, 2.6347577571868896, 2.7165486812591553, 2.79833984375, 2.8801307678222656, 2.9619216918945312, 3.043712854385376, 3.1255037784576416, 3.2072949409484863, 3.289085865020752]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 11.0, 2.0, 9.0, 4.0, 13.0, 9.0, 9.0, 16.0, 19.0, 27.0, 27.0, 25.0, 26.0, 42.0, 37.0, 34.0, 53.0, 50.0, 48.0, 52.0, 66.0, 43.0, 33.0, 27.0, 35.0, 31.0, 34.0, 26.0, 28.0, 29.0, 17.0, 18.0, 11.0, 15.0, 16.0, 11.0, 11.0, 5.0, 4.0, 8.0, 10.0, 3.0, 7.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-3.0298027992248535, -2.9452853202819824, -2.8607680797576904, -2.7762506008148193, -2.6917331218719482, -2.607215642929077, -2.522698402404785, -2.438180923461914, -2.353663444519043, -2.269145965576172, -2.18462872505188, -2.100111246109009, -2.0155937671661377, -1.9310764074325562, -1.8465590476989746, -1.7620415687561035, -1.677524209022522, -1.5930068492889404, -1.5084893703460693, -1.4239720106124878, -1.3394545316696167, -1.2549371719360352, -1.170419692993164, -1.0859023332595825, -1.001384973526001, -0.9168675541877747, -0.8323501348495483, -0.7478327751159668, -0.6633152961730957, -0.5787979364395142, -0.49428051710128784, -0.4097630977630615, -0.32524561882019043, -0.2407281994819641, -0.156210795044899, -0.07169339060783386, 0.012824028730392456, 0.09734144806861877, 0.1818588376045227, 0.266376256942749, 0.35089367628097534, 0.43541109561920166, 0.519928514957428, 0.6044459342956543, 0.6889632940292358, 0.7734807729721069, 0.8579981327056885, 0.9425155520439148, 1.0270329713821411, 1.1115503311157227, 1.1960678100585938, 1.2805851697921753, 1.3651026487350464, 1.449620008468628, 1.534137487411499, 1.6186548471450806, 1.703172206878662, 1.7876895666122437, 1.8722070455551147, 1.9567244052886963, 2.0412418842315674, 2.1257593631744385, 2.2102766036987305, 2.2947940826416016, 2.3793115615844727]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 3.0, 7.0, 9.0, 15.0, 16.0, 30.0, 46.0, 95.0, 160.0, 292.0, 633.0, 1792.0, 7861.0, 4082732.0, 93825.0, 4436.0, 1244.0, 515.0, 242.0, 132.0, 64.0, 42.0, 23.0, 16.0, 14.0, 11.0, 6.0, 3.0, 6.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67578125, -0.6474456787109375, -0.619110107421875, -0.5907745361328125, -0.56243896484375, -0.5341033935546875, -0.505767822265625, -0.4774322509765625, -0.4490966796875, -0.4207611083984375, -0.392425537109375, -0.3640899658203125, -0.33575439453125, -0.3074188232421875, -0.279083251953125, -0.2507476806640625, -0.222412109375, -0.1940765380859375, -0.165740966796875, -0.1374053955078125, -0.10906982421875, -0.0807342529296875, -0.052398681640625, -0.0240631103515625, 0.0042724609375, 0.0326080322265625, 0.060943603515625, 0.0892791748046875, 0.11761474609375, 0.1459503173828125, 0.174285888671875, 0.2026214599609375, 0.23095703125, 0.2592926025390625, 0.287628173828125, 0.3159637451171875, 0.34429931640625, 0.3726348876953125, 0.400970458984375, 0.4293060302734375, 0.4576416015625, 0.4859771728515625, 0.514312744140625, 0.5426483154296875, 0.57098388671875, 0.5993194580078125, 0.627655029296875, 0.6559906005859375, 0.684326171875, 0.7126617431640625, 0.740997314453125, 0.7693328857421875, 0.79766845703125, 0.8260040283203125, 0.854339599609375, 0.8826751708984375, 0.9110107421875, 0.9393463134765625, 0.967681884765625, 0.9960174560546875, 1.02435302734375, 1.0526885986328125, 1.081024169921875, 1.1093597412109375, 1.1376953125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 9.0, 5.0, 7.0, 10.0, 12.0, 18.0, 16.0, 31.0, 30.0, 33.0, 30.0, 58.0, 58.0, 58.0, 64.0, 49.0, 71.0, 61.0, 68.0, 52.0, 45.0, 44.0, 28.0, 23.0, 25.0, 25.0, 20.0, 10.0, 16.0, 11.0, 6.0, 5.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2269287109375, -0.2207965850830078, -0.21466445922851562, -0.20853233337402344, -0.20240020751953125, -0.19626808166503906, -0.19013595581054688, -0.1840038299560547, -0.1778717041015625, -0.1717395782470703, -0.16560745239257812, -0.15947532653808594, -0.15334320068359375, -0.14721107482910156, -0.14107894897460938, -0.1349468231201172, -0.128814697265625, -0.12268257141113281, -0.11655044555664062, -0.11041831970214844, -0.10428619384765625, -0.09815406799316406, -0.09202194213867188, -0.08588981628417969, -0.0797576904296875, -0.07362556457519531, -0.06749343872070312, -0.06136131286621094, -0.05522918701171875, -0.04909706115722656, -0.042964935302734375, -0.03683280944824219, -0.03070068359375, -0.024568557739257812, -0.018436431884765625, -0.012304306030273438, -0.00617218017578125, -4.00543212890625e-05, 0.006092071533203125, 0.012224197387695312, 0.0183563232421875, 0.024488449096679688, 0.030620574951171875, 0.03675270080566406, 0.04288482666015625, 0.04901695251464844, 0.055149078369140625, 0.06128120422363281, 0.067413330078125, 0.07354545593261719, 0.07967758178710938, 0.08580970764160156, 0.09194183349609375, 0.09807395935058594, 0.10420608520507812, 0.11033821105957031, 0.1164703369140625, 0.12260246276855469, 0.12873458862304688, 0.13486671447753906, 0.14099884033203125, 0.14713096618652344, 0.15326309204101562, 0.1593952178955078, 0.16552734375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 5.0, 1.0, 5.0, 4.0, 7.0, 1.0, 5.0, 4.0, 11.0, 13.0, 18.0, 22.0, 24.0, 31.0, 38.0, 54.0, 99.0, 148.0, 239.0, 399.0, 724.0, 1280.0, 2787.0, 7816.0, 50247.0, 4061356.0, 54675.0, 8155.0, 2907.0, 1311.0, 702.0, 389.0, 265.0, 143.0, 100.0, 76.0, 58.0, 41.0, 26.0, 27.0, 19.0, 16.0, 8.0, 7.0, 5.0, 2.0, 5.0, 6.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.429931640625, -0.416290283203125, -0.40264892578125, -0.389007568359375, -0.3753662109375, -0.361724853515625, -0.34808349609375, -0.334442138671875, -0.32080078125, -0.307159423828125, -0.29351806640625, -0.279876708984375, -0.2662353515625, -0.252593994140625, -0.23895263671875, -0.225311279296875, -0.211669921875, -0.198028564453125, -0.18438720703125, -0.170745849609375, -0.1571044921875, -0.143463134765625, -0.12982177734375, -0.116180419921875, -0.1025390625, -0.088897705078125, -0.07525634765625, -0.061614990234375, -0.0479736328125, -0.034332275390625, -0.02069091796875, -0.007049560546875, 0.006591796875, 0.020233154296875, 0.03387451171875, 0.047515869140625, 0.0611572265625, 0.074798583984375, 0.08843994140625, 0.102081298828125, 0.11572265625, 0.129364013671875, 0.14300537109375, 0.156646728515625, 0.1702880859375, 0.183929443359375, 0.19757080078125, 0.211212158203125, 0.224853515625, 0.238494873046875, 0.25213623046875, 0.265777587890625, 0.2794189453125, 0.293060302734375, 0.30670166015625, 0.320343017578125, 0.333984375, 0.347625732421875, 0.36126708984375, 0.374908447265625, 0.3885498046875, 0.402191162109375, 0.41583251953125, 0.429473876953125, 0.443115234375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 1.0, 2.0, 14.0, 25.0, 80.0, 3577.0, 289.0, 49.0, 26.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.267333984375, -0.26122188568115234, -0.2551097869873047, -0.24899768829345703, -0.24288558959960938, -0.23677349090576172, -0.23066139221191406, -0.2245492935180664, -0.21843719482421875, -0.2123250961303711, -0.20621299743652344, -0.20010089874267578, -0.19398880004882812, -0.18787670135498047, -0.1817646026611328, -0.17565250396728516, -0.1695404052734375, -0.16342830657958984, -0.1573162078857422, -0.15120410919189453, -0.14509201049804688, -0.13897991180419922, -0.13286781311035156, -0.1267557144165039, -0.12064361572265625, -0.1145315170288086, -0.10841941833496094, -0.10230731964111328, -0.09619522094726562, -0.09008312225341797, -0.08397102355957031, -0.07785892486572266, -0.071746826171875, -0.06563472747802734, -0.05952262878417969, -0.05341053009033203, -0.047298431396484375, -0.04118633270263672, -0.03507423400878906, -0.028962135314941406, -0.02285003662109375, -0.016737937927246094, -0.010625839233398438, -0.004513740539550781, 0.001598358154296875, 0.007710456848144531, 0.013822555541992188, 0.019934654235839844, 0.0260467529296875, 0.032158851623535156, 0.03827095031738281, 0.04438304901123047, 0.050495147705078125, 0.05660724639892578, 0.06271934509277344, 0.0688314437866211, 0.07494354248046875, 0.0810556411743164, 0.08716773986816406, 0.09327983856201172, 0.09939193725585938, 0.10550403594970703, 0.11161613464355469, 0.11772823333740234, 0.12384033203125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 6.0, 20.0, 48.0, 71.0, 124.0, 163.0, 176.0, 147.0, 109.0, 65.0, 34.0, 15.0, 11.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5215672254562378, -0.508392333984375, -0.495217502117157, -0.4820426106452942, -0.4688677489757538, -0.4556928873062134, -0.4425179958343506, -0.4293431341648102, -0.4161682724952698, -0.40299341082572937, -0.38981854915618896, -0.37664365768432617, -0.36346879601478577, -0.35029393434524536, -0.33711904287338257, -0.32394418120384216, -0.31076931953430176, -0.29759445786476135, -0.28441959619522095, -0.27124470472335815, -0.25806984305381775, -0.24489498138427734, -0.23172010481357574, -0.21854522824287415, -0.20537036657333374, -0.19219550490379333, -0.17902062833309174, -0.16584575176239014, -0.15267089009284973, -0.13949602842330933, -0.12632115185260773, -0.11314628273248672, -0.09997141361236572, -0.08679654449224472, -0.07362167537212372, -0.060446806252002716, -0.047271937131881714, -0.03409706801176071, -0.02092219889163971, -0.007747329771518707, 0.005427539348602295, 0.018602408468723297, 0.0317772775888443, 0.0449521467089653, 0.058127015829086304, 0.0713018849492073, 0.08447675406932831, 0.09765162318944931, 0.11082649230957031, 0.12400136142969131, 0.13717623054981232, 0.15035110712051392, 0.16352596879005432, 0.17670083045959473, 0.18987570703029633, 0.20305058360099792, 0.21622544527053833, 0.22940030694007874, 0.24257518351078033, 0.25575006008148193, 0.26892492175102234, 0.28209978342056274, 0.29527467489242554, 0.30844953656196594, 0.32162439823150635]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 4.0, 4.0, 9.0, 6.0, 11.0, 10.0, 16.0, 12.0, 26.0, 18.0, 21.0, 24.0, 23.0, 37.0, 41.0, 43.0, 43.0, 42.0, 40.0, 52.0, 46.0, 51.0, 49.0, 50.0, 42.0, 38.0, 45.0, 30.0, 28.0, 30.0, 28.0, 16.0, 19.0, 12.0, 12.0, 9.0, 5.0, 1.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.22378134727478027, -0.21661347150802612, -0.20944559574127197, -0.20227771997451782, -0.19510984420776367, -0.18794196844100952, -0.18077409267425537, -0.17360621690750122, -0.16643834114074707, -0.15927046537399292, -0.15210258960723877, -0.14493471384048462, -0.13776683807373047, -0.13059896230697632, -0.12343109399080276, -0.11626321822404861, -0.10909534990787506, -0.10192747414112091, -0.09475959837436676, -0.08759172260761261, -0.08042384684085846, -0.07325597107410431, -0.06608810275793076, -0.058920226991176605, -0.051752351224422455, -0.044584475457668304, -0.037416599690914154, -0.030248727649450302, -0.02308085188269615, -0.015912976115942, -0.00874510407447815, -0.001577228307723999, 0.005590647459030151, 0.012758522294461727, 0.019926397129893303, 0.027094271034002304, 0.034262146800756454, 0.041430022567510605, 0.04859789460897446, 0.05576577037572861, 0.06293364614248276, 0.07010152190923691, 0.07726939767599106, 0.08443726599216461, 0.09160514175891876, 0.09877301752567291, 0.10594089329242706, 0.11310876905918121, 0.12027664482593536, 0.12744452059268951, 0.13461239635944366, 0.14178027212619781, 0.14894814789295197, 0.15611602365970612, 0.16328388452529907, 0.17045176029205322, 0.17761963605880737, 0.18478751182556152, 0.19195538759231567, 0.19912326335906982, 0.20629113912582397, 0.21345901489257812, 0.22062689065933228, 0.22779476642608643, 0.23496264219284058]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 8.0, 5.0, 16.0, 16.0, 26.0, 41.0, 63.0, 114.0, 187.0, 332.0, 721.0, 1794.0, 5629.0, 26799.0, 197356.0, 629659.0, 155930.0, 21931.0, 4942.0, 1533.0, 637.0, 340.0, 190.0, 96.0, 69.0, 44.0, 21.0, 22.0, 15.0, 6.0, 3.0, 8.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.291015625, -0.27860260009765625, -0.2661895751953125, -0.25377655029296875, -0.241363525390625, -0.22895050048828125, -0.2165374755859375, -0.20412445068359375, -0.19171142578125, -0.17929840087890625, -0.1668853759765625, -0.15447235107421875, -0.142059326171875, -0.12964630126953125, -0.1172332763671875, -0.10482025146484375, -0.0924072265625, -0.07999420166015625, -0.0675811767578125, -0.05516815185546875, -0.042755126953125, -0.03034210205078125, -0.0179290771484375, -0.00551605224609375, 0.00689697265625, 0.01930999755859375, 0.0317230224609375, 0.04413604736328125, 0.056549072265625, 0.06896209716796875, 0.0813751220703125, 0.09378814697265625, 0.106201171875, 0.11861419677734375, 0.1310272216796875, 0.14344024658203125, 0.155853271484375, 0.16826629638671875, 0.1806793212890625, 0.19309234619140625, 0.20550537109375, 0.21791839599609375, 0.2303314208984375, 0.24274444580078125, 0.255157470703125, 0.26757049560546875, 0.2799835205078125, 0.29239654541015625, 0.3048095703125, 0.31722259521484375, 0.3296356201171875, 0.34204864501953125, 0.354461669921875, 0.36687469482421875, 0.3792877197265625, 0.39170074462890625, 0.40411376953125, 0.41652679443359375, 0.4289398193359375, 0.44135284423828125, 0.453765869140625, 0.46617889404296875, 0.4785919189453125, 0.49100494384765625, 0.50341796875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 9.0, 9.0, 9.0, 14.0, 14.0, 17.0, 23.0, 34.0, 30.0, 43.0, 34.0, 47.0, 47.0, 62.0, 58.0, 62.0, 76.0, 68.0, 50.0, 47.0, 39.0, 39.0, 33.0, 22.0, 24.0, 26.0, 16.0, 15.0, 13.0, 6.0, 6.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.22509765625, -0.21892738342285156, -0.21275711059570312, -0.2065868377685547, -0.20041656494140625, -0.1942462921142578, -0.18807601928710938, -0.18190574645996094, -0.1757354736328125, -0.16956520080566406, -0.16339492797851562, -0.1572246551513672, -0.15105438232421875, -0.1448841094970703, -0.13871383666992188, -0.13254356384277344, -0.126373291015625, -0.12020301818847656, -0.11403274536132812, -0.10786247253417969, -0.10169219970703125, -0.09552192687988281, -0.08935165405273438, -0.08318138122558594, -0.0770111083984375, -0.07084083557128906, -0.06467056274414062, -0.05850028991699219, -0.05233001708984375, -0.04615974426269531, -0.039989471435546875, -0.03381919860839844, -0.02764892578125, -0.021478652954101562, -0.015308380126953125, -0.009138107299804688, -0.00296783447265625, 0.0032024383544921875, 0.009372711181640625, 0.015542984008789062, 0.0217132568359375, 0.027883529663085938, 0.034053802490234375, 0.04022407531738281, 0.04639434814453125, 0.05256462097167969, 0.058734893798828125, 0.06490516662597656, 0.071075439453125, 0.07724571228027344, 0.08341598510742188, 0.08958625793457031, 0.09575653076171875, 0.10192680358886719, 0.10809707641601562, 0.11426734924316406, 0.1204376220703125, 0.12660789489746094, 0.13277816772460938, 0.1389484405517578, 0.14511871337890625, 0.1512889862060547, 0.15745925903320312, 0.16362953186035156, 0.1697998046875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 10.0, 6.0, 12.0, 13.0, 24.0, 27.0, 45.0, 87.0, 142.0, 257.0, 412.0, 932.0, 2305.0, 7677.0, 80388.0, 859631.0, 84587.0, 7812.0, 2300.0, 890.0, 433.0, 226.0, 124.0, 83.0, 47.0, 25.0, 13.0, 21.0, 8.0, 8.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.54638671875, -0.5278701782226562, -0.5093536376953125, -0.49083709716796875, -0.472320556640625, -0.45380401611328125, -0.4352874755859375, -0.41677093505859375, -0.39825439453125, -0.37973785400390625, -0.3612213134765625, -0.34270477294921875, -0.324188232421875, -0.30567169189453125, -0.2871551513671875, -0.26863861083984375, -0.2501220703125, -0.23160552978515625, -0.2130889892578125, -0.19457244873046875, -0.176055908203125, -0.15753936767578125, -0.1390228271484375, -0.12050628662109375, -0.10198974609375, -0.08347320556640625, -0.0649566650390625, -0.04644012451171875, -0.027923583984375, -0.00940704345703125, 0.0091094970703125, 0.02762603759765625, 0.046142578125, 0.06465911865234375, 0.0831756591796875, 0.10169219970703125, 0.120208740234375, 0.13872528076171875, 0.1572418212890625, 0.17575836181640625, 0.19427490234375, 0.21279144287109375, 0.2313079833984375, 0.24982452392578125, 0.268341064453125, 0.28685760498046875, 0.3053741455078125, 0.32389068603515625, 0.3424072265625, 0.36092376708984375, 0.3794403076171875, 0.39795684814453125, 0.416473388671875, 0.43498992919921875, 0.4535064697265625, 0.47202301025390625, 0.49053955078125, 0.5090560913085938, 0.5275726318359375, 0.5460891723632812, 0.564605712890625, 0.5831222534179688, 0.6016387939453125, 0.6201553344726562, 0.638671875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 8.0, 16.0, 17.0, 16.0, 45.0, 62.0, 73.0, 107.0, 126.0, 95.0, 96.0, 97.0, 81.0, 71.0, 42.0, 13.0, 13.0, 6.0, 8.0, 3.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3193359375, -1.2679290771484375, -1.216522216796875, -1.1651153564453125, -1.11370849609375, -1.0623016357421875, -1.010894775390625, -0.9594879150390625, -0.9080810546875, -0.8566741943359375, -0.805267333984375, -0.7538604736328125, -0.70245361328125, -0.6510467529296875, -0.599639892578125, -0.5482330322265625, -0.496826171875, -0.4454193115234375, -0.394012451171875, -0.3426055908203125, -0.29119873046875, -0.2397918701171875, -0.188385009765625, -0.1369781494140625, -0.0855712890625, -0.0341644287109375, 0.017242431640625, 0.0686492919921875, 0.12005615234375, 0.1714630126953125, 0.222869873046875, 0.2742767333984375, 0.32568359375, 0.3770904541015625, 0.428497314453125, 0.4799041748046875, 0.53131103515625, 0.5827178955078125, 0.634124755859375, 0.6855316162109375, 0.7369384765625, 0.7883453369140625, 0.839752197265625, 0.8911590576171875, 0.94256591796875, 0.9939727783203125, 1.045379638671875, 1.0967864990234375, 1.148193359375, 1.1996002197265625, 1.251007080078125, 1.3024139404296875, 1.35382080078125, 1.4052276611328125, 1.456634521484375, 1.5080413818359375, 1.5594482421875, 1.6108551025390625, 1.662261962890625, 1.7136688232421875, 1.76507568359375, 1.8164825439453125, 1.867889404296875, 1.9192962646484375, 1.970703125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 3.0, 9.0, 10.0, 33.0, 44.0, 199.0, 1083.0, 972378.0, 73845.0, 696.0, 157.0, 52.0, 15.0, 9.0, 12.0, 6.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.037109375, -0.982269287109375, -0.92742919921875, -0.872589111328125, -0.8177490234375, -0.762908935546875, -0.70806884765625, -0.653228759765625, -0.598388671875, -0.543548583984375, -0.48870849609375, -0.433868408203125, -0.3790283203125, -0.324188232421875, -0.26934814453125, -0.214508056640625, -0.15966796875, -0.104827880859375, -0.04998779296875, 0.004852294921875, 0.0596923828125, 0.114532470703125, 0.16937255859375, 0.224212646484375, 0.279052734375, 0.333892822265625, 0.38873291015625, 0.443572998046875, 0.4984130859375, 0.553253173828125, 0.60809326171875, 0.662933349609375, 0.7177734375, 0.772613525390625, 0.82745361328125, 0.882293701171875, 0.9371337890625, 0.991973876953125, 1.04681396484375, 1.101654052734375, 1.156494140625, 1.211334228515625, 1.26617431640625, 1.321014404296875, 1.3758544921875, 1.430694580078125, 1.48553466796875, 1.540374755859375, 1.59521484375, 1.650054931640625, 1.70489501953125, 1.759735107421875, 1.8145751953125, 1.869415283203125, 1.92425537109375, 1.979095458984375, 2.033935546875, 2.088775634765625, 2.14361572265625, 2.198455810546875, 2.2532958984375, 2.308135986328125, 2.36297607421875, 2.417816162109375, 2.47265625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 8.0, 5.0, 3.0, 6.0, 6.0, 14.0, 16.0, 19.0, 25.0, 30.0, 44.0, 48.0, 75.0, 76.0, 101.0, 79.0, 92.0, 70.0, 67.0, 53.0, 21.0, 29.0, 27.0, 21.0, 13.0, 11.0, 10.0, 7.0, 9.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.368492126464844e-05, -8.103344589471817e-05, -7.83819705247879e-05, -7.573049515485764e-05, -7.307901978492737e-05, -7.04275444149971e-05, -6.777606904506683e-05, -6.512459367513657e-05, -6.24731183052063e-05, -5.982164293527603e-05, -5.7170167565345764e-05, -5.45186921954155e-05, -5.186721682548523e-05, -4.921574145555496e-05, -4.6564266085624695e-05, -4.391279071569443e-05, -4.126131534576416e-05, -3.860983997583389e-05, -3.5958364605903625e-05, -3.330688923597336e-05, -3.065541386604309e-05, -2.8003938496112823e-05, -2.5352463126182556e-05, -2.270098775625229e-05, -2.004951238632202e-05, -1.7398037016391754e-05, -1.4746561646461487e-05, -1.209508627653122e-05, -9.443610906600952e-06, -6.792135536670685e-06, -4.1406601667404175e-06, -1.4891847968101501e-06, 1.1622905731201172e-06, 3.8137659430503845e-06, 6.465241312980652e-06, 9.11671668291092e-06, 1.1768192052841187e-05, 1.4419667422771454e-05, 1.707114279270172e-05, 1.972261816263199e-05, 2.2374093532562256e-05, 2.5025568902492523e-05, 2.767704427242279e-05, 3.0328519642353058e-05, 3.2979995012283325e-05, 3.563147038221359e-05, 3.828294575214386e-05, 4.093442112207413e-05, 4.3585896492004395e-05, 4.623737186193466e-05, 4.888884723186493e-05, 5.1540322601795197e-05, 5.4191797971725464e-05, 5.684327334165573e-05, 5.9494748711586e-05, 6.214622408151627e-05, 6.479769945144653e-05, 6.74491748213768e-05, 7.010065019130707e-05, 7.275212556123734e-05, 7.54036009311676e-05, 7.805507630109787e-05, 8.070655167102814e-05, 8.33580270409584e-05, 8.600950241088867e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 11.0, 15.0, 35.0, 42.0, 92.0, 184.0, 411.0, 1606.0, 14714.0, 1006623.0, 22033.0, 1913.0, 473.0, 172.0, 99.0, 51.0, 28.0, 18.0, 10.0, 5.0, 7.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6552734375, -0.6323318481445312, -0.6093902587890625, -0.5864486694335938, -0.563507080078125, -0.5405654907226562, -0.5176239013671875, -0.49468231201171875, -0.47174072265625, -0.44879913330078125, -0.4258575439453125, -0.40291595458984375, -0.379974365234375, -0.35703277587890625, -0.3340911865234375, -0.31114959716796875, -0.2882080078125, -0.26526641845703125, -0.2423248291015625, -0.21938323974609375, -0.196441650390625, -0.17350006103515625, -0.1505584716796875, -0.12761688232421875, -0.10467529296875, -0.08173370361328125, -0.0587921142578125, -0.03585052490234375, -0.012908935546875, 0.01003265380859375, 0.0329742431640625, 0.05591583251953125, 0.078857421875, 0.10179901123046875, 0.1247406005859375, 0.14768218994140625, 0.170623779296875, 0.19356536865234375, 0.2165069580078125, 0.23944854736328125, 0.26239013671875, 0.28533172607421875, 0.3082733154296875, 0.33121490478515625, 0.354156494140625, 0.37709808349609375, 0.4000396728515625, 0.42298126220703125, 0.4459228515625, 0.46886444091796875, 0.4918060302734375, 0.5147476196289062, 0.537689208984375, 0.5606307983398438, 0.5835723876953125, 0.6065139770507812, 0.62945556640625, 0.6523971557617188, 0.6753387451171875, 0.6982803344726562, 0.721221923828125, 0.7441635131835938, 0.7671051025390625, 0.7900466918945312, 0.81298828125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 8.0, 6.0, 9.0, 18.0, 117.0, 447.0, 318.0, 51.0, 11.0, 7.0, 4.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.572265625, -1.5386962890625, -1.505126953125, -1.4715576171875, -1.43798828125, -1.4044189453125, -1.370849609375, -1.3372802734375, -1.3037109375, -1.2701416015625, -1.236572265625, -1.2030029296875, -1.16943359375, -1.1358642578125, -1.102294921875, -1.0687255859375, -1.03515625, -1.0015869140625, -0.968017578125, -0.9344482421875, -0.90087890625, -0.8673095703125, -0.833740234375, -0.8001708984375, -0.7666015625, -0.7330322265625, -0.699462890625, -0.6658935546875, -0.63232421875, -0.5987548828125, -0.565185546875, -0.5316162109375, -0.498046875, -0.4644775390625, -0.430908203125, -0.3973388671875, -0.36376953125, -0.3302001953125, -0.296630859375, -0.2630615234375, -0.2294921875, -0.1959228515625, -0.162353515625, -0.1287841796875, -0.09521484375, -0.0616455078125, -0.028076171875, 0.0054931640625, 0.0390625, 0.0726318359375, 0.106201171875, 0.1397705078125, 0.17333984375, 0.2069091796875, 0.240478515625, 0.2740478515625, 0.3076171875, 0.3411865234375, 0.374755859375, 0.4083251953125, 0.44189453125, 0.4754638671875, 0.509033203125, 0.5426025390625, 0.576171875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 6.0, 19.0, 41.0, 177.0, 535.0, 190.0, 20.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.39830780029297, -21.948360443115234, -21.4984130859375, -21.0484676361084, -20.598520278930664, -20.14857292175293, -19.698625564575195, -19.248680114746094, -18.79873275756836, -18.348785400390625, -17.89883804321289, -17.44889259338379, -16.998945236206055, -16.54899787902832, -16.099050521850586, -15.649104118347168, -15.199156761169434, -14.7492094039917, -14.299263000488281, -13.849315643310547, -13.399369239807129, -12.949421882629395, -12.499475479125977, -12.049528121948242, -11.599580764770508, -11.149633407592773, -10.699687004089355, -10.249739646911621, -9.799793243408203, -9.349845886230469, -8.899898529052734, -8.449952125549316, -8.000005722045898, -7.550058841705322, -7.100111961364746, -6.650164604187012, -6.200218200683594, -5.750270843505859, -5.300323963165283, -4.850377082824707, -4.400430202484131, -3.9504833221435547, -3.5005364418029785, -3.0505893230438232, -2.600642442703247, -2.150695562362671, -1.7007484436035156, -1.2508015632629395, -0.8008546829223633, -0.35090774297714233, 0.09903919696807861, 0.5489861965179443, 0.9989330768585205, 1.4488799571990967, 1.898827075958252, 2.348773956298828, 2.7987208366394043, 3.2486677169799805, 3.6986145973205566, 4.148561477661133, 4.598508834838867, 5.048455238342285, 5.4984025955200195, 5.948349475860596, 6.398296356201172]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 5.0, 9.0, 7.0, 6.0, 12.0, 8.0, 17.0, 17.0, 16.0, 20.0, 23.0, 26.0, 28.0, 32.0, 32.0, 37.0, 42.0, 44.0, 53.0, 45.0, 45.0, 53.0, 43.0, 42.0, 31.0, 37.0, 26.0, 29.0, 38.0, 29.0, 22.0, 25.0, 16.0, 13.0, 11.0, 11.0, 13.0, 15.0, 2.0, 1.0, 7.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.7863407135009766, -3.668015480041504, -3.5496902465820312, -3.4313650131225586, -3.313039779663086, -3.1947145462036133, -3.0763893127441406, -2.958064079284668, -2.8397388458251953, -2.7214136123657227, -2.60308837890625, -2.4847631454467773, -2.3664379119873047, -2.248112678527832, -2.1297874450683594, -2.0114622116088867, -1.8931372165679932, -1.7748119831085205, -1.6564867496490479, -1.5381615161895752, -1.4198362827301025, -1.3015110492706299, -1.1831859350204468, -1.0648607015609741, -0.9465354681015015, -0.8282102346420288, -0.7098850011825562, -0.5915598273277283, -0.4732345938682556, -0.35490936040878296, -0.23658418655395508, -0.11825895309448242, 6.604194641113281e-05, 0.1183912605047226, 0.23671647906303406, 0.3550416827201843, 0.473366916179657, 0.5916921496391296, 0.7100173234939575, 0.8283425569534302, 0.9466677904129028, 1.0649930238723755, 1.1833182573318481, 1.3016433715820312, 1.419968605041504, 1.5382938385009766, 1.6566190719604492, 1.7749443054199219, 1.8932695388793945, 2.011594772338867, 2.12992000579834, 2.2482452392578125, 2.366570472717285, 2.484895706176758, 2.6032209396362305, 2.721546173095703, 2.839871406555176, 2.9581966400146484, 3.076521873474121, 3.1948471069335938, 3.3131723403930664, 3.431497573852539, 3.5498228073120117, 3.6681480407714844, 3.786473035812378]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 6.0, 14.0, 21.0, 46.0, 84.0, 194.0, 534.0, 1476.0, 8628.0, 4133710.0, 45410.0, 2831.0, 779.0, 285.0, 120.0, 53.0, 32.0, 22.0, 17.0, 6.0, 5.0, 5.0, 3.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86083984375, -0.83453369140625, -0.8082275390625, -0.78192138671875, -0.755615234375, -0.72930908203125, -0.7030029296875, -0.67669677734375, -0.650390625, -0.62408447265625, -0.5977783203125, -0.57147216796875, -0.545166015625, -0.51885986328125, -0.4925537109375, -0.46624755859375, -0.43994140625, -0.41363525390625, -0.3873291015625, -0.36102294921875, -0.334716796875, -0.30841064453125, -0.2821044921875, -0.25579833984375, -0.2294921875, -0.20318603515625, -0.1768798828125, -0.15057373046875, -0.124267578125, -0.09796142578125, -0.0716552734375, -0.04534912109375, -0.01904296875, 0.00726318359375, 0.0335693359375, 0.05987548828125, 0.086181640625, 0.11248779296875, 0.1387939453125, 0.16510009765625, 0.19140625, 0.21771240234375, 0.2440185546875, 0.27032470703125, 0.296630859375, 0.32293701171875, 0.3492431640625, 0.37554931640625, 0.40185546875, 0.42816162109375, 0.4544677734375, 0.48077392578125, 0.507080078125, 0.53338623046875, 0.5596923828125, 0.58599853515625, 0.6123046875, 0.63861083984375, 0.6649169921875, 0.69122314453125, 0.717529296875, 0.74383544921875, 0.7701416015625, 0.79644775390625, 0.82275390625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 6.0, 2.0, 11.0, 11.0, 12.0, 10.0, 17.0, 24.0, 24.0, 25.0, 25.0, 37.0, 49.0, 41.0, 44.0, 61.0, 51.0, 65.0, 68.0, 57.0, 67.0, 45.0, 46.0, 30.0, 28.0, 27.0, 19.0, 16.0, 7.0, 13.0, 6.0, 7.0, 11.0, 5.0, 6.0, 1.0, 5.0, 3.0, 1.0, 4.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.229248046875, -0.22238922119140625, -0.2155303955078125, -0.20867156982421875, -0.201812744140625, -0.19495391845703125, -0.1880950927734375, -0.18123626708984375, -0.17437744140625, -0.16751861572265625, -0.1606597900390625, -0.15380096435546875, -0.146942138671875, -0.14008331298828125, -0.1332244873046875, -0.12636566162109375, -0.1195068359375, -0.11264801025390625, -0.1057891845703125, -0.09893035888671875, -0.092071533203125, -0.08521270751953125, -0.0783538818359375, -0.07149505615234375, -0.06463623046875, -0.05777740478515625, -0.0509185791015625, -0.04405975341796875, -0.037200927734375, -0.03034210205078125, -0.0234832763671875, -0.01662445068359375, -0.009765625, -0.00290679931640625, 0.0039520263671875, 0.01081085205078125, 0.017669677734375, 0.02452850341796875, 0.0313873291015625, 0.03824615478515625, 0.04510498046875, 0.05196380615234375, 0.0588226318359375, 0.06568145751953125, 0.072540283203125, 0.07939910888671875, 0.0862579345703125, 0.09311676025390625, 0.0999755859375, 0.10683441162109375, 0.1136932373046875, 0.12055206298828125, 0.127410888671875, 0.13426971435546875, 0.1411285400390625, 0.14798736572265625, 0.15484619140625, 0.16170501708984375, 0.1685638427734375, 0.17542266845703125, 0.182281494140625, 0.18914031982421875, 0.1959991455078125, 0.20285797119140625, 0.209716796875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 11.0, 19.0, 17.0, 18.0, 33.0, 56.0, 47.0, 68.0, 148.0, 370.0, 1227.0, 11815.0, 4168553.0, 9954.0, 1180.0, 357.0, 113.0, 54.0, 44.0, 51.0, 36.0, 24.0, 18.0, 24.0, 13.0, 9.0, 2.0, 6.0, 1.0, 7.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.537109375, -1.494964599609375, -1.45281982421875, -1.410675048828125, -1.3685302734375, -1.326385498046875, -1.28424072265625, -1.242095947265625, -1.199951171875, -1.157806396484375, -1.11566162109375, -1.073516845703125, -1.0313720703125, -0.989227294921875, -0.94708251953125, -0.904937744140625, -0.86279296875, -0.820648193359375, -0.77850341796875, -0.736358642578125, -0.6942138671875, -0.652069091796875, -0.60992431640625, -0.567779541015625, -0.525634765625, -0.483489990234375, -0.44134521484375, -0.399200439453125, -0.3570556640625, -0.314910888671875, -0.27276611328125, -0.230621337890625, -0.1884765625, -0.146331787109375, -0.10418701171875, -0.062042236328125, -0.0198974609375, 0.022247314453125, 0.06439208984375, 0.106536865234375, 0.148681640625, 0.190826416015625, 0.23297119140625, 0.275115966796875, 0.3172607421875, 0.359405517578125, 0.40155029296875, 0.443695068359375, 0.48583984375, 0.527984619140625, 0.57012939453125, 0.612274169921875, 0.6544189453125, 0.696563720703125, 0.73870849609375, 0.780853271484375, 0.822998046875, 0.865142822265625, 0.90728759765625, 0.949432373046875, 0.9915771484375, 1.033721923828125, 1.07586669921875, 1.118011474609375, 1.16015625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 8.0, 27.0, 3703.0, 302.0, 34.0, 4.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1875, -0.175689697265625, -0.16387939453125, -0.152069091796875, -0.1402587890625, -0.128448486328125, -0.11663818359375, -0.104827880859375, -0.093017578125, -0.081207275390625, -0.06939697265625, -0.057586669921875, -0.0457763671875, -0.033966064453125, -0.02215576171875, -0.010345458984375, 0.00146484375, 0.013275146484375, 0.02508544921875, 0.036895751953125, 0.0487060546875, 0.060516357421875, 0.07232666015625, 0.084136962890625, 0.095947265625, 0.107757568359375, 0.11956787109375, 0.131378173828125, 0.1431884765625, 0.154998779296875, 0.16680908203125, 0.178619384765625, 0.1904296875, 0.202239990234375, 0.21405029296875, 0.225860595703125, 0.2376708984375, 0.249481201171875, 0.26129150390625, 0.273101806640625, 0.284912109375, 0.296722412109375, 0.30853271484375, 0.320343017578125, 0.3321533203125, 0.343963623046875, 0.35577392578125, 0.367584228515625, 0.37939453125, 0.391204833984375, 0.40301513671875, 0.414825439453125, 0.4266357421875, 0.438446044921875, 0.45025634765625, 0.462066650390625, 0.473876953125, 0.485687255859375, 0.49749755859375, 0.509307861328125, 0.5211181640625, 0.532928466796875, 0.54473876953125, 0.556549072265625, 0.568359375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 7.0, 24.0, 291.0, 522.0, 127.0, 21.0, 9.0, 10.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3711837530136108, -1.3162442445755005, -1.2613046169281006, -1.2063651084899902, -1.1514256000518799, -1.09648597240448, -1.0415464639663696, -0.9866068959236145, -0.9316673278808594, -0.8767277598381042, -0.8217881917953491, -0.7668486833572388, -0.7119091153144836, -0.6569695472717285, -0.6020300388336182, -0.547090470790863, -0.4921509027481079, -0.4372113347053528, -0.38227179646492004, -0.3273322582244873, -0.2723926901817322, -0.21745312213897705, -0.1625135838985443, -0.10757404565811157, -0.052634477615356445, 0.002305075526237488, 0.05724462866783142, 0.11218418180942535, 0.1671237349510193, 0.22206330299377441, 0.27700284123420715, 0.3319423794746399, 0.38688182830810547, 0.4418213963508606, 0.49676093459129333, 0.5517004728317261, 0.6066400408744812, 0.6615796089172363, 0.7165191173553467, 0.7714586853981018, 0.8263982534408569, 0.8813378214836121, 0.9362773895263672, 0.9912168979644775, 1.046156406402588, 1.1010960340499878, 1.1560355424880981, 1.210975170135498, 1.2659146785736084, 1.3208541870117188, 1.3757938146591187, 1.430733323097229, 1.485672950744629, 1.5406124591827393, 1.5955519676208496, 1.65049147605896, 1.7054311037063599, 1.7603706121444702, 1.8153102397918701, 1.8702497482299805, 1.9251892566680908, 1.9801288843154907, 2.0350685119628906, 2.090008020401001, 2.1449475288391113]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 3.0, 12.0, 11.0, 16.0, 23.0, 26.0, 32.0, 33.0, 39.0, 54.0, 49.0, 64.0, 57.0, 53.0, 52.0, 49.0, 51.0, 67.0, 47.0, 48.0, 44.0, 44.0, 31.0, 19.0, 18.0, 15.0, 15.0, 6.0, 8.0, 1.0, 5.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4719772934913635, -0.45801466703414917, -0.4440520107746124, -0.43008938431739807, -0.41612672805786133, -0.402164101600647, -0.3882014751434326, -0.3742388188838959, -0.36027616262435913, -0.3463135361671448, -0.33235087990760803, -0.3183882534503937, -0.30442559719085693, -0.2904629707336426, -0.2765003442764282, -0.2625376880168915, -0.24857506155967712, -0.23461242020130157, -0.22064977884292603, -0.20668715238571167, -0.19272449612617493, -0.17876186966896057, -0.16479922831058502, -0.15083658695220947, -0.13687394559383392, -0.12291130423545837, -0.10894866287708282, -0.09498602896928787, -0.08102338761091232, -0.06706074625253677, -0.05309811234474182, -0.03913547098636627, -0.025172829627990723, -0.011210190132260323, 0.0027524493634700775, 0.01671508699655533, 0.030677728354930878, 0.04464036971330643, 0.05860300362110138, 0.07256564497947693, 0.08652828633785248, 0.10049092769622803, 0.11445356905460358, 0.12841621041297913, 0.14237883687019348, 0.15634149312973022, 0.17030411958694458, 0.18426676094532013, 0.19822940230369568, 0.21219204366207123, 0.22615468502044678, 0.24011731147766113, 0.2540799677371979, 0.26804259419441223, 0.282005250453949, 0.29596787691116333, 0.3099305033683777, 0.32389312982559204, 0.3378557860851288, 0.35181841254234314, 0.3657810688018799, 0.37974369525909424, 0.3937063217163086, 0.40766897797584534, 0.4216316342353821]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 9.0, 9.0, 13.0, 12.0, 23.0, 48.0, 59.0, 96.0, 188.0, 267.0, 377.0, 663.0, 1289.0, 2434.0, 4851.0, 10532.0, 25230.0, 69480.0, 214143.0, 404117.0, 203894.0, 66562.0, 24173.0, 10021.0, 4692.0, 2323.0, 1202.0, 733.0, 419.0, 226.0, 155.0, 108.0, 61.0, 49.0, 26.0, 27.0, 14.0, 11.0, 5.0, 4.0, 4.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.23779296875, -0.23069000244140625, -0.2235870361328125, -0.21648406982421875, -0.209381103515625, -0.20227813720703125, -0.1951751708984375, -0.18807220458984375, -0.18096923828125, -0.17386627197265625, -0.1667633056640625, -0.15966033935546875, -0.152557373046875, -0.14545440673828125, -0.1383514404296875, -0.13124847412109375, -0.1241455078125, -0.11704254150390625, -0.1099395751953125, -0.10283660888671875, -0.095733642578125, -0.08863067626953125, -0.0815277099609375, -0.07442474365234375, -0.06732177734375, -0.06021881103515625, -0.0531158447265625, -0.04601287841796875, -0.038909912109375, -0.03180694580078125, -0.0247039794921875, -0.01760101318359375, -0.010498046875, -0.00339508056640625, 0.0037078857421875, 0.01081085205078125, 0.017913818359375, 0.02501678466796875, 0.0321197509765625, 0.03922271728515625, 0.04632568359375, 0.05342864990234375, 0.0605316162109375, 0.06763458251953125, 0.074737548828125, 0.08184051513671875, 0.0889434814453125, 0.09604644775390625, 0.1031494140625, 0.11025238037109375, 0.1173553466796875, 0.12445831298828125, 0.131561279296875, 0.13866424560546875, 0.1457672119140625, 0.15287017822265625, 0.15997314453125, 0.16707611083984375, 0.1741790771484375, 0.18128204345703125, 0.188385009765625, 0.19548797607421875, 0.2025909423828125, 0.20969390869140625, 0.216796875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 8.0, 5.0, 9.0, 6.0, 12.0, 12.0, 15.0, 22.0, 22.0, 28.0, 31.0, 40.0, 42.0, 55.0, 43.0, 41.0, 57.0, 67.0, 66.0, 61.0, 54.0, 45.0, 40.0, 38.0, 40.0, 32.0, 25.0, 12.0, 10.0, 14.0, 13.0, 7.0, 6.0, 6.0, 4.0, 3.0, 2.0, 0.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.23095703125, -0.22406387329101562, -0.21717071533203125, -0.21027755737304688, -0.2033843994140625, -0.19649124145507812, -0.18959808349609375, -0.18270492553710938, -0.175811767578125, -0.16891860961914062, -0.16202545166015625, -0.15513229370117188, -0.1482391357421875, -0.14134597778320312, -0.13445281982421875, -0.12755966186523438, -0.12066650390625, -0.11377334594726562, -0.10688018798828125, -0.09998703002929688, -0.0930938720703125, -0.08620071411132812, -0.07930755615234375, -0.07241439819335938, -0.065521240234375, -0.058628082275390625, -0.05173492431640625, -0.044841766357421875, -0.0379486083984375, -0.031055450439453125, -0.02416229248046875, -0.017269134521484375, -0.0103759765625, -0.003482818603515625, 0.00341033935546875, 0.010303497314453125, 0.0171966552734375, 0.024089813232421875, 0.03098297119140625, 0.037876129150390625, 0.044769287109375, 0.051662445068359375, 0.05855560302734375, 0.06544876098632812, 0.0723419189453125, 0.07923507690429688, 0.08612823486328125, 0.09302139282226562, 0.09991455078125, 0.10680770874023438, 0.11370086669921875, 0.12059402465820312, 0.1274871826171875, 0.13438034057617188, 0.14127349853515625, 0.14816665649414062, 0.155059814453125, 0.16195297241210938, 0.16884613037109375, 0.17573928833007812, 0.1826324462890625, 0.18952560424804688, 0.19641876220703125, 0.20331192016601562, 0.210205078125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 9.0, 5.0, 10.0, 11.0, 12.0, 25.0, 20.0, 29.0, 39.0, 49.0, 82.0, 103.0, 153.0, 203.0, 325.0, 550.0, 952.0, 1935.0, 5508.0, 23968.0, 221918.0, 693507.0, 79996.0, 12216.0, 3496.0, 1405.0, 732.0, 417.0, 291.0, 176.0, 105.0, 83.0, 40.0, 52.0, 35.0, 29.0, 18.0, 16.0, 13.0, 2.0, 5.0, 3.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.42333984375, -0.40981292724609375, -0.3962860107421875, -0.38275909423828125, -0.369232177734375, -0.35570526123046875, -0.3421783447265625, -0.32865142822265625, -0.31512451171875, -0.30159759521484375, -0.2880706787109375, -0.27454376220703125, -0.261016845703125, -0.24748992919921875, -0.2339630126953125, -0.22043609619140625, -0.2069091796875, -0.19338226318359375, -0.1798553466796875, -0.16632843017578125, -0.152801513671875, -0.13927459716796875, -0.1257476806640625, -0.11222076416015625, -0.09869384765625, -0.08516693115234375, -0.0716400146484375, -0.05811309814453125, -0.044586181640625, -0.03105926513671875, -0.0175323486328125, -0.00400543212890625, 0.009521484375, 0.02304840087890625, 0.0365753173828125, 0.05010223388671875, 0.063629150390625, 0.07715606689453125, 0.0906829833984375, 0.10420989990234375, 0.11773681640625, 0.13126373291015625, 0.1447906494140625, 0.15831756591796875, 0.171844482421875, 0.18537139892578125, 0.1988983154296875, 0.21242523193359375, 0.2259521484375, 0.23947906494140625, 0.2530059814453125, 0.26653289794921875, 0.280059814453125, 0.29358673095703125, 0.3071136474609375, 0.32064056396484375, 0.33416748046875, 0.34769439697265625, 0.3612213134765625, 0.37474822998046875, 0.388275146484375, 0.40180206298828125, 0.4153289794921875, 0.42885589599609375, 0.4423828125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 6.0, 9.0, 13.0, 7.0, 14.0, 20.0, 14.0, 24.0, 26.0, 26.0, 28.0, 41.0, 38.0, 42.0, 43.0, 55.0, 47.0, 53.0, 41.0, 54.0, 37.0, 42.0, 31.0, 39.0, 39.0, 29.0, 28.0, 31.0, 24.0, 14.0, 18.0, 12.0, 9.0, 11.0, 3.0, 4.0, 4.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.994140625, -0.9647750854492188, -0.9354095458984375, -0.9060440063476562, -0.876678466796875, -0.8473129272460938, -0.8179473876953125, -0.7885818481445312, -0.75921630859375, -0.7298507690429688, -0.7004852294921875, -0.6711196899414062, -0.641754150390625, -0.6123886108398438, -0.5830230712890625, -0.5536575317382812, -0.5242919921875, -0.49492645263671875, -0.4655609130859375, -0.43619537353515625, -0.406829833984375, -0.37746429443359375, -0.3480987548828125, -0.31873321533203125, -0.28936767578125, -0.26000213623046875, -0.2306365966796875, -0.20127105712890625, -0.171905517578125, -0.14253997802734375, -0.1131744384765625, -0.08380889892578125, -0.054443359375, -0.02507781982421875, 0.0042877197265625, 0.03365325927734375, 0.063018798828125, 0.09238433837890625, 0.1217498779296875, 0.15111541748046875, 0.18048095703125, 0.20984649658203125, 0.2392120361328125, 0.26857757568359375, 0.297943115234375, 0.32730865478515625, 0.3566741943359375, 0.38603973388671875, 0.4154052734375, 0.44477081298828125, 0.4741363525390625, 0.5035018920898438, 0.532867431640625, 0.5622329711914062, 0.5915985107421875, 0.6209640502929688, 0.65032958984375, 0.6796951293945312, 0.7090606689453125, 0.7384262084960938, 0.767791748046875, 0.7971572875976562, 0.8265228271484375, 0.8558883666992188, 0.88525390625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 7.0, 3.0, 3.0, 9.0, 10.0, 28.0, 42.0, 111.0, 512.0, 9398.0, 1029636.0, 8062.0, 554.0, 109.0, 30.0, 18.0, 9.0, 8.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.15234375, -1.1238784790039062, -1.0954132080078125, -1.0669479370117188, -1.038482666015625, -1.0100173950195312, -0.9815521240234375, -0.9530868530273438, -0.92462158203125, -0.8961563110351562, -0.8676910400390625, -0.8392257690429688, -0.810760498046875, -0.7822952270507812, -0.7538299560546875, -0.7253646850585938, -0.6968994140625, -0.6684341430664062, -0.6399688720703125, -0.6115036010742188, -0.583038330078125, -0.5545730590820312, -0.5261077880859375, -0.49764251708984375, -0.46917724609375, -0.44071197509765625, -0.4122467041015625, -0.38378143310546875, -0.355316162109375, -0.32685089111328125, -0.2983856201171875, -0.26992034912109375, -0.241455078125, -0.21298980712890625, -0.1845245361328125, -0.15605926513671875, -0.127593994140625, -0.09912872314453125, -0.0706634521484375, -0.04219818115234375, -0.01373291015625, 0.01473236083984375, 0.0431976318359375, 0.07166290283203125, 0.100128173828125, 0.12859344482421875, 0.1570587158203125, 0.18552398681640625, 0.2139892578125, 0.24245452880859375, 0.2709197998046875, 0.29938507080078125, 0.327850341796875, 0.35631561279296875, 0.3847808837890625, 0.41324615478515625, 0.44171142578125, 0.47017669677734375, 0.4986419677734375, 0.5271072387695312, 0.555572509765625, 0.5840377807617188, 0.6125030517578125, 0.6409683227539062, 0.66943359375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 1.0, 6.0, 8.0, 5.0, 7.0, 8.0, 12.0, 9.0, 10.0, 20.0, 29.0, 31.0, 44.0, 63.0, 75.0, 112.0, 103.0, 109.0, 91.0, 64.0, 41.0, 30.0, 21.0, 15.0, 14.0, 8.0, 11.0, 12.0, 14.0, 3.0, 7.0, 6.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.341934204101562e-05, -6.103515625e-05, -5.8650970458984375e-05, -5.626678466796875e-05, -5.3882598876953125e-05, -5.14984130859375e-05, -4.9114227294921875e-05, -4.673004150390625e-05, -4.4345855712890625e-05, -4.1961669921875e-05, -3.9577484130859375e-05, -3.719329833984375e-05, -3.4809112548828125e-05, -3.24249267578125e-05, -3.0040740966796875e-05, -2.765655517578125e-05, -2.5272369384765625e-05, -2.288818359375e-05, -2.0503997802734375e-05, -1.811981201171875e-05, -1.5735626220703125e-05, -1.33514404296875e-05, -1.0967254638671875e-05, -8.58306884765625e-06, -6.198883056640625e-06, -3.814697265625e-06, -1.430511474609375e-06, 9.5367431640625e-07, 3.337860107421875e-06, 5.7220458984375e-06, 8.106231689453125e-06, 1.049041748046875e-05, 1.2874603271484375e-05, 1.52587890625e-05, 1.7642974853515625e-05, 2.002716064453125e-05, 2.2411346435546875e-05, 2.47955322265625e-05, 2.7179718017578125e-05, 2.956390380859375e-05, 3.1948089599609375e-05, 3.4332275390625e-05, 3.6716461181640625e-05, 3.910064697265625e-05, 4.1484832763671875e-05, 4.38690185546875e-05, 4.6253204345703125e-05, 4.863739013671875e-05, 5.1021575927734375e-05, 5.340576171875e-05, 5.5789947509765625e-05, 5.817413330078125e-05, 6.0558319091796875e-05, 6.29425048828125e-05, 6.532669067382812e-05, 6.771087646484375e-05, 7.009506225585938e-05, 7.2479248046875e-05, 7.486343383789062e-05, 7.724761962890625e-05, 7.963180541992188e-05, 8.20159912109375e-05, 8.440017700195312e-05, 8.678436279296875e-05, 8.916854858398438e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 3.0, 7.0, 11.0, 8.0, 11.0, 17.0, 23.0, 38.0, 60.0, 89.0, 143.0, 285.0, 570.0, 1457.0, 4801.0, 31202.0, 691646.0, 296793.0, 16125.0, 3172.0, 1089.0, 427.0, 218.0, 122.0, 76.0, 53.0, 34.0, 25.0, 16.0, 13.0, 5.0, 6.0, 5.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.272216796875, -0.2644062042236328, -0.2565956115722656, -0.24878501892089844, -0.24097442626953125, -0.23316383361816406, -0.22535324096679688, -0.2175426483154297, -0.2097320556640625, -0.2019214630126953, -0.19411087036132812, -0.18630027770996094, -0.17848968505859375, -0.17067909240722656, -0.16286849975585938, -0.1550579071044922, -0.147247314453125, -0.1394367218017578, -0.13162612915039062, -0.12381553649902344, -0.11600494384765625, -0.10819435119628906, -0.10038375854492188, -0.09257316589355469, -0.0847625732421875, -0.07695198059082031, -0.06914138793945312, -0.06133079528808594, -0.05352020263671875, -0.04570960998535156, -0.037899017333984375, -0.030088424682617188, -0.02227783203125, -0.014467239379882812, -0.006656646728515625, 0.0011539459228515625, 0.00896453857421875, 0.016775131225585938, 0.024585723876953125, 0.03239631652832031, 0.0402069091796875, 0.04801750183105469, 0.055828094482421875, 0.06363868713378906, 0.07144927978515625, 0.07925987243652344, 0.08707046508789062, 0.09488105773925781, 0.102691650390625, 0.11050224304199219, 0.11831283569335938, 0.12612342834472656, 0.13393402099609375, 0.14174461364746094, 0.14955520629882812, 0.1573657989501953, 0.1651763916015625, 0.1729869842529297, 0.18079757690429688, 0.18860816955566406, 0.19641876220703125, 0.20422935485839844, 0.21203994750976562, 0.2198505401611328, 0.2276611328125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 1.0, 1.0, 2.0, 4.0, 3.0, 9.0, 11.0, 37.0, 44.0, 82.0, 107.0, 158.0, 165.0, 127.0, 98.0, 66.0, 25.0, 19.0, 14.0, 6.0, 2.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4384765625, -0.4256553649902344, -0.41283416748046875, -0.4000129699707031, -0.3871917724609375, -0.3743705749511719, -0.36154937744140625, -0.3487281799316406, -0.335906982421875, -0.3230857849121094, -0.31026458740234375, -0.2974433898925781, -0.2846221923828125, -0.2718009948730469, -0.25897979736328125, -0.24615859985351562, -0.23333740234375, -0.22051620483398438, -0.20769500732421875, -0.19487380981445312, -0.1820526123046875, -0.16923141479492188, -0.15641021728515625, -0.14358901977539062, -0.130767822265625, -0.11794662475585938, -0.10512542724609375, -0.09230422973632812, -0.0794830322265625, -0.06666183471679688, -0.05384063720703125, -0.041019439697265625, -0.0281982421875, -0.015377044677734375, -0.00255584716796875, 0.010265350341796875, 0.0230865478515625, 0.035907745361328125, 0.04872894287109375, 0.061550140380859375, 0.074371337890625, 0.08719253540039062, 0.10001373291015625, 0.11283493041992188, 0.1256561279296875, 0.13847732543945312, 0.15129852294921875, 0.16411972045898438, 0.17694091796875, 0.18976211547851562, 0.20258331298828125, 0.21540451049804688, 0.2282257080078125, 0.24104690551757812, 0.25386810302734375, 0.2666893005371094, 0.279510498046875, 0.2923316955566406, 0.30515289306640625, 0.3179740905761719, 0.3307952880859375, 0.3436164855957031, 0.35643768310546875, 0.3692588806152344, 0.382080078125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 4.0, 22.0, 50.0, 150.0, 305.0, 285.0, 135.0, 32.0, 9.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.243878364562988, -7.036629676818848, -6.829380989074707, -6.622132301330566, -6.414883613586426, -6.207634925842285, -6.0003862380981445, -5.793137550354004, -5.585888862609863, -5.378640174865723, -5.171391487121582, -4.964142799377441, -4.756894111633301, -4.54964542388916, -4.3423967361450195, -4.135148048400879, -3.9278995990753174, -3.7206509113311768, -3.513402223587036, -3.3061535358428955, -3.098904848098755, -2.8916563987731934, -2.6844077110290527, -2.477159023284912, -2.2699103355407715, -2.062661647796631, -1.8554129600524902, -1.6481642723083496, -1.440915584564209, -1.233667016029358, -1.0264183282852173, -0.8191696405410767, -0.6119208335876465, -0.40467214584350586, -0.19742348790168762, 0.009825170040130615, 0.21707385778427124, 0.4243224859237671, 0.6315711736679077, 0.8388198614120483, 1.046068549156189, 1.2533172369003296, 1.4605659246444702, 1.6678144931793213, 1.875063180923462, 2.0823118686676025, 2.289560556411743, 2.496809244155884, 2.7040579319000244, 2.911306619644165, 3.1185553073883057, 3.3258039951324463, 3.533052682876587, 3.7403011322021484, 3.947549819946289, 4.15479850769043, 4.36204719543457, 4.569295883178711, 4.776544570922852, 4.983793258666992, 5.191041946411133, 5.398290634155273, 5.605539321899414, 5.812788009643555, 6.020036697387695]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 5.0, 7.0, 5.0, 8.0, 8.0, 11.0, 12.0, 9.0, 11.0, 18.0, 24.0, 17.0, 29.0, 23.0, 27.0, 22.0, 37.0, 50.0, 43.0, 42.0, 53.0, 53.0, 42.0, 44.0, 49.0, 47.0, 45.0, 29.0, 27.0, 25.0, 31.0, 24.0, 22.0, 15.0, 17.0, 14.0, 18.0, 6.0, 7.0, 7.0, 4.0, 3.0, 8.0, 3.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.311081886291504, -4.176558971405029, -4.042036056518555, -3.90751314163208, -3.7729902267456055, -3.638467311859131, -3.503944158554077, -3.3694212436676025, -3.234898328781128, -3.1003754138946533, -2.9658524990081787, -2.831329584121704, -2.6968064308166504, -2.562283515930176, -2.427760601043701, -2.2932376861572266, -2.158714771270752, -2.0241918563842773, -1.8896689414978027, -1.7551459074020386, -1.620622992515564, -1.4861000776290894, -1.3515770435333252, -1.2170541286468506, -1.082531213760376, -0.9480082988739014, -0.813485324382782, -0.6789623498916626, -0.544439435005188, -0.4099165201187134, -0.275393545627594, -0.1408705711364746, -0.006347179412841797, 0.1281757652759552, 0.2626987099647522, 0.3972216546535492, 0.5317445993423462, 0.6662675142288208, 0.8007904887199402, 0.9353134632110596, 1.0698363780975342, 1.2043592929840088, 1.3388822078704834, 1.4734052419662476, 1.6079281568527222, 1.7424510717391968, 1.876974105834961, 2.0114970207214355, 2.14601993560791, 2.2805428504943848, 2.4150657653808594, 2.549588680267334, 2.6841115951538086, 2.818634510040283, 2.953157663345337, 3.0876805782318115, 3.222203493118286, 3.3567264080047607, 3.4912493228912354, 3.62577223777771, 3.7602953910827637, 3.8948183059692383, 4.029341220855713, 4.1638641357421875, 4.298387050628662]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 7.0, 9.0, 6.0, 19.0, 21.0, 35.0, 32.0, 70.0, 106.0, 210.0, 407.0, 946.0, 3677.0, 33943.0, 4091754.0, 55981.0, 4798.0, 1211.0, 448.0, 227.0, 133.0, 79.0, 45.0, 37.0, 21.0, 18.0, 7.0, 5.0, 7.0, 4.0, 3.0, 5.0, 1.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.480224609375, -0.4614448547363281, -0.44266510009765625, -0.4238853454589844, -0.4051055908203125, -0.3863258361816406, -0.36754608154296875, -0.3487663269042969, -0.329986572265625, -0.3112068176269531, -0.29242706298828125, -0.2736473083496094, -0.2548675537109375, -0.23608779907226562, -0.21730804443359375, -0.19852828979492188, -0.17974853515625, -0.16096878051757812, -0.14218902587890625, -0.12340927124023438, -0.1046295166015625, -0.08584976196289062, -0.06707000732421875, -0.048290252685546875, -0.029510498046875, -0.010730743408203125, 0.00804901123046875, 0.026828765869140625, 0.0456085205078125, 0.06438827514648438, 0.08316802978515625, 0.10194778442382812, 0.1207275390625, 0.13950729370117188, 0.15828704833984375, 0.17706680297851562, 0.1958465576171875, 0.21462631225585938, 0.23340606689453125, 0.2521858215332031, 0.270965576171875, 0.2897453308105469, 0.30852508544921875, 0.3273048400878906, 0.3460845947265625, 0.3648643493652344, 0.38364410400390625, 0.4024238586425781, 0.42120361328125, 0.4399833679199219, 0.45876312255859375, 0.4775428771972656, 0.4963226318359375, 0.5151023864746094, 0.5338821411132812, 0.5526618957519531, 0.571441650390625, 0.5902214050292969, 0.6090011596679688, 0.6277809143066406, 0.6465606689453125, 0.6653404235839844, 0.6841201782226562, 0.7028999328613281, 0.7216796875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 5.0, 6.0, 10.0, 17.0, 22.0, 16.0, 36.0, 39.0, 52.0, 62.0, 57.0, 74.0, 72.0, 84.0, 84.0, 72.0, 66.0, 52.0, 30.0, 29.0, 21.0, 17.0, 10.0, 15.0, 9.0, 10.0, 4.0, 1.0, 7.0, 5.0, 2.0, 5.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2939453125, -0.28488922119140625, -0.2758331298828125, -0.26677703857421875, -0.257720947265625, -0.24866485595703125, -0.2396087646484375, -0.23055267333984375, -0.22149658203125, -0.21244049072265625, -0.2033843994140625, -0.19432830810546875, -0.185272216796875, -0.17621612548828125, -0.1671600341796875, -0.15810394287109375, -0.1490478515625, -0.13999176025390625, -0.1309356689453125, -0.12187957763671875, -0.112823486328125, -0.10376739501953125, -0.0947113037109375, -0.08565521240234375, -0.07659912109375, -0.06754302978515625, -0.0584869384765625, -0.04943084716796875, -0.040374755859375, -0.03131866455078125, -0.0222625732421875, -0.01320648193359375, -0.004150390625, 0.00490570068359375, 0.0139617919921875, 0.02301788330078125, 0.032073974609375, 0.04113006591796875, 0.0501861572265625, 0.05924224853515625, 0.06829833984375, 0.07735443115234375, 0.0864105224609375, 0.09546661376953125, 0.104522705078125, 0.11357879638671875, 0.1226348876953125, 0.13169097900390625, 0.1407470703125, 0.14980316162109375, 0.1588592529296875, 0.16791534423828125, 0.176971435546875, 0.18602752685546875, 0.1950836181640625, 0.20413970947265625, 0.21319580078125, 0.22225189208984375, 0.2313079833984375, 0.24036407470703125, 0.249420166015625, 0.25847625732421875, 0.2675323486328125, 0.27658843994140625, 0.28564453125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 6.0, 9.0, 11.0, 13.0, 17.0, 23.0, 24.0, 37.0, 47.0, 65.0, 92.0, 83.0, 118.0, 125.0, 150.0, 159.0, 206.0, 388.0, 9716.0, 4181005.0, 724.0, 270.0, 182.0, 158.0, 144.0, 92.0, 81.0, 81.0, 66.0, 45.0, 29.0, 22.0, 22.0, 22.0, 17.0, 9.0, 5.0, 9.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.708984375, -3.597320556640625, -3.48565673828125, -3.373992919921875, -3.2623291015625, -3.150665283203125, -3.03900146484375, -2.927337646484375, -2.815673828125, -2.704010009765625, -2.59234619140625, -2.480682373046875, -2.3690185546875, -2.257354736328125, -2.14569091796875, -2.034027099609375, -1.92236328125, -1.810699462890625, -1.69903564453125, -1.587371826171875, -1.4757080078125, -1.364044189453125, -1.25238037109375, -1.140716552734375, -1.029052734375, -0.917388916015625, -0.80572509765625, -0.694061279296875, -0.5823974609375, -0.470733642578125, -0.35906982421875, -0.247406005859375, -0.1357421875, -0.024078369140625, 0.08758544921875, 0.199249267578125, 0.3109130859375, 0.422576904296875, 0.53424072265625, 0.645904541015625, 0.757568359375, 0.869232177734375, 0.98089599609375, 1.092559814453125, 1.2042236328125, 1.315887451171875, 1.42755126953125, 1.539215087890625, 1.65087890625, 1.762542724609375, 1.87420654296875, 1.985870361328125, 2.0975341796875, 2.209197998046875, 2.32086181640625, 2.432525634765625, 2.544189453125, 2.655853271484375, 2.76751708984375, 2.879180908203125, 2.9908447265625, 3.102508544921875, 3.21417236328125, 3.325836181640625, 3.4375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 249.0, 3829.0, 7.0, 1.0, 0.0, 1.0], "bins": [-4.125, -4.055194854736328, -3.9853897094726562, -3.9155845642089844, -3.8457794189453125, -3.7759742736816406, -3.7061691284179688, -3.636363983154297, -3.566558837890625, -3.496753692626953, -3.4269485473632812, -3.3571434020996094, -3.2873382568359375, -3.2175331115722656, -3.1477279663085938, -3.077922821044922, -3.00811767578125, -2.938312530517578, -2.8685073852539062, -2.7987022399902344, -2.7288970947265625, -2.6590919494628906, -2.5892868041992188, -2.519481658935547, -2.449676513671875, -2.379871368408203, -2.3100662231445312, -2.2402610778808594, -2.1704559326171875, -2.1006507873535156, -2.0308456420898438, -1.9610404968261719, -1.8912353515625, -1.8214302062988281, -1.7516250610351562, -1.6818199157714844, -1.6120147705078125, -1.5422096252441406, -1.4724044799804688, -1.4025993347167969, -1.332794189453125, -1.2629890441894531, -1.1931838989257812, -1.1233787536621094, -1.0535736083984375, -0.9837684631347656, -0.9139633178710938, -0.8441581726074219, -0.77435302734375, -0.7045478820800781, -0.6347427368164062, -0.5649375915527344, -0.4951324462890625, -0.4253273010253906, -0.35552215576171875, -0.2857170104980469, -0.215911865234375, -0.14610671997070312, -0.07630157470703125, -0.006496429443359375, 0.0633087158203125, 0.13311386108398438, 0.20291900634765625, 0.2727241516113281, 0.342529296875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 30.0, 225.0, 634.0, 92.0, 15.0, 4.0, 3.0, 0.0, 1.0, 2.0], "bins": [-15.436528205871582, -15.161609649658203, -14.886691093444824, -14.611773490905762, -14.336854934692383, -14.061936378479004, -13.787017822265625, -13.512100219726562, -13.237181663513184, -12.962263107299805, -12.687344551086426, -12.412426948547363, -12.137508392333984, -11.862589836120605, -11.587671279907227, -11.312753677368164, -11.037834167480469, -10.76291561126709, -10.487997055053711, -10.213079452514648, -9.93816089630127, -9.66324234008789, -9.388323783874512, -9.113405227661133, -8.83848762512207, -8.563569068908691, -8.288650512695312, -8.01373291015625, -7.738814353942871, -7.463895797729492, -7.188977241516113, -6.914059162139893, -6.63914155960083, -6.364223003387451, -6.0893049240112305, -5.814386367797852, -5.539468288421631, -5.264549732208252, -4.989631652832031, -4.714713096618652, -4.439794540405273, -4.1648759841918945, -3.889957904815674, -3.615039348602295, -3.340121269226074, -3.0652027130126953, -2.7902843952178955, -2.5153660774230957, -2.240447998046875, -1.9655296802520752, -1.6906113624572754, -1.415692925453186, -1.1407746076583862, -0.8658562898635864, -0.5909378528594971, -0.31601953506469727, -0.04110121726989746, 0.23381713032722473, 0.5087354779243469, 0.7836538553237915, 1.0585721731185913, 1.3334904909133911, 1.6084089279174805, 1.8833272457122803, 2.15824556350708]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 11.0, 23.0, 25.0, 33.0, 66.0, 78.0, 99.0, 165.0, 153.0, 121.0, 88.0, 45.0, 25.0, 24.0, 17.0, 11.0, 6.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.094334602355957, -5.877405166625977, -5.660475730895996, -5.443546295166016, -5.226616859436035, -5.009687423706055, -4.792757987976074, -4.575828552246094, -4.358899116516113, -4.141969680786133, -3.9250402450561523, -3.708110809326172, -3.4911813735961914, -3.274251937866211, -3.0573225021362305, -2.84039306640625, -2.6234633922576904, -2.40653395652771, -2.1896045207977295, -1.972675085067749, -1.7557456493377686, -1.5388160943984985, -1.321886658668518, -1.1049572229385376, -0.8880277872085571, -0.6710983514785767, -0.4541688859462738, -0.23723942041397095, -0.02030998468399048, 0.19661951065063477, 0.41354894638061523, 0.6304783821105957, 0.8474078178405762, 1.0643372535705566, 1.281266689300537, 1.4981961250305176, 1.715125560760498, 1.932055115699768, 2.148984432220459, 2.3659138679504395, 2.58284330368042, 2.7997727394104004, 3.016702175140381, 3.2336316108703613, 3.450561046600342, 3.6674904823303223, 3.8844199180603027, 4.101349353790283, 4.318279266357422, 4.535208702087402, 4.752138137817383, 4.969067573547363, 5.185997009277344, 5.402926445007324, 5.619855880737305, 5.836785316467285, 6.053714752197266, 6.270644187927246, 6.487573623657227, 6.704503059387207, 6.9214324951171875, 7.138361930847168, 7.355291366577148, 7.572220802307129, 7.789150238037109]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 7.0, 6.0, 12.0, 15.0, 25.0, 28.0, 53.0, 80.0, 141.0, 256.0, 433.0, 840.0, 2154.0, 6479.0, 27877.0, 233341.0, 677445.0, 78909.0, 13862.0, 3763.0, 1387.0, 622.0, 317.0, 192.0, 116.0, 62.0, 50.0, 22.0, 19.0, 14.0, 8.0, 5.0, 4.0, 0.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.69287109375, -0.6714019775390625, -0.649932861328125, -0.6284637451171875, -0.60699462890625, -0.5855255126953125, -0.564056396484375, -0.5425872802734375, -0.5211181640625, -0.4996490478515625, -0.478179931640625, -0.4567108154296875, -0.43524169921875, -0.4137725830078125, -0.392303466796875, -0.3708343505859375, -0.349365234375, -0.3278961181640625, -0.306427001953125, -0.2849578857421875, -0.26348876953125, -0.2420196533203125, -0.220550537109375, -0.1990814208984375, -0.1776123046875, -0.1561431884765625, -0.134674072265625, -0.1132049560546875, -0.09173583984375, -0.0702667236328125, -0.048797607421875, -0.0273284912109375, -0.005859375, 0.0156097412109375, 0.037078857421875, 0.0585479736328125, 0.08001708984375, 0.1014862060546875, 0.122955322265625, 0.1444244384765625, 0.1658935546875, 0.1873626708984375, 0.208831787109375, 0.2303009033203125, 0.25177001953125, 0.2732391357421875, 0.294708251953125, 0.3161773681640625, 0.337646484375, 0.3591156005859375, 0.380584716796875, 0.4020538330078125, 0.42352294921875, 0.4449920654296875, 0.466461181640625, 0.4879302978515625, 0.5093994140625, 0.5308685302734375, 0.552337646484375, 0.5738067626953125, 0.59527587890625, 0.6167449951171875, 0.638214111328125, 0.6596832275390625, 0.68115234375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 0.0, 3.0, 4.0, 8.0, 11.0, 8.0, 28.0, 29.0, 32.0, 36.0, 55.0, 63.0, 78.0, 84.0, 92.0, 97.0, 80.0, 71.0, 63.0, 44.0, 31.0, 26.0, 14.0, 12.0, 11.0, 7.0, 5.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51806640625, -0.5005340576171875, -0.483001708984375, -0.4654693603515625, -0.44793701171875, -0.4304046630859375, -0.412872314453125, -0.3953399658203125, -0.3778076171875, -0.3602752685546875, -0.342742919921875, -0.3252105712890625, -0.30767822265625, -0.2901458740234375, -0.272613525390625, -0.2550811767578125, -0.237548828125, -0.2200164794921875, -0.202484130859375, -0.1849517822265625, -0.16741943359375, -0.1498870849609375, -0.132354736328125, -0.1148223876953125, -0.0972900390625, -0.0797576904296875, -0.062225341796875, -0.0446929931640625, -0.02716064453125, -0.0096282958984375, 0.007904052734375, 0.0254364013671875, 0.04296875, 0.0605010986328125, 0.078033447265625, 0.0955657958984375, 0.11309814453125, 0.1306304931640625, 0.148162841796875, 0.1656951904296875, 0.1832275390625, 0.2007598876953125, 0.218292236328125, 0.2358245849609375, 0.25335693359375, 0.2708892822265625, 0.288421630859375, 0.3059539794921875, 0.323486328125, 0.3410186767578125, 0.358551025390625, 0.3760833740234375, 0.39361572265625, 0.4111480712890625, 0.428680419921875, 0.4462127685546875, 0.4637451171875, 0.4812774658203125, 0.498809814453125, 0.5163421630859375, 0.53387451171875, 0.5514068603515625, 0.568939208984375, 0.5864715576171875, 0.60400390625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 5.0, 4.0, 5.0, 12.0, 36.0, 79.0, 196.0, 610.0, 3402.0, 1027021.0, 15698.0, 971.0, 298.0, 112.0, 56.0, 19.0, 13.0, 5.0, 3.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.232421875, -3.1197509765625, -3.007080078125, -2.8944091796875, -2.78173828125, -2.6690673828125, -2.556396484375, -2.4437255859375, -2.3310546875, -2.2183837890625, -2.105712890625, -1.9930419921875, -1.88037109375, -1.7677001953125, -1.655029296875, -1.5423583984375, -1.4296875, -1.3170166015625, -1.204345703125, -1.0916748046875, -0.97900390625, -0.8663330078125, -0.753662109375, -0.6409912109375, -0.5283203125, -0.4156494140625, -0.302978515625, -0.1903076171875, -0.07763671875, 0.0350341796875, 0.147705078125, 0.2603759765625, 0.373046875, 0.4857177734375, 0.598388671875, 0.7110595703125, 0.82373046875, 0.9364013671875, 1.049072265625, 1.1617431640625, 1.2744140625, 1.3870849609375, 1.499755859375, 1.6124267578125, 1.72509765625, 1.8377685546875, 1.950439453125, 2.0631103515625, 2.17578125, 2.2884521484375, 2.401123046875, 2.5137939453125, 2.62646484375, 2.7391357421875, 2.851806640625, 2.9644775390625, 3.0771484375, 3.1898193359375, 3.302490234375, 3.4151611328125, 3.52783203125, 3.6405029296875, 3.753173828125, 3.8658447265625, 3.978515625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 10.0, 28.0, 92.0, 268.0, 270.0, 209.0, 95.0, 27.0, 10.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.140625, -7.91046142578125, -7.6802978515625, -7.45013427734375, -7.219970703125, -6.98980712890625, -6.7596435546875, -6.52947998046875, -6.29931640625, -6.06915283203125, -5.8389892578125, -5.60882568359375, -5.378662109375, -5.14849853515625, -4.9183349609375, -4.68817138671875, -4.4580078125, -4.22784423828125, -3.9976806640625, -3.76751708984375, -3.537353515625, -3.30718994140625, -3.0770263671875, -2.84686279296875, -2.61669921875, -2.38653564453125, -2.1563720703125, -1.92620849609375, -1.696044921875, -1.46588134765625, -1.2357177734375, -1.00555419921875, -0.775390625, -0.54522705078125, -0.3150634765625, -0.08489990234375, 0.145263671875, 0.37542724609375, 0.6055908203125, 0.83575439453125, 1.06591796875, 1.29608154296875, 1.5262451171875, 1.75640869140625, 1.986572265625, 2.21673583984375, 2.4468994140625, 2.67706298828125, 2.9072265625, 3.13739013671875, 3.3675537109375, 3.59771728515625, 3.827880859375, 4.05804443359375, 4.2882080078125, 4.51837158203125, 4.74853515625, 4.97869873046875, 5.2088623046875, 5.43902587890625, 5.669189453125, 5.89935302734375, 6.1295166015625, 6.35968017578125, 6.58984375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 11.0, 31.0, 120.0, 1040.0, 1042332.0, 4711.0, 225.0, 45.0, 19.0, 10.0, 3.0, 6.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.30859375, -4.202667236328125, -4.09674072265625, -3.990814208984375, -3.8848876953125, -3.778961181640625, -3.67303466796875, -3.567108154296875, -3.461181640625, -3.355255126953125, -3.24932861328125, -3.143402099609375, -3.0374755859375, -2.931549072265625, -2.82562255859375, -2.719696044921875, -2.61376953125, -2.507843017578125, -2.40191650390625, -2.295989990234375, -2.1900634765625, -2.084136962890625, -1.97821044921875, -1.872283935546875, -1.766357421875, -1.660430908203125, -1.55450439453125, -1.448577880859375, -1.3426513671875, -1.236724853515625, -1.13079833984375, -1.024871826171875, -0.9189453125, -0.813018798828125, -0.70709228515625, -0.601165771484375, -0.4952392578125, -0.389312744140625, -0.28338623046875, -0.177459716796875, -0.071533203125, 0.034393310546875, 0.14031982421875, 0.246246337890625, 0.3521728515625, 0.458099365234375, 0.56402587890625, 0.669952392578125, 0.77587890625, 0.881805419921875, 0.98773193359375, 1.093658447265625, 1.1995849609375, 1.305511474609375, 1.41143798828125, 1.517364501953125, 1.623291015625, 1.729217529296875, 1.83514404296875, 1.941070556640625, 2.0469970703125, 2.152923583984375, 2.25885009765625, 2.364776611328125, 2.470703125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 1.0, 5.0, 9.0, 7.0, 4.0, 10.0, 8.0, 17.0, 19.0, 32.0, 26.0, 57.0, 68.0, 122.0, 171.0, 132.0, 76.0, 56.0, 38.0, 37.0, 22.0, 14.0, 5.0, 6.0, 11.0, 8.0, 5.0, 6.0, 6.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00010693073272705078, -0.00010365061461925507, -0.00010037049651145935, -9.709037840366364e-05, -9.381026029586792e-05, -9.05301421880722e-05, -8.725002408027649e-05, -8.396990597248077e-05, -8.068978786468506e-05, -7.740966975688934e-05, -7.412955164909363e-05, -7.084943354129791e-05, -6.75693154335022e-05, -6.428919732570648e-05, -6.1009079217910767e-05, -5.772896111011505e-05, -5.4448843002319336e-05, -5.116872489452362e-05, -4.7888606786727905e-05, -4.460848867893219e-05, -4.1328370571136475e-05, -3.804825246334076e-05, -3.4768134355545044e-05, -3.148801624774933e-05, -2.8207898139953613e-05, -2.4927780032157898e-05, -2.1647661924362183e-05, -1.8367543816566467e-05, -1.5087425708770752e-05, -1.1807307600975037e-05, -8.527189493179321e-06, -5.247071385383606e-06, -1.9669532775878906e-06, 1.3131648302078247e-06, 4.59328293800354e-06, 7.873401045799255e-06, 1.115351915359497e-05, 1.4433637261390686e-05, 1.77137553691864e-05, 2.0993873476982117e-05, 2.4273991584777832e-05, 2.7554109692573547e-05, 3.083422780036926e-05, 3.411434590816498e-05, 3.739446401596069e-05, 4.067458212375641e-05, 4.3954700231552124e-05, 4.723481833934784e-05, 5.0514936447143555e-05, 5.379505455493927e-05, 5.7075172662734985e-05, 6.03552907705307e-05, 6.363540887832642e-05, 6.691552698612213e-05, 7.019564509391785e-05, 7.347576320171356e-05, 7.675588130950928e-05, 8.003599941730499e-05, 8.331611752510071e-05, 8.659623563289642e-05, 8.987635374069214e-05, 9.315647184848785e-05, 9.643658995628357e-05, 9.971670806407928e-05, 0.000102996826171875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 7.0, 9.0, 19.0, 95.0, 365.0, 8637.0, 1037654.0, 1500.0, 188.0, 57.0, 16.0, 8.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.142578125, -2.05438232421875, -1.9661865234375, -1.87799072265625, -1.789794921875, -1.70159912109375, -1.6134033203125, -1.52520751953125, -1.43701171875, -1.34881591796875, -1.2606201171875, -1.17242431640625, -1.084228515625, -0.99603271484375, -0.9078369140625, -0.81964111328125, -0.7314453125, -0.64324951171875, -0.5550537109375, -0.46685791015625, -0.378662109375, -0.29046630859375, -0.2022705078125, -0.11407470703125, -0.02587890625, 0.06231689453125, 0.1505126953125, 0.23870849609375, 0.326904296875, 0.41510009765625, 0.5032958984375, 0.59149169921875, 0.6796875, 0.76788330078125, 0.8560791015625, 0.94427490234375, 1.032470703125, 1.12066650390625, 1.2088623046875, 1.29705810546875, 1.38525390625, 1.47344970703125, 1.5616455078125, 1.64984130859375, 1.738037109375, 1.82623291015625, 1.9144287109375, 2.00262451171875, 2.0908203125, 2.17901611328125, 2.2672119140625, 2.35540771484375, 2.443603515625, 2.53179931640625, 2.6199951171875, 2.70819091796875, 2.79638671875, 2.88458251953125, 2.9727783203125, 3.06097412109375, 3.149169921875, 3.23736572265625, 3.3255615234375, 3.41375732421875, 3.501953125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 6.0, 14.0, 55.0, 432.0, 407.0, 54.0, 20.0, 5.0, 7.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.134765625, -1.071685791015625, -1.00860595703125, -0.945526123046875, -0.8824462890625, -0.819366455078125, -0.75628662109375, -0.693206787109375, -0.630126953125, -0.567047119140625, -0.50396728515625, -0.440887451171875, -0.3778076171875, -0.314727783203125, -0.25164794921875, -0.188568115234375, -0.12548828125, -0.062408447265625, 0.00067138671875, 0.063751220703125, 0.1268310546875, 0.189910888671875, 0.25299072265625, 0.316070556640625, 0.379150390625, 0.442230224609375, 0.50531005859375, 0.568389892578125, 0.6314697265625, 0.694549560546875, 0.75762939453125, 0.820709228515625, 0.8837890625, 0.946868896484375, 1.00994873046875, 1.073028564453125, 1.1361083984375, 1.199188232421875, 1.26226806640625, 1.325347900390625, 1.388427734375, 1.451507568359375, 1.51458740234375, 1.577667236328125, 1.6407470703125, 1.703826904296875, 1.76690673828125, 1.829986572265625, 1.89306640625, 1.956146240234375, 2.01922607421875, 2.082305908203125, 2.1453857421875, 2.208465576171875, 2.27154541015625, 2.334625244140625, 2.397705078125, 2.460784912109375, 2.52386474609375, 2.586944580078125, 2.6500244140625, 2.713104248046875, 2.77618408203125, 2.839263916015625, 2.90234375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 5.0, 20.0, 52.0, 345.0, 510.0, 44.0, 12.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.40204620361328, -37.2132682800293, -36.02449035644531, -34.83570861816406, -33.64693069458008, -32.458152770996094, -31.26937484741211, -30.080595016479492, -28.891815185546875, -27.70303726196289, -26.514257431030273, -25.32547950744629, -24.136699676513672, -22.947921752929688, -21.759143829345703, -20.570363998413086, -19.3815860748291, -18.192808151245117, -17.0040283203125, -15.815250396728516, -14.626470565795898, -13.437692642211914, -12.248913764953613, -11.060134887695312, -9.871356010437012, -8.682577133178711, -7.49379825592041, -6.305019855499268, -5.116240978240967, -3.927462100982666, -2.7386837005615234, -1.5499048233032227, -0.3611259460449219, 0.8276528120040894, 2.0164315700531006, 3.2052102088928223, 4.393989086151123, 5.582767963409424, 6.771546363830566, 7.960325241088867, 9.149104118347168, 10.337882995605469, 11.52666187286377, 12.71544075012207, 13.904218673706055, 15.092998504638672, 16.281776428222656, 17.47055435180664, 18.659334182739258, 19.848112106323242, 21.03689193725586, 22.225669860839844, 23.41444969177246, 24.603227615356445, 25.792007446289062, 26.980785369873047, 28.16956329345703, 29.358341217041016, 30.547121047973633, 31.735898971557617, 32.924678802490234, 34.11345672607422, 35.3022346496582, 36.49101257324219, 37.67979431152344]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 6.0, 3.0, 6.0, 5.0, 10.0, 14.0, 18.0, 23.0, 27.0, 45.0, 29.0, 32.0, 46.0, 57.0, 63.0, 75.0, 60.0, 58.0, 63.0, 71.0, 45.0, 45.0, 50.0, 25.0, 23.0, 25.0, 14.0, 17.0, 9.0, 6.0, 9.0, 5.0, 11.0, 4.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0], "bins": [-16.041461944580078, -15.645145416259766, -15.248828887939453, -14.852511405944824, -14.456194877624512, -14.0598783493042, -13.66356086730957, -13.267244338989258, -12.870927810668945, -12.474611282348633, -12.07829475402832, -11.681977272033691, -11.285660743713379, -10.889344215393066, -10.493026733398438, -10.096710205078125, -9.700393676757812, -9.3040771484375, -8.907760620117188, -8.511443138122559, -8.115126609802246, -7.718810081481934, -7.322493076324463, -6.926176071166992, -6.52985954284668, -6.133543014526367, -5.7372260093688965, -5.340909004211426, -4.944592475891113, -4.548275947570801, -4.15195894241333, -3.7556421756744385, -3.359325408935547, -2.9630086421966553, -2.5666918754577637, -2.170375108718872, -1.7740583419799805, -1.3777415752410889, -0.9814248085021973, -0.5851080417633057, -0.18879127502441406, 0.20752549171447754, 0.6038422584533691, 1.0001590251922607, 1.3964757919311523, 1.792792558670044, 2.1891093254089355, 2.585426092147827, 2.9817428588867188, 3.3780596256256104, 3.774376392364502, 4.170693397521973, 4.567009925842285, 4.963326454162598, 5.359643459320068, 5.755960464477539, 6.152276992797852, 6.548593521118164, 6.944910526275635, 7.3412275314331055, 7.737544059753418, 8.13386058807373, 8.53017807006836, 8.926494598388672, 9.322811126708984]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 1.0, 2.0, 5.0, 3.0, 5.0, 6.0, 8.0, 15.0, 15.0, 23.0, 32.0, 49.0, 84.0, 113.0, 157.0, 258.0, 356.0, 660.0, 1124.0, 1924.0, 3987.0, 8995.0, 26012.0, 142763.0, 3075730.0, 846898.0, 56645.0, 15315.0, 6033.0, 2909.0, 1611.0, 891.0, 573.0, 347.0, 219.0, 163.0, 98.0, 64.0, 54.0, 48.0, 28.0, 14.0, 18.0, 6.0, 8.0, 4.0, 7.0, 4.0, 1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.357421875, -0.3468437194824219, -0.33626556396484375, -0.3256874084472656, -0.3151092529296875, -0.3045310974121094, -0.29395294189453125, -0.2833747863769531, -0.272796630859375, -0.2622184753417969, -0.25164031982421875, -0.24106216430664062, -0.2304840087890625, -0.21990585327148438, -0.20932769775390625, -0.19874954223632812, -0.18817138671875, -0.17759323120117188, -0.16701507568359375, -0.15643692016601562, -0.1458587646484375, -0.13528060913085938, -0.12470245361328125, -0.11412429809570312, -0.103546142578125, -0.09296798706054688, -0.08238983154296875, -0.07181167602539062, -0.0612335205078125, -0.050655364990234375, -0.04007720947265625, -0.029499053955078125, -0.0189208984375, -0.008342742919921875, 0.00223541259765625, 0.012813568115234375, 0.0233917236328125, 0.033969879150390625, 0.04454803466796875, 0.055126190185546875, 0.065704345703125, 0.07628250122070312, 0.08686065673828125, 0.09743881225585938, 0.1080169677734375, 0.11859512329101562, 0.12917327880859375, 0.13975143432617188, 0.15032958984375, 0.16090774536132812, 0.17148590087890625, 0.18206405639648438, 0.1926422119140625, 0.20322036743164062, 0.21379852294921875, 0.22437667846679688, 0.234954833984375, 0.24553298950195312, 0.25611114501953125, 0.2666893005371094, 0.2772674560546875, 0.2878456115722656, 0.29842376708984375, 0.3090019226074219, 0.319580078125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 0.0, 5.0, 6.0, 3.0, 13.0, 19.0, 19.0, 27.0, 27.0, 49.0, 56.0, 68.0, 70.0, 88.0, 74.0, 88.0, 79.0, 68.0, 65.0, 36.0, 23.0, 36.0, 29.0, 14.0, 8.0, 5.0, 7.0, 5.0, 3.0, 8.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.395751953125, -0.3832664489746094, -0.37078094482421875, -0.3582954406738281, -0.3458099365234375, -0.3333244323730469, -0.32083892822265625, -0.3083534240722656, -0.295867919921875, -0.2833824157714844, -0.27089691162109375, -0.2584114074707031, -0.2459259033203125, -0.23344039916992188, -0.22095489501953125, -0.20846939086914062, -0.19598388671875, -0.18349838256835938, -0.17101287841796875, -0.15852737426757812, -0.1460418701171875, -0.13355636596679688, -0.12107086181640625, -0.10858535766601562, -0.096099853515625, -0.08361434936523438, -0.07112884521484375, -0.058643341064453125, -0.0461578369140625, -0.033672332763671875, -0.02118682861328125, -0.008701324462890625, 0.0037841796875, 0.016269683837890625, 0.02875518798828125, 0.041240692138671875, 0.0537261962890625, 0.06621170043945312, 0.07869720458984375, 0.09118270874023438, 0.103668212890625, 0.11615371704101562, 0.12863922119140625, 0.14112472534179688, 0.1536102294921875, 0.16609573364257812, 0.17858123779296875, 0.19106674194335938, 0.20355224609375, 0.21603775024414062, 0.22852325439453125, 0.24100875854492188, 0.2534942626953125, 0.2659797668457031, 0.27846527099609375, 0.2909507751464844, 0.303436279296875, 0.3159217834472656, 0.32840728759765625, 0.3408927917480469, 0.3533782958984375, 0.3658638000488281, 0.37834930419921875, 0.3908348083496094, 0.4033203125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 6.0, 8.0, 3.0, 3.0, 11.0, 15.0, 36.0, 50.0, 61.0, 114.0, 199.0, 493.0, 1254.0, 4833.0, 23698.0, 950106.0, 3172635.0, 31834.0, 6083.0, 1570.0, 594.0, 281.0, 136.0, 91.0, 60.0, 42.0, 25.0, 16.0, 5.0, 7.0, 3.0, 4.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.79150390625, -0.7651748657226562, -0.7388458251953125, -0.7125167846679688, -0.686187744140625, -0.6598587036132812, -0.6335296630859375, -0.6072006225585938, -0.58087158203125, -0.5545425415039062, -0.5282135009765625, -0.5018844604492188, -0.475555419921875, -0.44922637939453125, -0.4228973388671875, -0.39656829833984375, -0.3702392578125, -0.34391021728515625, -0.3175811767578125, -0.29125213623046875, -0.264923095703125, -0.23859405517578125, -0.2122650146484375, -0.18593597412109375, -0.15960693359375, -0.13327789306640625, -0.1069488525390625, -0.08061981201171875, -0.054290771484375, -0.02796173095703125, -0.0016326904296875, 0.02469635009765625, 0.051025390625, 0.07735443115234375, 0.1036834716796875, 0.13001251220703125, 0.156341552734375, 0.18267059326171875, 0.2089996337890625, 0.23532867431640625, 0.26165771484375, 0.28798675537109375, 0.3143157958984375, 0.34064483642578125, 0.366973876953125, 0.39330291748046875, 0.4196319580078125, 0.44596099853515625, 0.4722900390625, 0.49861907958984375, 0.5249481201171875, 0.5512771606445312, 0.577606201171875, 0.6039352416992188, 0.6302642822265625, 0.6565933227539062, 0.68292236328125, 0.7092514038085938, 0.7355804443359375, 0.7619094848632812, 0.788238525390625, 0.8145675659179688, 0.8408966064453125, 0.8672256469726562, 0.8935546875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 3.0, 5.0, 3.0, 11.0, 6.0, 18.0, 37.0, 80.0, 347.0, 2406.0, 825.0, 159.0, 58.0, 31.0, 29.0, 10.0, 20.0, 7.0, 10.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8447265625, -0.8074188232421875, -0.770111083984375, -0.7328033447265625, -0.69549560546875, -0.6581878662109375, -0.620880126953125, -0.5835723876953125, -0.5462646484375, -0.5089569091796875, -0.471649169921875, -0.4343414306640625, -0.39703369140625, -0.3597259521484375, -0.322418212890625, -0.2851104736328125, -0.247802734375, -0.2104949951171875, -0.173187255859375, -0.1358795166015625, -0.09857177734375, -0.0612640380859375, -0.023956298828125, 0.0133514404296875, 0.0506591796875, 0.0879669189453125, 0.125274658203125, 0.1625823974609375, 0.19989013671875, 0.2371978759765625, 0.274505615234375, 0.3118133544921875, 0.34912109375, 0.3864288330078125, 0.423736572265625, 0.4610443115234375, 0.49835205078125, 0.5356597900390625, 0.572967529296875, 0.6102752685546875, 0.6475830078125, 0.6848907470703125, 0.722198486328125, 0.7595062255859375, 0.79681396484375, 0.8341217041015625, 0.871429443359375, 0.9087371826171875, 0.946044921875, 0.9833526611328125, 1.020660400390625, 1.0579681396484375, 1.09527587890625, 1.1325836181640625, 1.169891357421875, 1.2071990966796875, 1.2445068359375, 1.2818145751953125, 1.319122314453125, 1.3564300537109375, 1.39373779296875, 1.4310455322265625, 1.468353271484375, 1.5056610107421875, 1.54296875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 10.0, 34.0, 180.0, 446.0, 201.0, 46.0, 28.0, 12.0, 6.0, 6.0, 5.0, 6.0, 3.0, 4.0, 1.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.4840898513793945, -7.1733880043029785, -6.8626861572265625, -6.5519843101501465, -6.2412824630737305, -5.930580139160156, -5.61987829208374, -5.309176445007324, -4.998474597930908, -4.687772750854492, -4.377070903778076, -4.06636905670166, -3.755666971206665, -3.444965124130249, -3.134263038635254, -2.823561191558838, -2.512859344482422, -2.202157497406006, -1.8914555311203003, -1.5807535648345947, -1.2700517177581787, -0.9593498706817627, -0.6486479043960571, -0.33794593811035156, -0.027244091033935547, 0.28345781564712524, 0.594159722328186, 0.9048616290092468, 1.2155635356903076, 1.5262653827667236, 1.8369673490524292, 2.1476693153381348, 2.458372116088867, 2.769073963165283, 3.079775810241699, 3.3904778957366943, 3.7011797428131104, 4.0118818283081055, 4.3225836753845215, 4.6332855224609375, 4.9439873695373535, 5.2546892166137695, 5.5653910636901855, 5.876092910766602, 6.186795234680176, 6.497496604919434, 6.808198928833008, 7.118900775909424, 7.42960262298584, 7.740304470062256, 8.051006317138672, 8.361708641052246, 8.672410011291504, 8.983112335205078, 9.293813705444336, 9.60451602935791, 9.915218353271484, 10.225920677185059, 10.536622047424316, 10.84732437133789, 11.158025741577148, 11.468728065490723, 11.77942943572998, 12.090131759643555, 12.400833129882812]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 8.0, 7.0, 15.0, 15.0, 16.0, 27.0, 30.0, 40.0, 58.0, 44.0, 46.0, 77.0, 66.0, 64.0, 60.0, 56.0, 64.0, 41.0, 59.0, 50.0, 30.0, 15.0, 20.0, 21.0, 17.0, 20.0, 8.0, 7.0, 8.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.888029098510742, -4.734557151794434, -4.581085205078125, -4.427613258361816, -4.274141311645508, -4.120669364929199, -3.9671971797943115, -3.813724994659424, -3.6602530479431152, -3.5067811012268066, -3.353309154510498, -3.1998372077941895, -3.0463650226593018, -2.892893075942993, -2.7394211292266846, -2.585948944091797, -2.4324772357940674, -2.279005289077759, -2.12553334236145, -1.972061276435852, -1.818589210510254, -1.6651172637939453, -1.5116453170776367, -1.3581732511520386, -1.20470130443573, -1.0512293577194214, -0.8977572917938232, -0.7442853450775146, -0.5908133387565613, -0.4373413324356079, -0.2838693857192993, -0.13039731979370117, 0.023074626922607422, 0.1765466183423996, 0.3300186097621918, 0.48349058628082275, 0.6369625926017761, 0.7904345989227295, 0.9439065456390381, 1.0973786115646362, 1.2508505582809448, 1.4043225049972534, 1.5577945709228516, 1.7112665176391602, 1.8647384643554688, 2.0182104110717773, 2.171682357788086, 2.3251545429229736, 2.4786264896392822, 2.632098436355591, 2.7855703830718994, 2.939042568206787, 3.0925145149230957, 3.2459864616394043, 3.399458408355713, 3.5529303550720215, 3.70640230178833, 3.8598742485046387, 4.013346195220947, 4.166818141937256, 4.3202900886535645, 4.473762512207031, 4.62723445892334, 4.780706405639648, 4.934178352355957]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 8.0, 10.0, 14.0, 16.0, 25.0, 37.0, 34.0, 73.0, 87.0, 125.0, 202.0, 318.0, 474.0, 761.0, 1152.0, 1863.0, 3066.0, 5579.0, 10167.0, 20131.0, 43628.0, 105611.0, 262116.0, 329765.0, 147640.0, 59636.0, 26444.0, 12748.0, 6881.0, 3821.0, 2283.0, 1349.0, 839.0, 585.0, 328.0, 232.0, 153.0, 102.0, 70.0, 57.0, 38.0, 14.0, 17.0, 18.0, 11.0, 11.0, 6.0, 5.0, 5.0, 2.0, 1.0, 3.0, 3.0], "bins": [-0.2333984375, -0.22657012939453125, -0.2197418212890625, -0.21291351318359375, -0.206085205078125, -0.19925689697265625, -0.1924285888671875, -0.18560028076171875, -0.17877197265625, -0.17194366455078125, -0.1651153564453125, -0.15828704833984375, -0.151458740234375, -0.14463043212890625, -0.1378021240234375, -0.13097381591796875, -0.1241455078125, -0.11731719970703125, -0.1104888916015625, -0.10366058349609375, -0.096832275390625, -0.09000396728515625, -0.0831756591796875, -0.07634735107421875, -0.06951904296875, -0.06269073486328125, -0.0558624267578125, -0.04903411865234375, -0.042205810546875, -0.03537750244140625, -0.0285491943359375, -0.02172088623046875, -0.014892578125, -0.00806427001953125, -0.0012359619140625, 0.00559234619140625, 0.012420654296875, 0.01924896240234375, 0.0260772705078125, 0.03290557861328125, 0.03973388671875, 0.04656219482421875, 0.0533905029296875, 0.06021881103515625, 0.067047119140625, 0.07387542724609375, 0.0807037353515625, 0.08753204345703125, 0.0943603515625, 0.10118865966796875, 0.1080169677734375, 0.11484527587890625, 0.121673583984375, 0.12850189208984375, 0.1353302001953125, 0.14215850830078125, 0.14898681640625, 0.15581512451171875, 0.1626434326171875, 0.16947174072265625, 0.176300048828125, 0.18312835693359375, 0.1899566650390625, 0.19678497314453125, 0.20361328125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 8.0, 6.0, 10.0, 12.0, 14.0, 18.0, 17.0, 20.0, 30.0, 34.0, 32.0, 44.0, 58.0, 61.0, 64.0, 58.0, 55.0, 66.0, 60.0, 41.0, 56.0, 41.0, 36.0, 35.0, 26.0, 14.0, 14.0, 13.0, 8.0, 9.0, 8.0, 4.0, 9.0, 8.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2880859375, -0.278839111328125, -0.26959228515625, -0.260345458984375, -0.2510986328125, -0.241851806640625, -0.23260498046875, -0.223358154296875, -0.214111328125, -0.204864501953125, -0.19561767578125, -0.186370849609375, -0.1771240234375, -0.167877197265625, -0.15863037109375, -0.149383544921875, -0.14013671875, -0.130889892578125, -0.12164306640625, -0.112396240234375, -0.1031494140625, -0.093902587890625, -0.08465576171875, -0.075408935546875, -0.066162109375, -0.056915283203125, -0.04766845703125, -0.038421630859375, -0.0291748046875, -0.019927978515625, -0.01068115234375, -0.001434326171875, 0.0078125, 0.017059326171875, 0.02630615234375, 0.035552978515625, 0.0447998046875, 0.054046630859375, 0.06329345703125, 0.072540283203125, 0.081787109375, 0.091033935546875, 0.10028076171875, 0.109527587890625, 0.1187744140625, 0.128021240234375, 0.13726806640625, 0.146514892578125, 0.15576171875, 0.165008544921875, 0.17425537109375, 0.183502197265625, 0.1927490234375, 0.201995849609375, 0.21124267578125, 0.220489501953125, 0.229736328125, 0.238983154296875, 0.24822998046875, 0.257476806640625, 0.2667236328125, 0.275970458984375, 0.28521728515625, 0.294464111328125, 0.3037109375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 4.0, 6.0, 5.0, 9.0, 16.0, 25.0, 30.0, 42.0, 65.0, 110.0, 143.0, 267.0, 452.0, 826.0, 2134.0, 10171.0, 252106.0, 757745.0, 19040.0, 3056.0, 987.0, 515.0, 277.0, 160.0, 105.0, 90.0, 58.0, 45.0, 14.0, 16.0, 13.0, 6.0, 8.0, 6.0, 5.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9794921875, -0.946990966796875, -0.91448974609375, -0.881988525390625, -0.8494873046875, -0.816986083984375, -0.78448486328125, -0.751983642578125, -0.719482421875, -0.686981201171875, -0.65447998046875, -0.621978759765625, -0.5894775390625, -0.556976318359375, -0.52447509765625, -0.491973876953125, -0.45947265625, -0.426971435546875, -0.39447021484375, -0.361968994140625, -0.3294677734375, -0.296966552734375, -0.26446533203125, -0.231964111328125, -0.199462890625, -0.166961669921875, -0.13446044921875, -0.101959228515625, -0.0694580078125, -0.036956787109375, -0.00445556640625, 0.028045654296875, 0.060546875, 0.093048095703125, 0.12554931640625, 0.158050537109375, 0.1905517578125, 0.223052978515625, 0.25555419921875, 0.288055419921875, 0.320556640625, 0.353057861328125, 0.38555908203125, 0.418060302734375, 0.4505615234375, 0.483062744140625, 0.51556396484375, 0.548065185546875, 0.58056640625, 0.613067626953125, 0.64556884765625, 0.678070068359375, 0.7105712890625, 0.743072509765625, 0.77557373046875, 0.808074951171875, 0.840576171875, 0.873077392578125, 0.90557861328125, 0.938079833984375, 0.9705810546875, 1.003082275390625, 1.03558349609375, 1.068084716796875, 1.1005859375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 8.0, 8.0, 7.0, 11.0, 10.0, 17.0, 16.0, 24.0, 42.0, 46.0, 47.0, 69.0, 64.0, 80.0, 69.0, 74.0, 88.0, 55.0, 45.0, 53.0, 49.0, 36.0, 11.0, 30.0, 14.0, 11.0, 6.0, 6.0, 7.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.052734375, -1.9956512451171875, -1.938568115234375, -1.8814849853515625, -1.82440185546875, -1.7673187255859375, -1.710235595703125, -1.6531524658203125, -1.5960693359375, -1.5389862060546875, -1.481903076171875, -1.4248199462890625, -1.36773681640625, -1.3106536865234375, -1.253570556640625, -1.1964874267578125, -1.139404296875, -1.0823211669921875, -1.025238037109375, -0.9681549072265625, -0.91107177734375, -0.8539886474609375, -0.796905517578125, -0.7398223876953125, -0.6827392578125, -0.6256561279296875, -0.568572998046875, -0.5114898681640625, -0.45440673828125, -0.3973236083984375, -0.340240478515625, -0.2831573486328125, -0.22607421875, -0.1689910888671875, -0.111907958984375, -0.0548248291015625, 0.00225830078125, 0.0593414306640625, 0.116424560546875, 0.1735076904296875, 0.2305908203125, 0.2876739501953125, 0.344757080078125, 0.4018402099609375, 0.45892333984375, 0.5160064697265625, 0.573089599609375, 0.6301727294921875, 0.687255859375, 0.7443389892578125, 0.801422119140625, 0.8585052490234375, 0.91558837890625, 0.9726715087890625, 1.029754638671875, 1.0868377685546875, 1.1439208984375, 1.2010040283203125, 1.258087158203125, 1.3151702880859375, 1.37225341796875, 1.4293365478515625, 1.486419677734375, 1.5435028076171875, 1.6005859375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 1.0, 3.0, 3.0, 9.0, 11.0, 10.0, 24.0, 42.0, 74.0, 99.0, 187.0, 422.0, 1192.0, 5295.0, 80168.0, 926413.0, 29718.0, 3313.0, 856.0, 324.0, 148.0, 100.0, 46.0, 30.0, 25.0, 11.0, 10.0, 2.0, 6.0, 1.0, 3.0, 5.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.447509765625, -0.4355316162109375, -0.423553466796875, -0.4115753173828125, -0.39959716796875, -0.3876190185546875, -0.375640869140625, -0.3636627197265625, -0.3516845703125, -0.3397064208984375, -0.327728271484375, -0.3157501220703125, -0.30377197265625, -0.2917938232421875, -0.279815673828125, -0.2678375244140625, -0.255859375, -0.2438812255859375, -0.231903076171875, -0.2199249267578125, -0.20794677734375, -0.1959686279296875, -0.183990478515625, -0.1720123291015625, -0.1600341796875, -0.1480560302734375, -0.136077880859375, -0.1240997314453125, -0.11212158203125, -0.1001434326171875, -0.088165283203125, -0.0761871337890625, -0.064208984375, -0.0522308349609375, -0.040252685546875, -0.0282745361328125, -0.01629638671875, -0.0043182373046875, 0.007659912109375, 0.0196380615234375, 0.0316162109375, 0.0435943603515625, 0.055572509765625, 0.0675506591796875, 0.07952880859375, 0.0915069580078125, 0.103485107421875, 0.1154632568359375, 0.12744140625, 0.1394195556640625, 0.151397705078125, 0.1633758544921875, 0.17535400390625, 0.1873321533203125, 0.199310302734375, 0.2112884521484375, 0.2232666015625, 0.2352447509765625, 0.247222900390625, 0.2592010498046875, 0.27117919921875, 0.2831573486328125, 0.295135498046875, 0.3071136474609375, 0.319091796875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 5.0, 4.0, 0.0, 2.0, 4.0, 8.0, 7.0, 7.0, 8.0, 16.0, 27.0, 19.0, 36.0, 66.0, 108.0, 188.0, 176.0, 114.0, 63.0, 38.0, 25.0, 16.0, 15.0, 17.0, 8.0, 5.0, 2.0, 3.0, 1.0, 4.0, 5.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0001633167266845703, -0.00015837885439395905, -0.00015344098210334778, -0.0001485031098127365, -0.00014356523752212524, -0.00013862736523151398, -0.0001336894929409027, -0.00012875162065029144, -0.00012381374835968018, -0.00011887587606906891, -0.00011393800377845764, -0.00010900013148784637, -0.00010406225919723511, -9.912438690662384e-05, -9.418651461601257e-05, -8.92486423254013e-05, -8.431077003479004e-05, -7.937289774417877e-05, -7.44350254535675e-05, -6.949715316295624e-05, -6.455928087234497e-05, -5.9621408581733704e-05, -5.4683536291122437e-05, -4.974566400051117e-05, -4.48077917098999e-05, -3.9869919419288635e-05, -3.493204712867737e-05, -2.99941748380661e-05, -2.5056302547454834e-05, -2.0118430256843567e-05, -1.51805579662323e-05, -1.0242685675621033e-05, -5.304813385009766e-06, -3.6694109439849854e-07, 4.5709311962127686e-06, 9.508803486824036e-06, 1.4446675777435303e-05, 1.938454806804657e-05, 2.4322420358657837e-05, 2.9260292649269104e-05, 3.419816493988037e-05, 3.913603723049164e-05, 4.4073909521102905e-05, 4.901178181171417e-05, 5.394965410232544e-05, 5.8887526392936707e-05, 6.382539868354797e-05, 6.876327097415924e-05, 7.370114326477051e-05, 7.863901555538177e-05, 8.357688784599304e-05, 8.851476013660431e-05, 9.345263242721558e-05, 9.839050471782684e-05, 0.00010332837700843811, 0.00010826624929904938, 0.00011320412158966064, 0.00011814199388027191, 0.00012307986617088318, 0.00012801773846149445, 0.0001329556107521057, 0.00013789348304271698, 0.00014283135533332825, 0.00014776922762393951, 0.00015270709991455078]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 4.0, 5.0, 1.0, 11.0, 10.0, 15.0, 20.0, 33.0, 44.0, 82.0, 128.0, 263.0, 536.0, 1458.0, 6179.0, 72894.0, 906975.0, 52205.0, 5315.0, 1313.0, 486.0, 232.0, 142.0, 90.0, 52.0, 14.0, 23.0, 9.0, 9.0, 5.0, 1.0, 0.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2283935546875, -0.2172260284423828, -0.20605850219726562, -0.19489097595214844, -0.18372344970703125, -0.17255592346191406, -0.16138839721679688, -0.1502208709716797, -0.1390533447265625, -0.1278858184814453, -0.11671829223632812, -0.10555076599121094, -0.09438323974609375, -0.08321571350097656, -0.07204818725585938, -0.06088066101074219, -0.049713134765625, -0.03854560852050781, -0.027378082275390625, -0.016210556030273438, -0.00504302978515625, 0.0061244964599609375, 0.017292022705078125, 0.028459548950195312, 0.0396270751953125, 0.05079460144042969, 0.061962127685546875, 0.07312965393066406, 0.08429718017578125, 0.09546470642089844, 0.10663223266601562, 0.11779975891113281, 0.12896728515625, 0.1401348114013672, 0.15130233764648438, 0.16246986389160156, 0.17363739013671875, 0.18480491638183594, 0.19597244262695312, 0.2071399688720703, 0.2183074951171875, 0.2294750213623047, 0.24064254760742188, 0.25181007385253906, 0.26297760009765625, 0.27414512634277344, 0.2853126525878906, 0.2964801788330078, 0.307647705078125, 0.3188152313232422, 0.3299827575683594, 0.34115028381347656, 0.35231781005859375, 0.36348533630371094, 0.3746528625488281, 0.3858203887939453, 0.3969879150390625, 0.4081554412841797, 0.4193229675292969, 0.43049049377441406, 0.44165802001953125, 0.45282554626464844, 0.4639930725097656, 0.4751605987548828, 0.486328125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 10.0, 5.0, 11.0, 8.0, 10.0, 20.0, 23.0, 15.0, 34.0, 51.0, 39.0, 54.0, 68.0, 54.0, 78.0, 64.0, 74.0, 71.0, 54.0, 49.0, 56.0, 32.0, 25.0, 22.0, 9.0, 15.0, 10.0, 8.0, 2.0, 12.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 4.0], "bins": [-0.302734375, -0.29532814025878906, -0.2879219055175781, -0.2805156707763672, -0.27310943603515625, -0.2657032012939453, -0.2582969665527344, -0.25089073181152344, -0.2434844970703125, -0.23607826232910156, -0.22867202758789062, -0.2212657928466797, -0.21385955810546875, -0.2064533233642578, -0.19904708862304688, -0.19164085388183594, -0.184234619140625, -0.17682838439941406, -0.16942214965820312, -0.1620159149169922, -0.15460968017578125, -0.1472034454345703, -0.13979721069335938, -0.13239097595214844, -0.1249847412109375, -0.11757850646972656, -0.11017227172851562, -0.10276603698730469, -0.09535980224609375, -0.08795356750488281, -0.08054733276367188, -0.07314109802246094, -0.06573486328125, -0.05832862854003906, -0.050922393798828125, -0.04351615905761719, -0.03610992431640625, -0.028703689575195312, -0.021297454833984375, -0.013891220092773438, -0.0064849853515625, 0.0009212493896484375, 0.008327484130859375, 0.015733718872070312, 0.02313995361328125, 0.030546188354492188, 0.037952423095703125, 0.04535865783691406, 0.052764892578125, 0.06017112731933594, 0.06757736206054688, 0.07498359680175781, 0.08238983154296875, 0.08979606628417969, 0.09720230102539062, 0.10460853576660156, 0.1120147705078125, 0.11942100524902344, 0.12682723999023438, 0.1342334747314453, 0.14163970947265625, 0.1490459442138672, 0.15645217895507812, 0.16385841369628906, 0.1712646484375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 14.0, 76.0, 560.0, 283.0, 43.0, 19.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.1772518157959, -18.717815399169922, -18.258378982543945, -17.79894256591797, -17.33950424194336, -16.880067825317383, -16.420631408691406, -15.96119499206543, -15.501758575439453, -15.042322158813477, -14.5828857421875, -14.123448371887207, -13.66401195526123, -13.204575538635254, -12.745138168334961, -12.285701751708984, -11.826265335083008, -11.366828918457031, -10.907392501831055, -10.447955131530762, -9.988518714904785, -9.529082298278809, -9.069644927978516, -8.610208511352539, -8.150772094726562, -7.691335678100586, -7.231898784637451, -6.772461891174316, -6.31302547454834, -5.853589057922363, -5.3941521644592285, -4.934715270996094, -4.475277900695801, -4.015841484069824, -3.5564045906066895, -3.096967935562134, -2.637531280517578, -2.1780946254730225, -1.7186579704284668, -1.2592213153839111, -0.7997846603393555, -0.3403480052947998, 0.11908864974975586, 0.5785253047943115, 1.0379619598388672, 1.4973986148834229, 1.9568352699279785, 2.416271924972534, 2.87570858001709, 3.3351452350616455, 3.794581890106201, 4.254018783569336, 4.7134552001953125, 5.172891616821289, 5.632328510284424, 6.091765403747559, 6.551201820373535, 7.010638236999512, 7.4700751304626465, 7.929512023925781, 8.388948440551758, 8.848384857177734, 9.307821273803711, 9.767258644104004, 10.22669506072998]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 6.0, 5.0, 8.0, 8.0, 15.0, 9.0, 14.0, 21.0, 31.0, 29.0, 32.0, 52.0, 40.0, 59.0, 67.0, 78.0, 73.0, 65.0, 66.0, 58.0, 48.0, 48.0, 27.0, 29.0, 27.0, 23.0, 20.0, 8.0, 11.0, 10.0, 12.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.539610862731934, -5.338078022003174, -5.136545181274414, -4.935012340545654, -4.7334794998168945, -4.531946182250977, -4.330413341522217, -4.128880500793457, -3.9273476600646973, -3.7258148193359375, -3.5242819786071777, -3.322748899459839, -3.121216058731079, -2.9196832180023193, -2.7181501388549805, -2.5166172981262207, -2.315084457397461, -2.113551616668701, -1.9120186567306519, -1.7104856967926025, -1.5089528560638428, -1.307420015335083, -1.1058870553970337, -0.9043540954589844, -0.7028212547302246, -0.5012883543968201, -0.2997554540634155, -0.09822255373001099, 0.10331034660339355, 0.3048431873321533, 0.5063761472702026, 0.707909107208252, 0.9094424247741699, 1.1109752655029297, 1.312508225440979, 1.5140411853790283, 1.715574026107788, 1.9171068668365479, 2.1186399459838867, 2.3201727867126465, 2.5217056274414062, 2.723238468170166, 2.924771308898926, 3.1263043880462646, 3.3278372287750244, 3.529370069503784, 3.730903148651123, 3.932435989379883, 4.133968830108643, 4.335501670837402, 4.537034511566162, 4.738567352294922, 4.94010066986084, 5.141633033752441, 5.343166351318359, 5.544699192047119, 5.746232032775879, 5.947764873504639, 6.149297714233398, 6.350830554962158, 6.552363395690918, 6.753896713256836, 6.955429553985596, 7.1569623947143555, 7.358495235443115]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 4.0, 2.0, 11.0, 10.0, 11.0, 23.0, 10.0, 24.0, 41.0, 62.0, 58.0, 117.0, 292.0, 630.0, 1968.0, 7096.0, 51299.0, 3892196.0, 227285.0, 9238.0, 2112.0, 805.0, 355.0, 194.0, 113.0, 83.0, 53.0, 32.0, 33.0, 21.0, 26.0, 19.0, 12.0, 12.0, 7.0, 3.0, 10.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0], "bins": [-0.66650390625, -0.6467132568359375, -0.626922607421875, -0.6071319580078125, -0.58734130859375, -0.5675506591796875, -0.547760009765625, -0.5279693603515625, -0.5081787109375, -0.4883880615234375, -0.468597412109375, -0.4488067626953125, -0.42901611328125, -0.4092254638671875, -0.389434814453125, -0.3696441650390625, -0.349853515625, -0.3300628662109375, -0.310272216796875, -0.2904815673828125, -0.27069091796875, -0.2509002685546875, -0.231109619140625, -0.2113189697265625, -0.1915283203125, -0.1717376708984375, -0.151947021484375, -0.1321563720703125, -0.11236572265625, -0.0925750732421875, -0.072784423828125, -0.0529937744140625, -0.033203125, -0.0134124755859375, 0.006378173828125, 0.0261688232421875, 0.04595947265625, 0.0657501220703125, 0.085540771484375, 0.1053314208984375, 0.1251220703125, 0.1449127197265625, 0.164703369140625, 0.1844940185546875, 0.20428466796875, 0.2240753173828125, 0.243865966796875, 0.2636566162109375, 0.283447265625, 0.3032379150390625, 0.323028564453125, 0.3428192138671875, 0.36260986328125, 0.3824005126953125, 0.402191162109375, 0.4219818115234375, 0.4417724609375, 0.4615631103515625, 0.481353759765625, 0.5011444091796875, 0.52093505859375, 0.5407257080078125, 0.560516357421875, 0.5803070068359375, 0.60009765625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 12.0, 17.0, 23.0, 39.0, 61.0, 81.0, 117.0, 122.0, 135.0, 123.0, 101.0, 66.0, 36.0, 25.0, 16.0, 16.0, 7.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.315673828125, -0.2962226867675781, -0.27677154541015625, -0.2573204040527344, -0.2378692626953125, -0.21841812133789062, -0.19896697998046875, -0.17951583862304688, -0.160064697265625, -0.14061355590820312, -0.12116241455078125, -0.10171127319335938, -0.0822601318359375, -0.06280899047851562, -0.04335784912109375, -0.023906707763671875, -0.00445556640625, 0.014995574951171875, 0.03444671630859375, 0.053897857666015625, 0.0733489990234375, 0.09280014038085938, 0.11225128173828125, 0.13170242309570312, 0.151153564453125, 0.17060470581054688, 0.19005584716796875, 0.20950698852539062, 0.2289581298828125, 0.24840927124023438, 0.26786041259765625, 0.2873115539550781, 0.3067626953125, 0.3262138366699219, 0.34566497802734375, 0.3651161193847656, 0.3845672607421875, 0.4040184020996094, 0.42346954345703125, 0.4429206848144531, 0.462371826171875, 0.4818229675292969, 0.5012741088867188, 0.5207252502441406, 0.5401763916015625, 0.5596275329589844, 0.5790786743164062, 0.5985298156738281, 0.61798095703125, 0.6374320983886719, 0.6568832397460938, 0.6763343811035156, 0.6957855224609375, 0.7152366638183594, 0.7346878051757812, 0.7541389465332031, 0.773590087890625, 0.7930412292480469, 0.8124923706054688, 0.8319435119628906, 0.8513946533203125, 0.8708457946777344, 0.8902969360351562, 0.9097480773925781, 0.92919921875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 8.0, 9.0, 11.0, 23.0, 25.0, 21.0, 37.0, 50.0, 57.0, 148.0, 378.0, 1486.0, 6715.0, 44057.0, 3758659.0, 360516.0, 17612.0, 3059.0, 711.0, 212.0, 120.0, 69.0, 66.0, 60.0, 40.0, 39.0, 34.0, 23.0, 15.0, 12.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.8125, -0.7898025512695312, -0.7671051025390625, -0.7444076538085938, -0.721710205078125, -0.6990127563476562, -0.6763153076171875, -0.6536178588867188, -0.63092041015625, -0.6082229614257812, -0.5855255126953125, -0.5628280639648438, -0.540130615234375, -0.5174331665039062, -0.4947357177734375, -0.47203826904296875, -0.4493408203125, -0.42664337158203125, -0.4039459228515625, -0.38124847412109375, -0.358551025390625, -0.33585357666015625, -0.3131561279296875, -0.29045867919921875, -0.26776123046875, -0.24506378173828125, -0.2223663330078125, -0.19966888427734375, -0.176971435546875, -0.15427398681640625, -0.1315765380859375, -0.10887908935546875, -0.086181640625, -0.06348419189453125, -0.0407867431640625, -0.01808929443359375, 0.004608154296875, 0.02730560302734375, 0.0500030517578125, 0.07270050048828125, 0.09539794921875, 0.11809539794921875, 0.1407928466796875, 0.16349029541015625, 0.186187744140625, 0.20888519287109375, 0.2315826416015625, 0.25428009033203125, 0.2769775390625, 0.29967498779296875, 0.3223724365234375, 0.34506988525390625, 0.367767333984375, 0.39046478271484375, 0.4131622314453125, 0.43585968017578125, 0.45855712890625, 0.48125457763671875, 0.5039520263671875, 0.5266494750976562, 0.549346923828125, 0.5720443725585938, 0.5947418212890625, 0.6174392700195312, 0.64013671875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 3.0, 4.0, 8.0, 7.0, 14.0, 20.0, 22.0, 42.0, 96.0, 457.0, 2268.0, 883.0, 150.0, 46.0, 29.0, 15.0, 11.0, 7.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.493896484375, -0.4601020812988281, -0.42630767822265625, -0.3925132751464844, -0.3587188720703125, -0.3249244689941406, -0.29113006591796875, -0.2573356628417969, -0.223541259765625, -0.18974685668945312, -0.15595245361328125, -0.12215805053710938, -0.0883636474609375, -0.054569244384765625, -0.02077484130859375, 0.013019561767578125, 0.04681396484375, 0.08060836791992188, 0.11440277099609375, 0.14819717407226562, 0.1819915771484375, 0.21578598022460938, 0.24958038330078125, 0.2833747863769531, 0.317169189453125, 0.3509635925292969, 0.38475799560546875, 0.4185523986816406, 0.4523468017578125, 0.4861412048339844, 0.5199356079101562, 0.5537300109863281, 0.5875244140625, 0.6213188171386719, 0.6551132202148438, 0.6889076232910156, 0.7227020263671875, 0.7564964294433594, 0.7902908325195312, 0.8240852355957031, 0.857879638671875, 0.8916740417480469, 0.9254684448242188, 0.9592628479003906, 0.9930572509765625, 1.0268516540527344, 1.0606460571289062, 1.0944404602050781, 1.12823486328125, 1.1620292663574219, 1.1958236694335938, 1.2296180725097656, 1.2634124755859375, 1.2972068786621094, 1.3310012817382812, 1.3647956848144531, 1.398590087890625, 1.4323844909667969, 1.4661788940429688, 1.4999732971191406, 1.5337677001953125, 1.5675621032714844, 1.6013565063476562, 1.6351509094238281, 1.6689453125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 2.0, 3.0, 27.0, 85.0, 331.0, 327.0, 118.0, 51.0, 21.0, 4.0, 9.0, 6.0, 4.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.815892219543457, -4.636350154876709, -4.456808090209961, -4.277266025543213, -4.097723960876465, -3.918181896209717, -3.7386395931243896, -3.5590975284576416, -3.3795554637908936, -3.2000133991241455, -3.0204713344573975, -2.8409290313720703, -2.6613869667053223, -2.481844902038574, -2.302302837371826, -2.122760772705078, -1.94321870803833, -1.763676643371582, -1.584134578704834, -1.4045923948287964, -1.2250503301620483, -1.0455082654953003, -0.8659660816192627, -0.6864240169525146, -0.5068819522857666, -0.32733985781669617, -0.14779776334762573, 0.03174436092376709, 0.21128642559051514, 0.3908284902572632, 0.5703706741333008, 0.7499127388000488, 0.9294543266296387, 1.1089963912963867, 1.2885384559631348, 1.4680806398391724, 1.6476227045059204, 1.8271647691726685, 2.006706953048706, 2.186249017715454, 2.365791082382202, 2.54533314704895, 2.7248752117156982, 2.9044175148010254, 3.0839595794677734, 3.2635016441345215, 3.4430437088012695, 3.6225857734680176, 3.8021278381347656, 3.9816699028015137, 4.161211967468262, 4.34075403213501, 4.520296096801758, 4.699838161468506, 4.879380226135254, 5.05892276763916, 5.23846435546875, 5.418006420135498, 5.597548484802246, 5.777090549468994, 5.956632614135742, 6.13617467880249, 6.315716743469238, 6.4952592849731445, 6.674801349639893]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 4.0, 6.0, 4.0, 6.0, 12.0, 15.0, 22.0, 35.0, 44.0, 47.0, 56.0, 73.0, 69.0, 97.0, 80.0, 60.0, 70.0, 79.0, 45.0, 54.0, 41.0, 25.0, 24.0, 8.0, 9.0, 8.0, 7.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6425580978393555, -4.530004501342773, -4.417450904846191, -4.304897308349609, -4.192343711853027, -4.079790115356445, -3.967236280441284, -3.854682683944702, -3.74212908744812, -3.629575490951538, -3.517021894454956, -3.404468297958374, -3.291914463043213, -3.179360866546631, -3.066807270050049, -2.954253673553467, -2.8417000770568848, -2.7291464805603027, -2.6165928840637207, -2.5040392875671387, -2.3914856910705566, -2.2789320945739746, -2.1663782596588135, -2.0538246631622314, -1.9412710666656494, -1.8287174701690674, -1.7161638736724854, -1.6036101579666138, -1.4910565614700317, -1.3785029649734497, -1.2659492492675781, -1.153395652770996, -1.040842056274414, -0.928288459777832, -0.8157348036766052, -0.7031811475753784, -0.5906275510787964, -0.47807395458221436, -0.36552029848098755, -0.25296664237976074, -0.1404130458831787, -0.027859419584274292, 0.08469420671463013, 0.19724783301353455, 0.30980145931243896, 0.422355055809021, 0.5349087119102478, 0.6474623680114746, 0.7600159645080566, 0.8725695610046387, 0.9851232171058655, 1.0976768732070923, 1.2102304697036743, 1.3227840662002563, 1.435337781906128, 1.54789137840271, 1.660444974899292, 1.772998571395874, 1.885552167892456, 1.9981058835983276, 2.110659599304199, 2.2232131958007812, 2.3357667922973633, 2.4483203887939453, 2.5608739852905273]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 7.0, 5.0, 11.0, 17.0, 42.0, 36.0, 76.0, 107.0, 162.0, 304.0, 520.0, 1042.0, 2210.0, 5132.0, 14156.0, 47593.0, 202681.0, 527691.0, 181051.0, 43377.0, 13136.0, 4888.0, 2047.0, 997.0, 498.0, 313.0, 168.0, 95.0, 52.0, 45.0, 38.0, 15.0, 13.0, 12.0, 7.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.385986328125, -0.374786376953125, -0.36358642578125, -0.352386474609375, -0.3411865234375, -0.329986572265625, -0.31878662109375, -0.307586669921875, -0.29638671875, -0.285186767578125, -0.27398681640625, -0.262786865234375, -0.2515869140625, -0.240386962890625, -0.22918701171875, -0.217987060546875, -0.206787109375, -0.195587158203125, -0.18438720703125, -0.173187255859375, -0.1619873046875, -0.150787353515625, -0.13958740234375, -0.128387451171875, -0.1171875, -0.105987548828125, -0.09478759765625, -0.083587646484375, -0.0723876953125, -0.061187744140625, -0.04998779296875, -0.038787841796875, -0.027587890625, -0.016387939453125, -0.00518798828125, 0.006011962890625, 0.0172119140625, 0.028411865234375, 0.03961181640625, 0.050811767578125, 0.06201171875, 0.073211669921875, 0.08441162109375, 0.095611572265625, 0.1068115234375, 0.118011474609375, 0.12921142578125, 0.140411376953125, 0.151611328125, 0.162811279296875, 0.17401123046875, 0.185211181640625, 0.1964111328125, 0.207611083984375, 0.21881103515625, 0.230010986328125, 0.2412109375, 0.252410888671875, 0.26361083984375, 0.274810791015625, 0.2860107421875, 0.297210693359375, 0.30841064453125, 0.319610595703125, 0.330810546875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 7.0, 16.0, 10.0, 13.0, 16.0, 20.0, 39.0, 41.0, 37.0, 54.0, 50.0, 67.0, 80.0, 81.0, 73.0, 62.0, 52.0, 65.0, 42.0, 51.0, 28.0, 30.0, 14.0, 14.0, 6.0, 10.0, 10.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28662109375, -0.27581787109375, -0.2650146484375, -0.25421142578125, -0.243408203125, -0.23260498046875, -0.2218017578125, -0.21099853515625, -0.2001953125, -0.18939208984375, -0.1785888671875, -0.16778564453125, -0.156982421875, -0.14617919921875, -0.1353759765625, -0.12457275390625, -0.11376953125, -0.10296630859375, -0.0921630859375, -0.08135986328125, -0.070556640625, -0.05975341796875, -0.0489501953125, -0.03814697265625, -0.02734375, -0.01654052734375, -0.0057373046875, 0.00506591796875, 0.015869140625, 0.02667236328125, 0.0374755859375, 0.04827880859375, 0.05908203125, 0.06988525390625, 0.0806884765625, 0.09149169921875, 0.102294921875, 0.11309814453125, 0.1239013671875, 0.13470458984375, 0.1455078125, 0.15631103515625, 0.1671142578125, 0.17791748046875, 0.188720703125, 0.19952392578125, 0.2103271484375, 0.22113037109375, 0.23193359375, 0.24273681640625, 0.2535400390625, 0.26434326171875, 0.275146484375, 0.28594970703125, 0.2967529296875, 0.30755615234375, 0.318359375, 0.32916259765625, 0.3399658203125, 0.35076904296875, 0.361572265625, 0.37237548828125, 0.3831787109375, 0.39398193359375, 0.40478515625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 2.0, 5.0, 3.0, 4.0, 7.0, 12.0, 32.0, 40.0, 71.0, 171.0, 346.0, 1009.0, 4090.0, 196917.0, 836352.0, 7293.0, 1322.0, 472.0, 197.0, 92.0, 40.0, 30.0, 9.0, 13.0, 6.0, 6.0, 3.0, 6.0, 0.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.63671875, -1.5887603759765625, -1.540802001953125, -1.4928436279296875, -1.44488525390625, -1.3969268798828125, -1.348968505859375, -1.3010101318359375, -1.2530517578125, -1.2050933837890625, -1.157135009765625, -1.1091766357421875, -1.06121826171875, -1.0132598876953125, -0.965301513671875, -0.9173431396484375, -0.869384765625, -0.8214263916015625, -0.773468017578125, -0.7255096435546875, -0.67755126953125, -0.6295928955078125, -0.581634521484375, -0.5336761474609375, -0.4857177734375, -0.4377593994140625, -0.389801025390625, -0.3418426513671875, -0.29388427734375, -0.2459259033203125, -0.197967529296875, -0.1500091552734375, -0.10205078125, -0.0540924072265625, -0.006134033203125, 0.0418243408203125, 0.08978271484375, 0.1377410888671875, 0.185699462890625, 0.2336578369140625, 0.2816162109375, 0.3295745849609375, 0.377532958984375, 0.4254913330078125, 0.47344970703125, 0.5214080810546875, 0.569366455078125, 0.6173248291015625, 0.665283203125, 0.7132415771484375, 0.761199951171875, 0.8091583251953125, 0.85711669921875, 0.9050750732421875, 0.953033447265625, 1.0009918212890625, 1.0489501953125, 1.0969085693359375, 1.144866943359375, 1.1928253173828125, 1.24078369140625, 1.2887420654296875, 1.336700439453125, 1.3846588134765625, 1.4326171875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 4.0, 5.0, 18.0, 30.0, 45.0, 93.0, 122.0, 126.0, 144.0, 143.0, 101.0, 70.0, 48.0, 27.0, 18.0, 8.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.283203125, -3.1998291015625, -3.116455078125, -3.0330810546875, -2.94970703125, -2.8663330078125, -2.782958984375, -2.6995849609375, -2.6162109375, -2.5328369140625, -2.449462890625, -2.3660888671875, -2.28271484375, -2.1993408203125, -2.115966796875, -2.0325927734375, -1.94921875, -1.8658447265625, -1.782470703125, -1.6990966796875, -1.61572265625, -1.5323486328125, -1.448974609375, -1.3656005859375, -1.2822265625, -1.1988525390625, -1.115478515625, -1.0321044921875, -0.94873046875, -0.8653564453125, -0.781982421875, -0.6986083984375, -0.615234375, -0.5318603515625, -0.448486328125, -0.3651123046875, -0.28173828125, -0.1983642578125, -0.114990234375, -0.0316162109375, 0.0517578125, 0.1351318359375, 0.218505859375, 0.3018798828125, 0.38525390625, 0.4686279296875, 0.552001953125, 0.6353759765625, 0.71875, 0.8021240234375, 0.885498046875, 0.9688720703125, 1.05224609375, 1.1356201171875, 1.218994140625, 1.3023681640625, 1.3857421875, 1.4691162109375, 1.552490234375, 1.6358642578125, 1.71923828125, 1.8026123046875, 1.885986328125, 1.9693603515625, 2.052734375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 1.0, 8.0, 8.0, 7.0, 13.0, 23.0, 25.0, 39.0, 72.0, 129.0, 309.0, 1311.0, 16288.0, 989643.0, 37973.0, 1907.0, 409.0, 166.0, 82.0, 41.0, 35.0, 17.0, 9.0, 11.0, 9.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.47021484375, -0.45377349853515625, -0.4373321533203125, -0.42089080810546875, -0.404449462890625, -0.38800811767578125, -0.3715667724609375, -0.35512542724609375, -0.33868408203125, -0.32224273681640625, -0.3058013916015625, -0.28936004638671875, -0.272918701171875, -0.25647735595703125, -0.2400360107421875, -0.22359466552734375, -0.2071533203125, -0.19071197509765625, -0.1742706298828125, -0.15782928466796875, -0.141387939453125, -0.12494659423828125, -0.1085052490234375, -0.09206390380859375, -0.07562255859375, -0.05918121337890625, -0.0427398681640625, -0.02629852294921875, -0.009857177734375, 0.00658416748046875, 0.0230255126953125, 0.03946685791015625, 0.055908203125, 0.07234954833984375, 0.0887908935546875, 0.10523223876953125, 0.121673583984375, 0.13811492919921875, 0.1545562744140625, 0.17099761962890625, 0.18743896484375, 0.20388031005859375, 0.2203216552734375, 0.23676300048828125, 0.253204345703125, 0.26964569091796875, 0.2860870361328125, 0.30252838134765625, 0.3189697265625, 0.33541107177734375, 0.3518524169921875, 0.36829376220703125, 0.384735107421875, 0.40117645263671875, 0.4176177978515625, 0.43405914306640625, 0.45050048828125, 0.46694183349609375, 0.4833831787109375, 0.49982452392578125, 0.516265869140625, 0.5327072143554688, 0.5491485595703125, 0.5655899047851562, 0.58203125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 6.0, 4.0, 5.0, 3.0, 5.0, 2.0, 6.0, 7.0, 11.0, 8.0, 9.0, 20.0, 27.0, 27.0, 49.0, 98.0, 122.0, 173.0, 140.0, 99.0, 50.0, 37.0, 16.0, 15.0, 15.0, 8.0, 8.0, 9.0, 2.0, 8.0, 4.0, 2.0, 4.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.423494338989258e-05, -9.103305637836456e-05, -8.783116936683655e-05, -8.462928235530853e-05, -8.142739534378052e-05, -7.82255083322525e-05, -7.502362132072449e-05, -7.182173430919647e-05, -6.861984729766846e-05, -6.541796028614044e-05, -6.221607327461243e-05, -5.901418626308441e-05, -5.5812299251556396e-05, -5.261041224002838e-05, -4.9408525228500366e-05, -4.620663821697235e-05, -4.3004751205444336e-05, -3.980286419391632e-05, -3.6600977182388306e-05, -3.339909017086029e-05, -3.0197203159332275e-05, -2.699531614780426e-05, -2.3793429136276245e-05, -2.059154212474823e-05, -1.7389655113220215e-05, -1.41877681016922e-05, -1.0985881090164185e-05, -7.78399407863617e-06, -4.582107067108154e-06, -1.3802200555801392e-06, 1.821666955947876e-06, 5.023553967475891e-06, 8.225440979003906e-06, 1.1427327990531921e-05, 1.4629215002059937e-05, 1.783110201358795e-05, 2.1032989025115967e-05, 2.4234876036643982e-05, 2.7436763048171997e-05, 3.063865005970001e-05, 3.384053707122803e-05, 3.704242408275604e-05, 4.024431109428406e-05, 4.344619810581207e-05, 4.664808511734009e-05, 4.98499721288681e-05, 5.305185914039612e-05, 5.625374615192413e-05, 5.945563316345215e-05, 6.265752017498016e-05, 6.585940718650818e-05, 6.90612941980362e-05, 7.226318120956421e-05, 7.546506822109222e-05, 7.866695523262024e-05, 8.186884224414825e-05, 8.507072925567627e-05, 8.827261626720428e-05, 9.14745032787323e-05, 9.467639029026031e-05, 9.787827730178833e-05, 0.00010108016431331635, 0.00010428205132484436, 0.00010748393833637238, 0.00011068582534790039]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 7.0, 18.0, 19.0, 23.0, 35.0, 54.0, 84.0, 158.0, 310.0, 699.0, 1984.0, 10839.0, 240039.0, 766955.0, 22399.0, 3153.0, 899.0, 392.0, 180.0, 117.0, 73.0, 41.0, 21.0, 17.0, 12.0, 12.0, 1.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2479248046875, -0.2380695343017578, -0.22821426391601562, -0.21835899353027344, -0.20850372314453125, -0.19864845275878906, -0.18879318237304688, -0.1789379119873047, -0.1690826416015625, -0.1592273712158203, -0.14937210083007812, -0.13951683044433594, -0.12966156005859375, -0.11980628967285156, -0.10995101928710938, -0.10009574890136719, -0.090240478515625, -0.08038520812988281, -0.07052993774414062, -0.06067466735839844, -0.05081939697265625, -0.04096412658691406, -0.031108856201171875, -0.021253585815429688, -0.0113983154296875, -0.0015430450439453125, 0.008312225341796875, 0.018167495727539062, 0.02802276611328125, 0.03787803649902344, 0.047733306884765625, 0.05758857727050781, 0.06744384765625, 0.07729911804199219, 0.08715438842773438, 0.09700965881347656, 0.10686492919921875, 0.11672019958496094, 0.12657546997070312, 0.1364307403564453, 0.1462860107421875, 0.1561412811279297, 0.16599655151367188, 0.17585182189941406, 0.18570709228515625, 0.19556236267089844, 0.20541763305664062, 0.2152729034423828, 0.225128173828125, 0.2349834442138672, 0.24483871459960938, 0.25469398498535156, 0.26454925537109375, 0.27440452575683594, 0.2842597961425781, 0.2941150665283203, 0.3039703369140625, 0.3138256072998047, 0.3236808776855469, 0.33353614807128906, 0.34339141845703125, 0.35324668884277344, 0.3631019592285156, 0.3729572296142578, 0.3828125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 6.0, 5.0, 2.0, 0.0, 4.0, 7.0, 6.0, 2.0, 7.0, 8.0, 16.0, 13.0, 23.0, 20.0, 31.0, 41.0, 61.0, 53.0, 70.0, 81.0, 110.0, 81.0, 75.0, 77.0, 54.0, 30.0, 24.0, 22.0, 21.0, 18.0, 7.0, 10.0, 2.0, 2.0, 10.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2054443359375, -0.1993122100830078, -0.19318008422851562, -0.18704795837402344, -0.18091583251953125, -0.17478370666503906, -0.16865158081054688, -0.1625194549560547, -0.1563873291015625, -0.1502552032470703, -0.14412307739257812, -0.13799095153808594, -0.13185882568359375, -0.12572669982910156, -0.11959457397460938, -0.11346244812011719, -0.107330322265625, -0.10119819641113281, -0.09506607055664062, -0.08893394470214844, -0.08280181884765625, -0.07666969299316406, -0.07053756713867188, -0.06440544128417969, -0.0582733154296875, -0.05214118957519531, -0.046009063720703125, -0.03987693786621094, -0.03374481201171875, -0.027612686157226562, -0.021480560302734375, -0.015348434448242188, -0.00921630859375, -0.0030841827392578125, 0.003047943115234375, 0.009180068969726562, 0.01531219482421875, 0.021444320678710938, 0.027576446533203125, 0.03370857238769531, 0.0398406982421875, 0.04597282409667969, 0.052104949951171875, 0.05823707580566406, 0.06436920166015625, 0.07050132751464844, 0.07663345336914062, 0.08276557922363281, 0.088897705078125, 0.09502983093261719, 0.10116195678710938, 0.10729408264160156, 0.11342620849609375, 0.11955833435058594, 0.12569046020507812, 0.1318225860595703, 0.1379547119140625, 0.1440868377685547, 0.15021896362304688, 0.15635108947753906, 0.16248321533203125, 0.16861534118652344, 0.17474746704101562, 0.1808795928955078, 0.18701171875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 10.0, 5.0, 13.0, 122.0, 668.0, 156.0, 21.0, 9.0, 1.0, 2.0, 1.0, 2.0], "bins": [-26.998016357421875, -26.521320343017578, -26.04462242126465, -25.56792640686035, -25.091230392456055, -24.614534378051758, -24.137836456298828, -23.66114044189453, -23.184444427490234, -22.707748413085938, -22.231050491333008, -21.75435447692871, -21.277658462524414, -20.800962448120117, -20.324264526367188, -19.84756851196289, -19.370872497558594, -18.894176483154297, -18.417478561401367, -17.94078254699707, -17.464086532592773, -16.987390518188477, -16.510692596435547, -16.03399658203125, -15.55729866027832, -15.080601692199707, -14.60390567779541, -14.127208709716797, -13.6505126953125, -13.173815727233887, -12.697118759155273, -12.220422744750977, -11.743725776672363, -11.26702880859375, -10.790332794189453, -10.31363582611084, -9.836939811706543, -9.36024284362793, -8.883546829223633, -8.40684986114502, -7.9301533699035645, -7.453456878662109, -6.976760387420654, -6.500063896179199, -6.023366928100586, -5.546670913696289, -5.069973945617676, -4.593277454376221, -4.116580963134766, -3.6398844718933105, -3.1631879806518555, -2.6864912509918213, -2.209794759750366, -1.7330982685089111, -1.256401538848877, -0.7797050476074219, -0.3030085563659668, 0.17368799448013306, 0.6503845453262329, 1.1270811557769775, 1.6037776470184326, 2.0804741382598877, 2.557170867919922, 3.033867359161377, 3.510563850402832]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 7.0, 5.0, 21.0, 25.0, 26.0, 39.0, 67.0, 70.0, 77.0, 98.0, 119.0, 105.0, 71.0, 62.0, 56.0, 43.0, 36.0, 27.0, 14.0, 13.0, 9.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.415787696838379, -7.1360368728637695, -6.856285572052002, -6.576534748077393, -6.296783447265625, -6.017032623291016, -5.737281799316406, -5.457530498504639, -5.177779197692871, -4.898028373718262, -4.618277072906494, -4.338526248931885, -4.058774948120117, -3.779024124145508, -3.4992730617523193, -3.219521999359131, -2.9397711753845215, -2.660020112991333, -2.3802690505981445, -2.100518226623535, -1.8207670450210571, -1.5410159826278687, -1.2612650394439697, -0.9815139770507812, -0.7017629146575928, -0.4220118820667267, -0.1422608494758606, 0.1374901533126831, 0.4172412157058716, 0.6969922780990601, 0.976743221282959, 1.2564942836761475, 1.536245346069336, 1.8159964084625244, 2.095747470855713, 2.3754982948303223, 2.65524959564209, 2.935000419616699, 3.2147514820098877, 3.494502544403076, 3.7742536067962646, 4.054004669189453, 4.3337554931640625, 4.61350679397583, 4.8932576179504395, 5.173008918762207, 5.452759742736816, 5.732510566711426, 6.012261867523193, 6.292012691497803, 6.57176399230957, 6.85151481628418, 7.131266117095947, 7.411016941070557, 7.690768241882324, 7.970519065856934, 8.250269889831543, 8.530020713806152, 8.809771537780762, 9.089523315429688, 9.369274139404297, 9.649024963378906, 9.928775787353516, 10.208526611328125, 10.48827838897705]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 6.0, 24.0, 28.0, 36.0, 51.0, 99.0, 166.0, 275.0, 457.0, 849.0, 1675.0, 3999.0, 10788.0, 41336.0, 343174.0, 2739414.0, 942847.0, 83579.0, 15686.0, 5074.0, 2144.0, 1051.0, 571.0, 336.0, 212.0, 136.0, 82.0, 61.0, 34.0, 25.0, 16.0, 12.0, 7.0, 6.0, 3.0, 3.0, 7.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.199951171875, -0.192169189453125, -0.18438720703125, -0.176605224609375, -0.1688232421875, -0.161041259765625, -0.15325927734375, -0.145477294921875, -0.1376953125, -0.129913330078125, -0.12213134765625, -0.114349365234375, -0.1065673828125, -0.098785400390625, -0.09100341796875, -0.083221435546875, -0.075439453125, -0.067657470703125, -0.05987548828125, -0.052093505859375, -0.0443115234375, -0.036529541015625, -0.02874755859375, -0.020965576171875, -0.01318359375, -0.005401611328125, 0.00238037109375, 0.010162353515625, 0.0179443359375, 0.025726318359375, 0.03350830078125, 0.041290283203125, 0.049072265625, 0.056854248046875, 0.06463623046875, 0.072418212890625, 0.0802001953125, 0.087982177734375, 0.09576416015625, 0.103546142578125, 0.111328125, 0.119110107421875, 0.12689208984375, 0.134674072265625, 0.1424560546875, 0.150238037109375, 0.15802001953125, 0.165802001953125, 0.173583984375, 0.181365966796875, 0.18914794921875, 0.196929931640625, 0.2047119140625, 0.212493896484375, 0.22027587890625, 0.228057861328125, 0.23583984375, 0.243621826171875, 0.25140380859375, 0.259185791015625, 0.2669677734375, 0.274749755859375, 0.28253173828125, 0.290313720703125, 0.298095703125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 2.0, 3.0, 10.0, 6.0, 16.0, 16.0, 17.0, 17.0, 40.0, 45.0, 43.0, 42.0, 49.0, 50.0, 66.0, 55.0, 68.0, 53.0, 66.0, 58.0, 53.0, 45.0, 31.0, 40.0, 38.0, 20.0, 15.0, 6.0, 8.0, 9.0, 6.0, 6.0, 1.0, 1.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2393798828125, -0.23091697692871094, -0.22245407104492188, -0.2139911651611328, -0.20552825927734375, -0.1970653533935547, -0.18860244750976562, -0.18013954162597656, -0.1716766357421875, -0.16321372985839844, -0.15475082397460938, -0.1462879180908203, -0.13782501220703125, -0.1293621063232422, -0.12089920043945312, -0.11243629455566406, -0.103973388671875, -0.09551048278808594, -0.08704757690429688, -0.07858467102050781, -0.07012176513671875, -0.06165885925292969, -0.053195953369140625, -0.04473304748535156, -0.0362701416015625, -0.027807235717773438, -0.019344329833984375, -0.010881423950195312, -0.00241851806640625, 0.0060443878173828125, 0.014507293701171875, 0.022970199584960938, 0.03143310546875, 0.03989601135253906, 0.048358917236328125, 0.05682182312011719, 0.06528472900390625, 0.07374763488769531, 0.08221054077148438, 0.09067344665527344, 0.0991363525390625, 0.10759925842285156, 0.11606216430664062, 0.12452507019042969, 0.13298797607421875, 0.1414508819580078, 0.14991378784179688, 0.15837669372558594, 0.166839599609375, 0.17530250549316406, 0.18376541137695312, 0.1922283172607422, 0.20069122314453125, 0.2091541290283203, 0.21761703491210938, 0.22607994079589844, 0.2345428466796875, 0.24300575256347656, 0.2514686584472656, 0.2599315643310547, 0.26839447021484375, 0.2768573760986328, 0.2853202819824219, 0.29378318786621094, 0.30224609375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 8.0, 2.0, 6.0, 10.0, 6.0, 17.0, 25.0, 30.0, 51.0, 61.0, 120.0, 189.0, 306.0, 642.0, 1488.0, 3878.0, 13195.0, 61977.0, 902355.0, 3074858.0, 107887.0, 18558.0, 5176.0, 1772.0, 780.0, 376.0, 181.0, 97.0, 67.0, 51.0, 28.0, 24.0, 22.0, 14.0, 12.0, 5.0, 8.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.368896484375, -0.3577728271484375, -0.346649169921875, -0.3355255126953125, -0.32440185546875, -0.3132781982421875, -0.302154541015625, -0.2910308837890625, -0.2799072265625, -0.2687835693359375, -0.257659912109375, -0.2465362548828125, -0.23541259765625, -0.2242889404296875, -0.213165283203125, -0.2020416259765625, -0.19091796875, -0.1797943115234375, -0.168670654296875, -0.1575469970703125, -0.14642333984375, -0.1352996826171875, -0.124176025390625, -0.1130523681640625, -0.1019287109375, -0.0908050537109375, -0.079681396484375, -0.0685577392578125, -0.05743408203125, -0.0463104248046875, -0.035186767578125, -0.0240631103515625, -0.012939453125, -0.0018157958984375, 0.009307861328125, 0.0204315185546875, 0.03155517578125, 0.0426788330078125, 0.053802490234375, 0.0649261474609375, 0.0760498046875, 0.0871734619140625, 0.098297119140625, 0.1094207763671875, 0.12054443359375, 0.1316680908203125, 0.142791748046875, 0.1539154052734375, 0.1650390625, 0.1761627197265625, 0.187286376953125, 0.1984100341796875, 0.20953369140625, 0.2206573486328125, 0.231781005859375, 0.2429046630859375, 0.2540283203125, 0.2651519775390625, 0.276275634765625, 0.2873992919921875, 0.29852294921875, 0.3096466064453125, 0.320770263671875, 0.3318939208984375, 0.343017578125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 3.0, 8.0, 7.0, 12.0, 16.0, 19.0, 23.0, 45.0, 42.0, 80.0, 139.0, 300.0, 676.0, 1110.0, 872.0, 353.0, 141.0, 88.0, 40.0, 25.0, 21.0, 14.0, 11.0, 6.0, 7.0, 7.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5947265625, -0.5779876708984375, -0.561248779296875, -0.5445098876953125, -0.52777099609375, -0.5110321044921875, -0.494293212890625, -0.4775543212890625, -0.4608154296875, -0.4440765380859375, -0.427337646484375, -0.4105987548828125, -0.39385986328125, -0.3771209716796875, -0.360382080078125, -0.3436431884765625, -0.326904296875, -0.3101654052734375, -0.293426513671875, -0.2766876220703125, -0.25994873046875, -0.2432098388671875, -0.226470947265625, -0.2097320556640625, -0.1929931640625, -0.1762542724609375, -0.159515380859375, -0.1427764892578125, -0.12603759765625, -0.1092987060546875, -0.092559814453125, -0.0758209228515625, -0.05908203125, -0.0423431396484375, -0.025604248046875, -0.0088653564453125, 0.00787353515625, 0.0246124267578125, 0.041351318359375, 0.0580902099609375, 0.0748291015625, 0.0915679931640625, 0.108306884765625, 0.1250457763671875, 0.14178466796875, 0.1585235595703125, 0.175262451171875, 0.1920013427734375, 0.208740234375, 0.2254791259765625, 0.242218017578125, 0.2589569091796875, 0.27569580078125, 0.2924346923828125, 0.309173583984375, 0.3259124755859375, 0.3426513671875, 0.3593902587890625, 0.376129150390625, 0.3928680419921875, 0.40960693359375, 0.4263458251953125, 0.443084716796875, 0.4598236083984375, 0.4765625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 11.0, 51.0, 413.0, 455.0, 43.0, 10.0, 8.0, 5.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.742006301879883, -6.437751293182373, -6.133496284484863, -5.829241752624512, -5.524986743927002, -5.220731735229492, -4.916477203369141, -4.612222194671631, -4.307967185974121, -4.003712177276611, -3.6994574069976807, -3.39520263671875, -3.0909476280212402, -2.7866926193237305, -2.4824378490448, -2.178183078765869, -1.8739280700683594, -1.5696731805801392, -1.265418291091919, -0.9611634016036987, -0.6569085121154785, -0.3526536226272583, -0.048398733139038086, 0.2558560371398926, 0.5601110458374023, 0.8643659353256226, 1.1686208248138428, 1.472875714302063, 1.7771306037902832, 2.081385612487793, 2.3856403827667236, 2.6898951530456543, 2.994150161743164, 3.298405170440674, 3.6026599407196045, 3.906914710998535, 4.211169719696045, 4.515424728393555, 4.819679260253906, 5.123934268951416, 5.428189277648926, 5.7324442863464355, 6.036699295043945, 6.340953826904297, 6.645208835601807, 6.949463844299316, 7.253718376159668, 7.557973384857178, 7.8622283935546875, 8.166482925415039, 8.470738410949707, 8.774992942810059, 9.079248428344727, 9.383502960205078, 9.68775749206543, 9.992012023925781, 10.29626750946045, 10.6005220413208, 10.904777526855469, 11.20903205871582, 11.513286590576172, 11.81754207611084, 12.121796607971191, 12.42605209350586, 12.730306625366211]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 7.0, 9.0, 6.0, 9.0, 15.0, 16.0, 19.0, 23.0, 22.0, 26.0, 49.0, 42.0, 48.0, 47.0, 55.0, 68.0, 63.0, 63.0, 53.0, 53.0, 48.0, 39.0, 29.0, 33.0, 33.0, 22.0, 14.0, 23.0, 22.0, 11.0, 12.0, 8.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.8203125, -2.743502140045166, -2.666692018508911, -2.589881658554077, -2.513071298599243, -2.4362611770629883, -2.3594508171081543, -2.2826404571533203, -2.2058303356170654, -2.1290199756622314, -2.0522098541259766, -1.9753994941711426, -1.8985892534255981, -1.8217790126800537, -1.7449686527252197, -1.6681584119796753, -1.5913480520248413, -1.5145378112792969, -1.437727451324463, -1.3609172105789185, -1.284106969833374, -1.20729660987854, -1.1304863691329956, -1.0536761283874512, -0.976865828037262, -0.9000555276870728, -0.8232452869415283, -0.7464349865913391, -0.6696246862411499, -0.5928144454956055, -0.5160041451454163, -0.4391939043998718, -0.3623836040496826, -0.2855733335018158, -0.20876304805278778, -0.13195276260375977, -0.055142492055892944, 0.021667778491973877, 0.09847807884216309, 0.17528831958770752, 0.25209861993789673, 0.32890889048576355, 0.40571916103363037, 0.4825294613838196, 0.5593397617340088, 0.6361500024795532, 0.7129603028297424, 0.7897705435752869, 0.8665808439254761, 0.9433911442756653, 1.0202014446258545, 1.097011685371399, 1.1738219261169434, 1.2506322860717773, 1.3274425268173218, 1.4042527675628662, 1.4810631275177002, 1.5578733682632446, 1.6346837282180786, 1.711493968963623, 1.7883042097091675, 1.865114450454712, 1.941924810409546, 2.018734931945801, 2.0955452919006348]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 2.0, 9.0, 23.0, 28.0, 49.0, 63.0, 122.0, 251.0, 576.0, 1128.0, 2526.0, 6484.0, 18139.0, 60105.0, 212759.0, 434005.0, 219133.0, 62594.0, 18981.0, 6649.0, 2644.0, 1138.0, 538.0, 264.0, 150.0, 83.0, 35.0, 30.0, 17.0, 13.0, 5.0, 3.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.279296875, -0.2720451354980469, -0.26479339599609375, -0.2575416564941406, -0.2502899169921875, -0.24303817749023438, -0.23578643798828125, -0.22853469848632812, -0.221282958984375, -0.21403121948242188, -0.20677947998046875, -0.19952774047851562, -0.1922760009765625, -0.18502426147460938, -0.17777252197265625, -0.17052078247070312, -0.16326904296875, -0.15601730346679688, -0.14876556396484375, -0.14151382446289062, -0.1342620849609375, -0.12701034545898438, -0.11975860595703125, -0.11250686645507812, -0.105255126953125, -0.09800338745117188, -0.09075164794921875, -0.08349990844726562, -0.0762481689453125, -0.06899642944335938, -0.06174468994140625, -0.054492950439453125, -0.0472412109375, -0.039989471435546875, -0.03273773193359375, -0.025485992431640625, -0.0182342529296875, -0.010982513427734375, -0.00373077392578125, 0.003520965576171875, 0.010772705078125, 0.018024444580078125, 0.02527618408203125, 0.032527923583984375, 0.0397796630859375, 0.047031402587890625, 0.05428314208984375, 0.061534881591796875, 0.06878662109375, 0.07603836059570312, 0.08329010009765625, 0.09054183959960938, 0.0977935791015625, 0.10504531860351562, 0.11229705810546875, 0.11954879760742188, 0.126800537109375, 0.13405227661132812, 0.14130401611328125, 0.14855575561523438, 0.1558074951171875, 0.16305923461914062, 0.17031097412109375, 0.17756271362304688, 0.184814453125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 0.0, 4.0, 4.0, 10.0, 13.0, 11.0, 14.0, 24.0, 23.0, 33.0, 37.0, 40.0, 47.0, 51.0, 42.0, 63.0, 64.0, 65.0, 62.0, 65.0, 60.0, 48.0, 37.0, 41.0, 27.0, 21.0, 26.0, 15.0, 16.0, 12.0, 7.0, 7.0, 9.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.242431640625, -0.23490333557128906, -0.22737503051757812, -0.2198467254638672, -0.21231842041015625, -0.2047901153564453, -0.19726181030273438, -0.18973350524902344, -0.1822052001953125, -0.17467689514160156, -0.16714859008789062, -0.1596202850341797, -0.15209197998046875, -0.1445636749267578, -0.13703536987304688, -0.12950706481933594, -0.121978759765625, -0.11445045471191406, -0.10692214965820312, -0.09939384460449219, -0.09186553955078125, -0.08433723449707031, -0.07680892944335938, -0.06928062438964844, -0.0617523193359375, -0.05422401428222656, -0.046695709228515625, -0.03916740417480469, -0.03163909912109375, -0.024110794067382812, -0.016582489013671875, -0.009054183959960938, -0.00152587890625, 0.0060024261474609375, 0.013530731201171875, 0.021059036254882812, 0.02858734130859375, 0.03611564636230469, 0.043643951416015625, 0.05117225646972656, 0.0587005615234375, 0.06622886657714844, 0.07375717163085938, 0.08128547668457031, 0.08881378173828125, 0.09634208679199219, 0.10387039184570312, 0.11139869689941406, 0.118927001953125, 0.12645530700683594, 0.13398361206054688, 0.1415119171142578, 0.14904022216796875, 0.1565685272216797, 0.16409683227539062, 0.17162513732910156, 0.1791534423828125, 0.18668174743652344, 0.19421005249023438, 0.2017383575439453, 0.20926666259765625, 0.2167949676513672, 0.22432327270507812, 0.23185157775878906, 0.2393798828125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 5.0, 2.0, 2.0, 4.0, 2.0, 3.0, 8.0, 6.0, 7.0, 23.0, 23.0, 24.0, 41.0, 49.0, 54.0, 86.0, 104.0, 155.0, 197.0, 263.0, 362.0, 539.0, 977.0, 2155.0, 7831.0, 110065.0, 869469.0, 46473.0, 5273.0, 1727.0, 804.0, 491.0, 362.0, 232.0, 199.0, 128.0, 106.0, 82.0, 48.0, 40.0, 46.0, 19.0, 23.0, 14.0, 5.0, 8.0, 5.0, 8.0, 2.0, 5.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.61962890625, -0.5992279052734375, -0.578826904296875, -0.5584259033203125, -0.53802490234375, -0.5176239013671875, -0.497222900390625, -0.4768218994140625, -0.4564208984375, -0.4360198974609375, -0.415618896484375, -0.3952178955078125, -0.37481689453125, -0.3544158935546875, -0.334014892578125, -0.3136138916015625, -0.293212890625, -0.2728118896484375, -0.252410888671875, -0.2320098876953125, -0.21160888671875, -0.1912078857421875, -0.170806884765625, -0.1504058837890625, -0.1300048828125, -0.1096038818359375, -0.089202880859375, -0.0688018798828125, -0.04840087890625, -0.0279998779296875, -0.007598876953125, 0.0128021240234375, 0.033203125, 0.0536041259765625, 0.074005126953125, 0.0944061279296875, 0.11480712890625, 0.1352081298828125, 0.155609130859375, 0.1760101318359375, 0.1964111328125, 0.2168121337890625, 0.237213134765625, 0.2576141357421875, 0.27801513671875, 0.2984161376953125, 0.318817138671875, 0.3392181396484375, 0.359619140625, 0.3800201416015625, 0.400421142578125, 0.4208221435546875, 0.44122314453125, 0.4616241455078125, 0.482025146484375, 0.5024261474609375, 0.5228271484375, 0.5432281494140625, 0.563629150390625, 0.5840301513671875, 0.60443115234375, 0.6248321533203125, 0.645233154296875, 0.6656341552734375, 0.68603515625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 10.0, 5.0, 11.0, 16.0, 20.0, 29.0, 27.0, 35.0, 42.0, 48.0, 47.0, 56.0, 51.0, 66.0, 58.0, 58.0, 53.0, 62.0, 47.0, 39.0, 36.0, 27.0, 32.0, 31.0, 15.0, 21.0, 13.0, 10.0, 9.0, 5.0, 5.0, 1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.912109375, -0.8802490234375, -0.848388671875, -0.8165283203125, -0.78466796875, -0.7528076171875, -0.720947265625, -0.6890869140625, -0.6572265625, -0.6253662109375, -0.593505859375, -0.5616455078125, -0.52978515625, -0.4979248046875, -0.466064453125, -0.4342041015625, -0.40234375, -0.3704833984375, -0.338623046875, -0.3067626953125, -0.27490234375, -0.2430419921875, -0.211181640625, -0.1793212890625, -0.1474609375, -0.1156005859375, -0.083740234375, -0.0518798828125, -0.02001953125, 0.0118408203125, 0.043701171875, 0.0755615234375, 0.107421875, 0.1392822265625, 0.171142578125, 0.2030029296875, 0.23486328125, 0.2667236328125, 0.298583984375, 0.3304443359375, 0.3623046875, 0.3941650390625, 0.426025390625, 0.4578857421875, 0.48974609375, 0.5216064453125, 0.553466796875, 0.5853271484375, 0.6171875, 0.6490478515625, 0.680908203125, 0.7127685546875, 0.74462890625, 0.7764892578125, 0.808349609375, 0.8402099609375, 0.8720703125, 0.9039306640625, 0.935791015625, 0.9676513671875, 0.99951171875, 1.0313720703125, 1.063232421875, 1.0950927734375, 1.126953125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 4.0, 2.0, 12.0, 9.0, 20.0, 29.0, 31.0, 50.0, 68.0, 128.0, 208.0, 384.0, 794.0, 2284.0, 9180.0, 87153.0, 851462.0, 83802.0, 8998.0, 2164.0, 813.0, 352.0, 214.0, 106.0, 71.0, 59.0, 49.0, 29.0, 20.0, 8.0, 12.0, 3.0, 9.0, 11.0, 3.0, 3.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1767578125, -0.17131805419921875, -0.1658782958984375, -0.16043853759765625, -0.154998779296875, -0.14955902099609375, -0.1441192626953125, -0.13867950439453125, -0.13323974609375, -0.12779998779296875, -0.1223602294921875, -0.11692047119140625, -0.111480712890625, -0.10604095458984375, -0.1006011962890625, -0.09516143798828125, -0.0897216796875, -0.08428192138671875, -0.0788421630859375, -0.07340240478515625, -0.067962646484375, -0.06252288818359375, -0.0570831298828125, -0.05164337158203125, -0.04620361328125, -0.04076385498046875, -0.0353240966796875, -0.02988433837890625, -0.024444580078125, -0.01900482177734375, -0.0135650634765625, -0.00812530517578125, -0.002685546875, 0.00275421142578125, 0.0081939697265625, 0.01363372802734375, 0.019073486328125, 0.02451324462890625, 0.0299530029296875, 0.03539276123046875, 0.04083251953125, 0.04627227783203125, 0.0517120361328125, 0.05715179443359375, 0.062591552734375, 0.06803131103515625, 0.0734710693359375, 0.07891082763671875, 0.0843505859375, 0.08979034423828125, 0.0952301025390625, 0.10066986083984375, 0.106109619140625, 0.11154937744140625, 0.1169891357421875, 0.12242889404296875, 0.12786865234375, 0.13330841064453125, 0.1387481689453125, 0.14418792724609375, 0.149627685546875, 0.15506744384765625, 0.1605072021484375, 0.16594696044921875, 0.17138671875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 2.0, 1.0, 4.0, 2.0, 3.0, 5.0, 11.0, 17.0, 8.0, 14.0, 22.0, 22.0, 19.0, 28.0, 39.0, 37.0, 80.0, 104.0, 114.0, 105.0, 82.0, 76.0, 37.0, 28.0, 30.0, 23.0, 16.0, 15.0, 13.0, 13.0, 2.0, 5.0, 7.0, 3.0, 3.0, 0.0, 7.0, 3.0, 1.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.455183029174805e-05, -6.225146353244781e-05, -5.995109677314758e-05, -5.765073001384735e-05, -5.535036325454712e-05, -5.304999649524689e-05, -5.0749629735946655e-05, -4.844926297664642e-05, -4.614889621734619e-05, -4.384852945804596e-05, -4.154816269874573e-05, -3.9247795939445496e-05, -3.6947429180145264e-05, -3.464706242084503e-05, -3.23466956615448e-05, -3.0046328902244568e-05, -2.7745962142944336e-05, -2.5445595383644104e-05, -2.3145228624343872e-05, -2.084486186504364e-05, -1.8544495105743408e-05, -1.6244128346443176e-05, -1.3943761587142944e-05, -1.1643394827842712e-05, -9.34302806854248e-06, -7.0426613092422485e-06, -4.742294549942017e-06, -2.4419277906417847e-06, -1.4156103134155273e-07, 2.158805727958679e-06, 4.459172487258911e-06, 6.759539246559143e-06, 9.059906005859375e-06, 1.1360272765159607e-05, 1.3660639524459839e-05, 1.596100628376007e-05, 1.8261373043060303e-05, 2.0561739802360535e-05, 2.2862106561660767e-05, 2.5162473320961e-05, 2.746284008026123e-05, 2.9763206839561462e-05, 3.2063573598861694e-05, 3.4363940358161926e-05, 3.666430711746216e-05, 3.896467387676239e-05, 4.126504063606262e-05, 4.3565407395362854e-05, 4.5865774154663086e-05, 4.816614091396332e-05, 5.046650767326355e-05, 5.276687443256378e-05, 5.5067241191864014e-05, 5.7367607951164246e-05, 5.966797471046448e-05, 6.196834146976471e-05, 6.426870822906494e-05, 6.656907498836517e-05, 6.88694417476654e-05, 7.116980850696564e-05, 7.347017526626587e-05, 7.57705420255661e-05, 7.807090878486633e-05, 8.037127554416656e-05, 8.26716423034668e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 10.0, 1.0, 8.0, 9.0, 14.0, 18.0, 28.0, 32.0, 50.0, 67.0, 103.0, 141.0, 236.0, 409.0, 960.0, 2467.0, 9103.0, 70661.0, 861162.0, 87714.0, 10497.0, 2699.0, 996.0, 439.0, 255.0, 134.0, 112.0, 70.0, 42.0, 33.0, 20.0, 12.0, 12.0, 7.0, 7.0, 3.0, 3.0, 6.0, 3.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1925048828125, -0.18658828735351562, -0.18067169189453125, -0.17475509643554688, -0.1688385009765625, -0.16292190551757812, -0.15700531005859375, -0.15108871459960938, -0.145172119140625, -0.13925552368164062, -0.13333892822265625, -0.12742233276367188, -0.1215057373046875, -0.11558914184570312, -0.10967254638671875, -0.10375595092773438, -0.09783935546875, -0.09192276000976562, -0.08600616455078125, -0.08008956909179688, -0.0741729736328125, -0.06825637817382812, -0.06233978271484375, -0.056423187255859375, -0.050506591796875, -0.044589996337890625, -0.03867340087890625, -0.032756805419921875, -0.0268402099609375, -0.020923614501953125, -0.01500701904296875, -0.009090423583984375, -0.003173828125, 0.002742767333984375, 0.00865936279296875, 0.014575958251953125, 0.0204925537109375, 0.026409149169921875, 0.03232574462890625, 0.038242340087890625, 0.044158935546875, 0.050075531005859375, 0.05599212646484375, 0.061908721923828125, 0.0678253173828125, 0.07374191284179688, 0.07965850830078125, 0.08557510375976562, 0.09149169921875, 0.09740829467773438, 0.10332489013671875, 0.10924148559570312, 0.1151580810546875, 0.12107467651367188, 0.12699127197265625, 0.13290786743164062, 0.138824462890625, 0.14474105834960938, 0.15065765380859375, 0.15657424926757812, 0.1624908447265625, 0.16840744018554688, 0.17432403564453125, 0.18024063110351562, 0.1861572265625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 6.0, 4.0, 3.0, 4.0, 0.0, 2.0, 3.0, 8.0, 12.0, 8.0, 15.0, 19.0, 22.0, 32.0, 42.0, 55.0, 83.0, 73.0, 75.0, 101.0, 96.0, 64.0, 62.0, 43.0, 39.0, 32.0, 23.0, 26.0, 12.0, 13.0, 8.0, 2.0, 6.0, 6.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.1324462890625, -0.12774085998535156, -0.12303543090820312, -0.11833000183105469, -0.11362457275390625, -0.10891914367675781, -0.10421371459960938, -0.09950828552246094, -0.0948028564453125, -0.09009742736816406, -0.08539199829101562, -0.08068656921386719, -0.07598114013671875, -0.07127571105957031, -0.06657028198242188, -0.06186485290527344, -0.057159423828125, -0.05245399475097656, -0.047748565673828125, -0.04304313659667969, -0.03833770751953125, -0.03363227844238281, -0.028926849365234375, -0.024221420288085938, -0.0195159912109375, -0.014810562133789062, -0.010105133056640625, -0.0053997039794921875, -0.00069427490234375, 0.0040111541748046875, 0.008716583251953125, 0.013422012329101562, 0.01812744140625, 0.022832870483398438, 0.027538299560546875, 0.03224372863769531, 0.03694915771484375, 0.04165458679199219, 0.046360015869140625, 0.05106544494628906, 0.0557708740234375, 0.06047630310058594, 0.06518173217773438, 0.06988716125488281, 0.07459259033203125, 0.07929801940917969, 0.08400344848632812, 0.08870887756347656, 0.093414306640625, 0.09811973571777344, 0.10282516479492188, 0.10753059387207031, 0.11223602294921875, 0.11694145202636719, 0.12164688110351562, 0.12635231018066406, 0.1310577392578125, 0.13576316833496094, 0.14046859741210938, 0.1451740264892578, 0.14987945556640625, 0.1545848846435547, 0.15929031372070312, 0.16399574279785156, 0.168701171875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 13.0, 28.0, 146.0, 511.0, 201.0, 45.0, 21.0, 14.0, 10.0, 6.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8624258041381836, -2.634716510772705, -2.4070072174072266, -2.179297924041748, -1.9515886306762695, -1.723879337310791, -1.4961700439453125, -1.268460750579834, -1.0407514572143555, -0.813042163848877, -0.5853328704833984, -0.3576235771179199, -0.1299142837524414, 0.09779500961303711, 0.3255043029785156, 0.5532135963439941, 0.7809228897094727, 1.0086321830749512, 1.2363414764404297, 1.4640507698059082, 1.6917600631713867, 1.9194693565368652, 2.1471786499023438, 2.3748879432678223, 2.602597236633301, 2.8303065299987793, 3.058015823364258, 3.2857251167297363, 3.513434410095215, 3.7411437034606934, 3.968852996826172, 4.19656229019165, 4.424271583557129, 4.651980876922607, 4.879690170288086, 5.1073994636535645, 5.335108757019043, 5.5628180503845215, 5.79052734375, 6.0182366371154785, 6.245945930480957, 6.4736552238464355, 6.701364517211914, 6.929073810577393, 7.156783103942871, 7.38449239730835, 7.612201690673828, 7.839910984039307, 8.067620277404785, 8.295330047607422, 8.523038864135742, 8.750747680664062, 8.9784574508667, 9.206167221069336, 9.433876037597656, 9.661584854125977, 9.889294624328613, 10.11700439453125, 10.34471321105957, 10.57242202758789, 10.800131797790527, 11.027841567993164, 11.255550384521484, 11.483259201049805, 11.710968971252441]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 5.0, 3.0, 3.0, 8.0, 11.0, 10.0, 12.0, 25.0, 16.0, 28.0, 25.0, 33.0, 36.0, 39.0, 44.0, 37.0, 53.0, 82.0, 82.0, 70.0, 60.0, 51.0, 45.0, 40.0, 29.0, 24.0, 16.0, 11.0, 20.0, 21.0, 20.0, 12.0, 7.0, 8.0, 7.0, 4.0, 3.0, 7.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.527020454406738, -4.412191390991211, -4.297362327575684, -4.182532787322998, -4.067703723907471, -3.9528746604919434, -3.838045597076416, -3.7232162952423096, -3.6083872318267822, -3.493558168411255, -3.3787288665771484, -3.263899803161621, -3.1490705013275146, -3.0342414379119873, -2.919412136077881, -2.8045830726623535, -2.689754009246826, -2.574924945831299, -2.4600956439971924, -2.345266580581665, -2.2304372787475586, -2.1156082153320312, -2.000779151916504, -1.8859498500823975, -1.771120548248291, -1.6562913656234741, -1.5414621829986572, -1.4266331195831299, -1.311803936958313, -1.196974754333496, -1.0821455717086792, -0.9673164486885071, -0.852487325668335, -0.7376581430435181, -0.622829020023346, -0.507999837398529, -0.39317068457603455, -0.27834153175354004, -0.16351234912872314, -0.048683226108551025, 0.06614595651626587, 0.18097510933876038, 0.2958042621612549, 0.4106334447860718, 0.5254626274108887, 0.6402917504310608, 0.7551209330558777, 0.8699500560760498, 0.9847792387008667, 1.0996084213256836, 1.2144376039505005, 1.3292667865753174, 1.4440958499908447, 1.5589250326156616, 1.6737542152404785, 1.7885832786560059, 1.9034125804901123, 2.0182416439056396, 2.133070945739746, 2.2479000091552734, 2.36272931098938, 2.4775583744049072, 2.5923876762390137, 2.707216739654541, 2.8220458030700684]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 2.0, 7.0, 13.0, 14.0, 24.0, 39.0, 42.0, 80.0, 101.0, 176.0, 338.0, 637.0, 1406.0, 3165.0, 8699.0, 30127.0, 190516.0, 1707763.0, 1949170.0, 246779.0, 37120.0, 10003.0, 4015.0, 1908.0, 1012.0, 507.0, 262.0, 121.0, 71.0, 48.0, 35.0, 19.0, 19.0, 7.0, 6.0, 9.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2349853515625, -0.22864341735839844, -0.22230148315429688, -0.2159595489501953, -0.20961761474609375, -0.2032756805419922, -0.19693374633789062, -0.19059181213378906, -0.1842498779296875, -0.17790794372558594, -0.17156600952148438, -0.1652240753173828, -0.15888214111328125, -0.1525402069091797, -0.14619827270507812, -0.13985633850097656, -0.133514404296875, -0.12717247009277344, -0.12083053588867188, -0.11448860168457031, -0.10814666748046875, -0.10180473327636719, -0.09546279907226562, -0.08912086486816406, -0.0827789306640625, -0.07643699645996094, -0.07009506225585938, -0.06375312805175781, -0.05741119384765625, -0.05106925964355469, -0.044727325439453125, -0.03838539123535156, -0.03204345703125, -0.025701522827148438, -0.019359588623046875, -0.013017654418945312, -0.00667572021484375, -0.0003337860107421875, 0.006008148193359375, 0.012350082397460938, 0.0186920166015625, 0.025033950805664062, 0.031375885009765625, 0.03771781921386719, 0.04405975341796875, 0.05040168762207031, 0.056743621826171875, 0.06308555603027344, 0.069427490234375, 0.07576942443847656, 0.08211135864257812, 0.08845329284667969, 0.09479522705078125, 0.10113716125488281, 0.10747909545898438, 0.11382102966308594, 0.1201629638671875, 0.12650489807128906, 0.13284683227539062, 0.1391887664794922, 0.14553070068359375, 0.1518726348876953, 0.15821456909179688, 0.16455650329589844, 0.1708984375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 7.0, 6.0, 8.0, 14.0, 24.0, 38.0, 54.0, 70.0, 79.0, 95.0, 95.0, 121.0, 73.0, 102.0, 83.0, 49.0, 30.0, 30.0, 18.0, 7.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5263671875, -0.5141181945800781, -0.5018692016601562, -0.4896202087402344, -0.4773712158203125, -0.4651222229003906, -0.45287322998046875, -0.4406242370605469, -0.428375244140625, -0.4161262512207031, -0.40387725830078125, -0.3916282653808594, -0.3793792724609375, -0.3671302795410156, -0.35488128662109375, -0.3426322937011719, -0.33038330078125, -0.3181343078613281, -0.30588531494140625, -0.2936363220214844, -0.2813873291015625, -0.2691383361816406, -0.25688934326171875, -0.24464035034179688, -0.232391357421875, -0.22014236450195312, -0.20789337158203125, -0.19564437866210938, -0.1833953857421875, -0.17114639282226562, -0.15889739990234375, -0.14664840698242188, -0.1343994140625, -0.12215042114257812, -0.10990142822265625, -0.09765243530273438, -0.0854034423828125, -0.07315444946289062, -0.06090545654296875, -0.048656463623046875, -0.036407470703125, -0.024158477783203125, -0.01190948486328125, 0.000339508056640625, 0.0125885009765625, 0.024837493896484375, 0.03708648681640625, 0.049335479736328125, 0.06158447265625, 0.07383346557617188, 0.08608245849609375, 0.09833145141601562, 0.1105804443359375, 0.12282943725585938, 0.13507843017578125, 0.14732742309570312, 0.159576416015625, 0.17182540893554688, 0.18407440185546875, 0.19632339477539062, 0.2085723876953125, 0.22082138061523438, 0.23307037353515625, 0.24531936645507812, 0.257568359375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 3.0, 1.0, 3.0, 9.0, 10.0, 10.0, 20.0, 39.0, 74.0, 138.0, 257.0, 527.0, 954.0, 2175.0, 6902.0, 34552.0, 780462.0, 3288545.0, 67196.0, 8610.0, 2145.0, 753.0, 397.0, 209.0, 110.0, 68.0, 44.0, 24.0, 12.0, 15.0, 9.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3837890625, -0.3714790344238281, -0.35916900634765625, -0.3468589782714844, -0.3345489501953125, -0.3222389221191406, -0.30992889404296875, -0.2976188659667969, -0.285308837890625, -0.2729988098144531, -0.26068878173828125, -0.24837875366210938, -0.2360687255859375, -0.22375869750976562, -0.21144866943359375, -0.19913864135742188, -0.18682861328125, -0.17451858520507812, -0.16220855712890625, -0.14989852905273438, -0.1375885009765625, -0.12527847290039062, -0.11296844482421875, -0.10065841674804688, -0.088348388671875, -0.07603836059570312, -0.06372833251953125, -0.051418304443359375, -0.0391082763671875, -0.026798248291015625, -0.01448822021484375, -0.002178192138671875, 0.0101318359375, 0.022441864013671875, 0.03475189208984375, 0.047061920166015625, 0.0593719482421875, 0.07168197631835938, 0.08399200439453125, 0.09630203247070312, 0.108612060546875, 0.12092208862304688, 0.13323211669921875, 0.14554214477539062, 0.1578521728515625, 0.17016220092773438, 0.18247222900390625, 0.19478225708007812, 0.20709228515625, 0.21940231323242188, 0.23171234130859375, 0.24402236938476562, 0.2563323974609375, 0.2686424255371094, 0.28095245361328125, 0.2932624816894531, 0.305572509765625, 0.3178825378417969, 0.33019256591796875, 0.3425025939941406, 0.3548126220703125, 0.3671226501464844, 0.37943267822265625, 0.3917427062988281, 0.404052734375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 7.0, 6.0, 10.0, 19.0, 29.0, 45.0, 76.0, 170.0, 545.0, 1361.0, 1203.0, 376.0, 113.0, 50.0, 26.0, 10.0, 16.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57470703125, -0.5540847778320312, -0.5334625244140625, -0.5128402709960938, -0.492218017578125, -0.47159576416015625, -0.4509735107421875, -0.43035125732421875, -0.40972900390625, -0.38910675048828125, -0.3684844970703125, -0.34786224365234375, -0.327239990234375, -0.30661773681640625, -0.2859954833984375, -0.26537322998046875, -0.2447509765625, -0.22412872314453125, -0.2035064697265625, -0.18288421630859375, -0.162261962890625, -0.14163970947265625, -0.1210174560546875, -0.10039520263671875, -0.07977294921875, -0.05915069580078125, -0.0385284423828125, -0.01790618896484375, 0.002716064453125, 0.02333831787109375, 0.0439605712890625, 0.06458282470703125, 0.085205078125, 0.10582733154296875, 0.1264495849609375, 0.14707183837890625, 0.167694091796875, 0.18831634521484375, 0.2089385986328125, 0.22956085205078125, 0.25018310546875, 0.27080535888671875, 0.2914276123046875, 0.31204986572265625, 0.332672119140625, 0.35329437255859375, 0.3739166259765625, 0.39453887939453125, 0.4151611328125, 0.43578338623046875, 0.4564056396484375, 0.47702789306640625, 0.497650146484375, 0.5182723999023438, 0.5388946533203125, 0.5595169067382812, 0.58013916015625, 0.6007614135742188, 0.6213836669921875, 0.6420059204101562, 0.662628173828125, 0.6832504272460938, 0.7038726806640625, 0.7244949340820312, 0.7451171875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 7.0, 33.0, 119.0, 372.0, 340.0, 89.0, 14.0, 8.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.320489883422852, -6.140018939971924, -5.959547996520996, -5.779077053070068, -5.598606109619141, -5.418135166168213, -5.237664222717285, -5.057193279266357, -4.87672233581543, -4.696251392364502, -4.515780448913574, -4.3353095054626465, -4.154838562011719, -3.974367618560791, -3.7938966751098633, -3.6134257316589355, -3.4329545497894287, -3.252483606338501, -3.0720126628875732, -2.8915417194366455, -2.7110707759857178, -2.53059983253479, -2.350128650665283, -2.1696577072143555, -1.9891868829727173, -1.8087159395217896, -1.6282449960708618, -1.4477739334106445, -1.2673029899597168, -1.086832046508789, -0.9063611030578613, -0.7258901596069336, -0.5454192161560059, -0.3649482727050781, -0.184477299451828, -0.004006326198577881, 0.17646461725234985, 0.3569355607032776, 0.5374065637588501, 0.7178775072097778, 0.8983484506607056, 1.0788193941116333, 1.259290337562561, 1.4397614002227783, 1.620232343673706, 1.8007032871246338, 1.9811742305755615, 2.1616451740264893, 2.342116117477417, 2.5225870609283447, 2.7030580043792725, 2.8835289478302, 3.063999891281128, 3.2444708347320557, 3.4249420166015625, 3.6054129600524902, 3.785883903503418, 3.9663548469543457, 4.146825790405273, 4.327296733856201, 4.507767677307129, 4.688238620758057, 4.868709564208984, 5.049180507659912, 5.22965145111084]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 5.0, 9.0, 8.0, 15.0, 9.0, 22.0, 20.0, 29.0, 36.0, 54.0, 62.0, 76.0, 82.0, 84.0, 80.0, 76.0, 77.0, 61.0, 54.0, 35.0, 30.0, 23.0, 19.0, 13.0, 7.0, 6.0, 4.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.850261926651001, -1.7613246440887451, -1.6723873615264893, -1.5834500789642334, -1.4945127964019775, -1.4055755138397217, -1.3166381120681763, -1.2277008295059204, -1.1387635469436646, -1.0498262643814087, -0.9608889818191528, -0.8719516396522522, -0.7830143570899963, -0.6940770745277405, -0.6051397323608398, -0.516202449798584, -0.4272651672363281, -0.33832788467407227, -0.24939057230949402, -0.16045325994491577, -0.07151597738265991, 0.017421305179595947, 0.10635864734649658, 0.19529592990875244, 0.2842332124710083, 0.37317049503326416, 0.4621078073978424, 0.5510451197624207, 0.6399824023246765, 0.7289196848869324, 0.817857027053833, 0.9067943096160889, 0.9957313537597656, 1.0846686363220215, 1.1736059188842773, 1.2625432014465332, 1.351480484008789, 1.440417766571045, 1.5293551683425903, 1.6182924509048462, 1.707229733467102, 1.796167016029358, 1.8851042985916138, 1.9740417003631592, 2.062978982925415, 2.151916265487671, 2.2408535480499268, 2.3297908306121826, 2.4187281131744385, 2.5076653957366943, 2.59660267829895, 2.685539960861206, 2.774477243423462, 2.8634145259857178, 2.9523520469665527, 3.0412893295288086, 3.1302266120910645, 3.2191638946533203, 3.308101177215576, 3.397038459777832, 3.485975742340088, 3.5749130249023438, 3.6638503074645996, 3.7527875900268555, 3.8417248725891113]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 0.0, 6.0, 2.0, 7.0, 7.0, 13.0, 10.0, 31.0, 27.0, 38.0, 67.0, 105.0, 166.0, 291.0, 501.0, 913.0, 1961.0, 4644.0, 12719.0, 39375.0, 139561.0, 403020.0, 310379.0, 92276.0, 26749.0, 8908.0, 3401.0, 1545.0, 740.0, 413.0, 243.0, 130.0, 89.0, 55.0, 40.0, 32.0, 20.0, 20.0, 13.0, 11.0, 11.0, 2.0, 2.0, 5.0, 6.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.236328125, -0.22866439819335938, -0.22100067138671875, -0.21333694458007812, -0.2056732177734375, -0.19800949096679688, -0.19034576416015625, -0.18268203735351562, -0.175018310546875, -0.16735458374023438, -0.15969085693359375, -0.15202713012695312, -0.1443634033203125, -0.13669967651367188, -0.12903594970703125, -0.12137222290039062, -0.11370849609375, -0.10604476928710938, -0.09838104248046875, -0.09071731567382812, -0.0830535888671875, -0.07538986206054688, -0.06772613525390625, -0.060062408447265625, -0.052398681640625, -0.044734954833984375, -0.03707122802734375, -0.029407501220703125, -0.0217437744140625, -0.014080047607421875, -0.00641632080078125, 0.001247406005859375, 0.0089111328125, 0.016574859619140625, 0.02423858642578125, 0.031902313232421875, 0.0395660400390625, 0.047229766845703125, 0.05489349365234375, 0.06255722045898438, 0.070220947265625, 0.07788467407226562, 0.08554840087890625, 0.09321212768554688, 0.1008758544921875, 0.10853958129882812, 0.11620330810546875, 0.12386703491210938, 0.13153076171875, 0.13919448852539062, 0.14685821533203125, 0.15452194213867188, 0.1621856689453125, 0.16984939575195312, 0.17751312255859375, 0.18517684936523438, 0.192840576171875, 0.20050430297851562, 0.20816802978515625, 0.21583175659179688, 0.2234954833984375, 0.23115921020507812, 0.23882293701171875, 0.24648666381835938, 0.254150390625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 6.0, 1.0, 5.0, 5.0, 6.0, 3.0, 14.0, 10.0, 22.0, 23.0, 35.0, 44.0, 40.0, 50.0, 62.0, 78.0, 64.0, 63.0, 74.0, 62.0, 73.0, 54.0, 34.0, 53.0, 33.0, 28.0, 17.0, 17.0, 11.0, 8.0, 6.0, 9.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2406005859375, -0.2329540252685547, -0.22530746459960938, -0.21766090393066406, -0.21001434326171875, -0.20236778259277344, -0.19472122192382812, -0.1870746612548828, -0.1794281005859375, -0.1717815399169922, -0.16413497924804688, -0.15648841857910156, -0.14884185791015625, -0.14119529724121094, -0.13354873657226562, -0.1259021759033203, -0.118255615234375, -0.11060905456542969, -0.10296249389648438, -0.09531593322753906, -0.08766937255859375, -0.08002281188964844, -0.07237625122070312, -0.06472969055175781, -0.0570831298828125, -0.04943656921386719, -0.041790008544921875, -0.03414344787597656, -0.02649688720703125, -0.018850326538085938, -0.011203765869140625, -0.0035572052001953125, 0.00408935546875, 0.011735916137695312, 0.019382476806640625, 0.027029037475585938, 0.03467559814453125, 0.04232215881347656, 0.049968719482421875, 0.05761528015136719, 0.0652618408203125, 0.07290840148925781, 0.08055496215820312, 0.08820152282714844, 0.09584808349609375, 0.10349464416503906, 0.11114120483398438, 0.11878776550292969, 0.126434326171875, 0.1340808868408203, 0.14172744750976562, 0.14937400817871094, 0.15702056884765625, 0.16466712951660156, 0.17231369018554688, 0.1799602508544922, 0.1876068115234375, 0.1952533721923828, 0.20289993286132812, 0.21054649353027344, 0.21819305419921875, 0.22583961486816406, 0.23348617553710938, 0.2411327362060547, 0.248779296875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 7.0, 3.0, 9.0, 8.0, 13.0, 24.0, 22.0, 42.0, 55.0, 81.0, 117.0, 187.0, 279.0, 404.0, 693.0, 1377.0, 3635.0, 28068.0, 827793.0, 172358.0, 8675.0, 2134.0, 1015.0, 521.0, 341.0, 220.0, 147.0, 119.0, 69.0, 44.0, 28.0, 17.0, 15.0, 14.0, 11.0, 8.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72509765625, -0.7029647827148438, -0.6808319091796875, -0.6586990356445312, -0.636566162109375, -0.6144332885742188, -0.5923004150390625, -0.5701675415039062, -0.54803466796875, -0.5259017944335938, -0.5037689208984375, -0.48163604736328125, -0.459503173828125, -0.43737030029296875, -0.4152374267578125, -0.39310455322265625, -0.3709716796875, -0.34883880615234375, -0.3267059326171875, -0.30457305908203125, -0.282440185546875, -0.26030731201171875, -0.2381744384765625, -0.21604156494140625, -0.19390869140625, -0.17177581787109375, -0.1496429443359375, -0.12751007080078125, -0.105377197265625, -0.08324432373046875, -0.0611114501953125, -0.03897857666015625, -0.016845703125, 0.00528717041015625, 0.0274200439453125, 0.04955291748046875, 0.071685791015625, 0.09381866455078125, 0.1159515380859375, 0.13808441162109375, 0.16021728515625, 0.18235015869140625, 0.2044830322265625, 0.22661590576171875, 0.248748779296875, 0.27088165283203125, 0.2930145263671875, 0.31514739990234375, 0.3372802734375, 0.35941314697265625, 0.3815460205078125, 0.40367889404296875, 0.425811767578125, 0.44794464111328125, 0.4700775146484375, 0.49221038818359375, 0.51434326171875, 0.5364761352539062, 0.5586090087890625, 0.5807418823242188, 0.602874755859375, 0.6250076293945312, 0.6471405029296875, 0.6692733764648438, 0.69140625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 5.0, 5.0, 3.0, 5.0, 7.0, 12.0, 14.0, 18.0, 15.0, 19.0, 19.0, 30.0, 19.0, 45.0, 38.0, 36.0, 33.0, 48.0, 48.0, 50.0, 54.0, 44.0, 55.0, 47.0, 39.0, 42.0, 38.0, 34.0, 22.0, 28.0, 22.0, 18.0, 16.0, 10.0, 16.0, 9.0, 9.0, 8.0, 8.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.6630859375, -0.6439285278320312, -0.6247711181640625, -0.6056137084960938, -0.586456298828125, -0.5672988891601562, -0.5481414794921875, -0.5289840698242188, -0.50982666015625, -0.49066925048828125, -0.4715118408203125, -0.45235443115234375, -0.433197021484375, -0.41403961181640625, -0.3948822021484375, -0.37572479248046875, -0.3565673828125, -0.33740997314453125, -0.3182525634765625, -0.29909515380859375, -0.279937744140625, -0.26078033447265625, -0.2416229248046875, -0.22246551513671875, -0.20330810546875, -0.18415069580078125, -0.1649932861328125, -0.14583587646484375, -0.126678466796875, -0.10752105712890625, -0.0883636474609375, -0.06920623779296875, -0.050048828125, -0.03089141845703125, -0.0117340087890625, 0.00742340087890625, 0.026580810546875, 0.04573822021484375, 0.0648956298828125, 0.08405303955078125, 0.10321044921875, 0.12236785888671875, 0.1415252685546875, 0.16068267822265625, 0.179840087890625, 0.19899749755859375, 0.2181549072265625, 0.23731231689453125, 0.2564697265625, 0.27562713623046875, 0.2947845458984375, 0.31394195556640625, 0.333099365234375, 0.35225677490234375, 0.3714141845703125, 0.39057159423828125, 0.40972900390625, 0.42888641357421875, 0.4480438232421875, 0.46720123291015625, 0.486358642578125, 0.5055160522460938, 0.5246734619140625, 0.5438308715820312, 0.56298828125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 8.0, 4.0, 12.0, 9.0, 7.0, 23.0, 18.0, 22.0, 40.0, 65.0, 83.0, 162.0, 330.0, 885.0, 3623.0, 40757.0, 917753.0, 77554.0, 5220.0, 1115.0, 392.0, 167.0, 91.0, 51.0, 34.0, 26.0, 24.0, 15.0, 15.0, 11.0, 4.0, 5.0, 8.0, 6.0, 3.0, 4.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2113037109375, -0.2036457061767578, -0.19598770141601562, -0.18832969665527344, -0.18067169189453125, -0.17301368713378906, -0.16535568237304688, -0.1576976776123047, -0.1500396728515625, -0.1423816680908203, -0.13472366333007812, -0.12706565856933594, -0.11940765380859375, -0.11174964904785156, -0.10409164428710938, -0.09643363952636719, -0.088775634765625, -0.08111763000488281, -0.07345962524414062, -0.06580162048339844, -0.05814361572265625, -0.05048561096191406, -0.042827606201171875, -0.03516960144042969, -0.0275115966796875, -0.019853591918945312, -0.012195587158203125, -0.0045375823974609375, 0.00312042236328125, 0.010778427124023438, 0.018436431884765625, 0.026094436645507812, 0.03375244140625, 0.04141044616699219, 0.049068450927734375, 0.05672645568847656, 0.06438446044921875, 0.07204246520996094, 0.07970046997070312, 0.08735847473144531, 0.0950164794921875, 0.10267448425292969, 0.11033248901367188, 0.11799049377441406, 0.12564849853515625, 0.13330650329589844, 0.14096450805664062, 0.1486225128173828, 0.156280517578125, 0.1639385223388672, 0.17159652709960938, 0.17925453186035156, 0.18691253662109375, 0.19457054138183594, 0.20222854614257812, 0.2098865509033203, 0.2175445556640625, 0.2252025604248047, 0.23286056518554688, 0.24051856994628906, 0.24817657470703125, 0.25583457946777344, 0.2634925842285156, 0.2711505889892578, 0.27880859375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 2.0, 4.0, 7.0, 6.0, 7.0, 14.0, 16.0, 27.0, 35.0, 58.0, 115.0, 182.0, 176.0, 126.0, 54.0, 40.0, 30.0, 23.0, 16.0, 16.0, 5.0, 5.0, 2.0, 5.0, 3.0, 3.0, 4.0, 1.0, 5.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00011849403381347656, -0.0001147901639342308, -0.00011108629405498505, -0.00010738242417573929, -0.00010367855429649353, -9.997468441724777e-05, -9.627081453800201e-05, -9.256694465875626e-05, -8.88630747795105e-05, -8.515920490026474e-05, -8.145533502101898e-05, -7.775146514177322e-05, -7.404759526252747e-05, -7.034372538328171e-05, -6.663985550403595e-05, -6.293598562479019e-05, -5.9232115745544434e-05, -5.5528245866298676e-05, -5.182437598705292e-05, -4.812050610780716e-05, -4.44166362285614e-05, -4.071276634931564e-05, -3.7008896470069885e-05, -3.330502659082413e-05, -2.960115671157837e-05, -2.589728683233261e-05, -2.2193416953086853e-05, -1.8489547073841095e-05, -1.4785677194595337e-05, -1.1081807315349579e-05, -7.377937436103821e-06, -3.6740675568580627e-06, 2.9802322387695312e-08, 3.7336722016334534e-06, 7.4375420808792114e-06, 1.114141196012497e-05, 1.4845281839370728e-05, 1.8549151718616486e-05, 2.2253021597862244e-05, 2.5956891477108002e-05, 2.966076135635376e-05, 3.336463123559952e-05, 3.7068501114845276e-05, 4.0772370994091034e-05, 4.447624087333679e-05, 4.818011075258255e-05, 5.188398063182831e-05, 5.5587850511074066e-05, 5.9291720390319824e-05, 6.299559026956558e-05, 6.669946014881134e-05, 7.04033300280571e-05, 7.410719990730286e-05, 7.781106978654861e-05, 8.151493966579437e-05, 8.521880954504013e-05, 8.892267942428589e-05, 9.262654930353165e-05, 9.63304191827774e-05, 0.00010003428906202316, 0.00010373815894126892, 0.00010744202882051468, 0.00011114589869976044, 0.0001148497685790062, 0.00011855363845825195]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 4.0, 6.0, 1.0, 7.0, 9.0, 13.0, 15.0, 31.0, 54.0, 66.0, 132.0, 209.0, 461.0, 1181.0, 3986.0, 27238.0, 793351.0, 206421.0, 11372.0, 2376.0, 799.0, 380.0, 183.0, 95.0, 61.0, 41.0, 16.0, 16.0, 8.0, 10.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1756591796875, -0.16910743713378906, -0.16255569458007812, -0.1560039520263672, -0.14945220947265625, -0.1429004669189453, -0.13634872436523438, -0.12979698181152344, -0.1232452392578125, -0.11669349670410156, -0.11014175415039062, -0.10359001159667969, -0.09703826904296875, -0.09048652648925781, -0.08393478393554688, -0.07738304138183594, -0.070831298828125, -0.06427955627441406, -0.057727813720703125, -0.05117607116699219, -0.04462432861328125, -0.03807258605957031, -0.031520843505859375, -0.024969100952148438, -0.0184173583984375, -0.011865615844726562, -0.005313873291015625, 0.0012378692626953125, 0.00778961181640625, 0.014341354370117188, 0.020893096923828125, 0.027444839477539062, 0.03399658203125, 0.04054832458496094, 0.047100067138671875, 0.05365180969238281, 0.06020355224609375, 0.06675529479980469, 0.07330703735351562, 0.07985877990722656, 0.0864105224609375, 0.09296226501464844, 0.09951400756835938, 0.10606575012207031, 0.11261749267578125, 0.11916923522949219, 0.12572097778320312, 0.13227272033691406, 0.138824462890625, 0.14537620544433594, 0.15192794799804688, 0.1584796905517578, 0.16503143310546875, 0.1715831756591797, 0.17813491821289062, 0.18468666076660156, 0.1912384033203125, 0.19779014587402344, 0.20434188842773438, 0.2108936309814453, 0.21744537353515625, 0.2239971160888672, 0.23054885864257812, 0.23710060119628906, 0.24365234375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 1.0, 5.0, 7.0, 4.0, 5.0, 3.0, 5.0, 14.0, 5.0, 22.0, 20.0, 38.0, 39.0, 64.0, 66.0, 73.0, 89.0, 90.0, 79.0, 67.0, 71.0, 42.0, 44.0, 28.0, 31.0, 10.0, 13.0, 5.0, 16.0, 8.0, 9.0, 4.0, 6.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0], "bins": [-0.1424560546875, -0.13886260986328125, -0.1352691650390625, -0.13167572021484375, -0.128082275390625, -0.12448883056640625, -0.1208953857421875, -0.11730194091796875, -0.11370849609375, -0.11011505126953125, -0.1065216064453125, -0.10292816162109375, -0.099334716796875, -0.09574127197265625, -0.0921478271484375, -0.08855438232421875, -0.0849609375, -0.08136749267578125, -0.0777740478515625, -0.07418060302734375, -0.070587158203125, -0.06699371337890625, -0.0634002685546875, -0.05980682373046875, -0.05621337890625, -0.05261993408203125, -0.0490264892578125, -0.04543304443359375, -0.041839599609375, -0.03824615478515625, -0.0346527099609375, -0.03105926513671875, -0.0274658203125, -0.02387237548828125, -0.0202789306640625, -0.01668548583984375, -0.013092041015625, -0.00949859619140625, -0.0059051513671875, -0.00231170654296875, 0.00128173828125, 0.00487518310546875, 0.0084686279296875, 0.01206207275390625, 0.015655517578125, 0.01924896240234375, 0.0228424072265625, 0.02643585205078125, 0.030029296875, 0.03362274169921875, 0.0372161865234375, 0.04080963134765625, 0.044403076171875, 0.04799652099609375, 0.0515899658203125, 0.05518341064453125, 0.05877685546875, 0.06237030029296875, 0.0659637451171875, 0.06955718994140625, 0.073150634765625, 0.07674407958984375, 0.0803375244140625, 0.08393096923828125, 0.0875244140625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 8.0, 18.0, 80.0, 295.0, 394.0, 114.0, 34.0, 22.0, 11.0, 7.0, 6.0, 2.0, 3.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9648702144622803, -1.7874879837036133, -1.6101056337356567, -1.4327232837677002, -1.2553410530090332, -1.0779588222503662, -0.9005764722824097, -0.7231941223144531, -0.5458118915557861, -0.36842960119247437, -0.1910473108291626, -0.01366502046585083, 0.16371726989746094, 0.3410995602607727, 0.5184818506240845, 0.695864200592041, 0.873246431350708, 1.050628662109375, 1.2280110120773315, 1.405393362045288, 1.582775592803955, 1.760157823562622, 1.9375401735305786, 2.114922523498535, 2.292304754257202, 2.469686985015869, 2.6470694541931152, 2.8244516849517822, 3.001833915710449, 3.179216146469116, 3.356598377227783, 3.5339808464050293, 3.711362838745117, 3.888745069503784, 4.066127300262451, 4.243509769439697, 4.420891761779785, 4.598274230957031, 4.775656700134277, 4.953039169311523, 5.130421161651611, 5.307803630828857, 5.485185623168945, 5.662568092346191, 5.8399505615234375, 6.017332553863525, 6.1947150230407715, 6.372097015380859, 6.5494794845581055, 6.726861953735352, 6.9042439460754395, 7.0816264152526855, 7.259008407592773, 7.4363908767700195, 7.613773345947266, 7.791155815124512, 7.9685378074646, 8.145919799804688, 8.323302268981934, 8.50068473815918, 8.678067207336426, 8.855449676513672, 9.032831192016602, 9.210213661193848, 9.387596130371094]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 3.0, 4.0, 1.0, 5.0, 5.0, 6.0, 2.0, 3.0, 5.0, 11.0, 12.0, 15.0, 15.0, 8.0, 21.0, 23.0, 14.0, 23.0, 21.0, 34.0, 21.0, 29.0, 29.0, 33.0, 52.0, 68.0, 58.0, 55.0, 60.0, 34.0, 53.0, 44.0, 24.0, 22.0, 28.0, 20.0, 25.0, 21.0, 17.0, 12.0, 13.0, 10.0, 9.0, 6.0, 9.0, 6.0, 8.0, 8.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-2.0536327362060547, -1.9866238832473755, -1.9196151494979858, -1.8526062965393066, -1.785597562789917, -1.7185887098312378, -1.6515798568725586, -1.584571123123169, -1.5175623893737793, -1.4505535364151, -1.3835448026657104, -1.3165359497070312, -1.2495272159576416, -1.1825183629989624, -1.1155095100402832, -1.0485007762908936, -0.9814919233322144, -0.9144831299781799, -0.8474743366241455, -0.7804654836654663, -0.7134567499160767, -0.6464478969573975, -0.579439103603363, -0.5124303102493286, -0.4454215168952942, -0.37841272354125977, -0.31140393018722534, -0.24439510703086853, -0.1773863136768341, -0.11037752032279968, -0.04336869716644287, 0.023640096187591553, 0.09064888954162598, 0.1576576828956604, 0.22466649115085602, 0.29167529940605164, 0.35868409276008606, 0.4256928861141205, 0.4927017092704773, 0.5597105026245117, 0.6267192959785461, 0.6937280893325806, 0.760736882686615, 0.8277456760406494, 0.8947545289993286, 0.9617632627487183, 1.0287721157073975, 1.095780849456787, 1.1627897024154663, 1.2297985553741455, 1.2968072891235352, 1.3638161420822144, 1.430824875831604, 1.4978337287902832, 1.5648424625396729, 1.631851315498352, 1.6988601684570312, 1.7658690214157104, 1.8328777551651, 1.8998866081237793, 1.966895341873169, 2.0339040756225586, 2.1009130477905273, 2.167921781539917, 2.2349305152893066]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 11.0, 18.0, 29.0, 49.0, 83.0, 198.0, 473.0, 1685.0, 12565.0, 685095.0, 3442515.0, 47180.0, 3140.0, 677.0, 276.0, 145.0, 71.0, 34.0, 23.0, 7.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6435546875, -0.6283111572265625, -0.613067626953125, -0.5978240966796875, -0.58258056640625, -0.5673370361328125, -0.552093505859375, -0.5368499755859375, -0.5216064453125, -0.5063629150390625, -0.491119384765625, -0.4758758544921875, -0.46063232421875, -0.4453887939453125, -0.430145263671875, -0.4149017333984375, -0.399658203125, -0.3844146728515625, -0.369171142578125, -0.3539276123046875, -0.33868408203125, -0.3234405517578125, -0.308197021484375, -0.2929534912109375, -0.2777099609375, -0.2624664306640625, -0.247222900390625, -0.2319793701171875, -0.21673583984375, -0.2014923095703125, -0.186248779296875, -0.1710052490234375, -0.15576171875, -0.1405181884765625, -0.125274658203125, -0.1100311279296875, -0.09478759765625, -0.0795440673828125, -0.064300537109375, -0.0490570068359375, -0.0338134765625, -0.0185699462890625, -0.003326416015625, 0.0119171142578125, 0.02716064453125, 0.0424041748046875, 0.057647705078125, 0.0728912353515625, 0.088134765625, 0.1033782958984375, 0.118621826171875, 0.1338653564453125, 0.14910888671875, 0.1643524169921875, 0.179595947265625, 0.1948394775390625, 0.2100830078125, 0.2253265380859375, 0.240570068359375, 0.2558135986328125, 0.27105712890625, 0.2863006591796875, 0.301544189453125, 0.3167877197265625, 0.33203125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 4.0, 6.0, 11.0, 13.0, 8.0, 13.0, 30.0, 39.0, 44.0, 43.0, 60.0, 61.0, 74.0, 75.0, 74.0, 58.0, 74.0, 65.0, 45.0, 49.0, 37.0, 38.0, 25.0, 22.0, 10.0, 7.0, 8.0, 5.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2398681640625, -0.23218345642089844, -0.22449874877929688, -0.2168140411376953, -0.20912933349609375, -0.2014446258544922, -0.19375991821289062, -0.18607521057128906, -0.1783905029296875, -0.17070579528808594, -0.16302108764648438, -0.1553363800048828, -0.14765167236328125, -0.1399669647216797, -0.13228225708007812, -0.12459754943847656, -0.116912841796875, -0.10922813415527344, -0.10154342651367188, -0.09385871887207031, -0.08617401123046875, -0.07848930358886719, -0.07080459594726562, -0.06311988830566406, -0.0554351806640625, -0.04775047302246094, -0.040065765380859375, -0.03238105773925781, -0.02469635009765625, -0.017011642456054688, -0.009326934814453125, -0.0016422271728515625, 0.00604248046875, 0.013727188110351562, 0.021411895751953125, 0.029096603393554688, 0.03678131103515625, 0.04446601867675781, 0.052150726318359375, 0.05983543395996094, 0.0675201416015625, 0.07520484924316406, 0.08288955688476562, 0.09057426452636719, 0.09825897216796875, 0.10594367980957031, 0.11362838745117188, 0.12131309509277344, 0.128997802734375, 0.13668251037597656, 0.14436721801757812, 0.1520519256591797, 0.15973663330078125, 0.1674213409423828, 0.17510604858398438, 0.18279075622558594, 0.1904754638671875, 0.19816017150878906, 0.20584487915039062, 0.2135295867919922, 0.22121429443359375, 0.2288990020751953, 0.23658370971679688, 0.24426841735839844, 0.251953125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 7.0, 15.0, 28.0, 38.0, 77.0, 187.0, 470.0, 1185.0, 3411.0, 23994.0, 4034642.0, 123343.0, 4695.0, 1259.0, 461.0, 238.0, 115.0, 53.0, 18.0, 21.0, 12.0, 3.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6123046875, -0.5884628295898438, -0.5646209716796875, -0.5407791137695312, -0.516937255859375, -0.49309539794921875, -0.4692535400390625, -0.44541168212890625, -0.42156982421875, -0.39772796630859375, -0.3738861083984375, -0.35004425048828125, -0.326202392578125, -0.30236053466796875, -0.2785186767578125, -0.25467681884765625, -0.2308349609375, -0.20699310302734375, -0.1831512451171875, -0.15930938720703125, -0.135467529296875, -0.11162567138671875, -0.0877838134765625, -0.06394195556640625, -0.04010009765625, -0.01625823974609375, 0.0075836181640625, 0.03142547607421875, 0.055267333984375, 0.07910919189453125, 0.1029510498046875, 0.12679290771484375, 0.150634765625, 0.17447662353515625, 0.1983184814453125, 0.22216033935546875, 0.246002197265625, 0.26984405517578125, 0.2936859130859375, 0.31752777099609375, 0.34136962890625, 0.36521148681640625, 0.3890533447265625, 0.41289520263671875, 0.436737060546875, 0.46057891845703125, 0.4844207763671875, 0.5082626342773438, 0.5321044921875, 0.5559463500976562, 0.5797882080078125, 0.6036300659179688, 0.627471923828125, 0.6513137817382812, 0.6751556396484375, 0.6989974975585938, 0.72283935546875, 0.7466812133789062, 0.7705230712890625, 0.7943649291992188, 0.818206787109375, 0.8420486450195312, 0.8658905029296875, 0.8897323608398438, 0.91357421875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 9.0, 6.0, 31.0, 48.0, 98.0, 359.0, 1109.0, 1496.0, 604.0, 163.0, 70.0, 33.0, 13.0, 11.0, 6.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7109375, -0.6901702880859375, -0.669403076171875, -0.6486358642578125, -0.62786865234375, -0.6071014404296875, -0.586334228515625, -0.5655670166015625, -0.5447998046875, -0.5240325927734375, -0.503265380859375, -0.4824981689453125, -0.46173095703125, -0.4409637451171875, -0.420196533203125, -0.3994293212890625, -0.378662109375, -0.3578948974609375, -0.337127685546875, -0.3163604736328125, -0.29559326171875, -0.2748260498046875, -0.254058837890625, -0.2332916259765625, -0.2125244140625, -0.1917572021484375, -0.170989990234375, -0.1502227783203125, -0.12945556640625, -0.1086883544921875, -0.087921142578125, -0.0671539306640625, -0.04638671875, -0.0256195068359375, -0.004852294921875, 0.0159149169921875, 0.03668212890625, 0.0574493408203125, 0.078216552734375, 0.0989837646484375, 0.1197509765625, 0.1405181884765625, 0.161285400390625, 0.1820526123046875, 0.20281982421875, 0.2235870361328125, 0.244354248046875, 0.2651214599609375, 0.285888671875, 0.3066558837890625, 0.327423095703125, 0.3481903076171875, 0.36895751953125, 0.3897247314453125, 0.410491943359375, 0.4312591552734375, 0.4520263671875, 0.4727935791015625, 0.493560791015625, 0.5143280029296875, 0.53509521484375, 0.5558624267578125, 0.576629638671875, 0.5973968505859375, 0.6181640625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 5.0, 1.0, 4.0, 9.0, 24.0, 122.0, 507.0, 268.0, 42.0, 6.0, 6.0, 3.0, 6.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.73887825012207, -8.506672859191895, -8.274467468261719, -8.042261123657227, -7.810055732727051, -7.577850341796875, -7.345644950866699, -7.113439083099365, -6.881233215332031, -6.6490278244018555, -6.4168219566345215, -6.184616565704346, -5.952410697937012, -5.720205307006836, -5.48799991607666, -5.255794048309326, -5.02358865737915, -4.791383266448975, -4.559177398681641, -4.326972007751465, -4.094766139984131, -3.862560749053955, -3.6303551197052, -3.3981494903564453, -3.1659438610076904, -2.9337382316589355, -2.7015326023101807, -2.469326972961426, -2.23712158203125, -2.004915714263916, -1.7727103233337402, -1.5405046939849854, -1.3082990646362305, -1.0760934352874756, -0.8438878655433655, -0.6116822957992554, -0.3794766664505005, -0.1472710371017456, 0.08493447303771973, 0.3171401023864746, 0.5493457317352295, 0.7815513610839844, 1.0137569904327393, 1.2459625005722046, 1.4781681299209595, 1.7103737592697144, 1.9425792694091797, 2.1747848987579346, 2.4069905281066895, 2.6391961574554443, 2.871401786804199, 3.103607177734375, 3.335813045501709, 3.5680184364318848, 3.8002240657806396, 4.0324296951293945, 4.26463508605957, 4.496840476989746, 4.72904634475708, 4.961251735687256, 5.19345760345459, 5.425662994384766, 5.657868385314941, 5.890074253082275, 6.122280120849609]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 14.0, 16.0, 30.0, 67.0, 79.0, 87.0, 136.0, 142.0, 124.0, 109.0, 88.0, 51.0, 31.0, 11.0, 8.0, 6.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.660445213317871, -3.5347414016723633, -3.4090375900268555, -3.2833337783813477, -3.1576297283172607, -3.031925916671753, -2.906222105026245, -2.7805182933807373, -2.6548142433166504, -2.5291104316711426, -2.4034066200256348, -2.277702808380127, -2.15199875831604, -2.0262949466705322, -1.9005911350250244, -1.7748873233795166, -1.6491835117340088, -1.523479700088501, -1.3977757692337036, -1.2720719575881958, -1.1463680267333984, -1.0206642150878906, -0.8949604034423828, -0.7692565321922302, -0.6435526609420776, -0.517848789691925, -0.39214494824409485, -0.26644110679626465, -0.14073723554611206, -0.015033364295959473, 0.11067044734954834, 0.23637431859970093, 0.3620781898498535, 0.4877820611000061, 0.6134859323501587, 0.7391897439956665, 0.8648936152458191, 0.9905974864959717, 1.1163012981414795, 1.2420051097869873, 1.3677090406417847, 1.4934128522872925, 1.6191167831420898, 1.7448205947875977, 1.8705244064331055, 1.9962283372879028, 2.121932029724121, 2.247636079788208, 2.373339891433716, 2.4990437030792236, 2.6247475147247314, 2.7504515647888184, 2.876155376434326, 3.001859188079834, 3.127562999725342, 3.2532668113708496, 3.3789706230163574, 3.5046744346618652, 3.630378246307373, 3.756082057952881, 3.8817861080169678, 4.007490158081055, 4.1331939697265625, 4.25889778137207, 4.384601593017578]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 6.0, 1.0, 6.0, 10.0, 11.0, 20.0, 19.0, 32.0, 55.0, 83.0, 142.0, 297.0, 604.0, 1427.0, 4283.0, 19119.0, 140198.0, 654690.0, 194959.0, 24338.0, 5226.0, 1649.0, 636.0, 301.0, 160.0, 96.0, 42.0, 50.0, 17.0, 20.0, 13.0, 8.0, 10.0, 8.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.43310546875, -0.4205780029296875, -0.408050537109375, -0.3955230712890625, -0.38299560546875, -0.3704681396484375, -0.357940673828125, -0.3454132080078125, -0.3328857421875, -0.3203582763671875, -0.307830810546875, -0.2953033447265625, -0.28277587890625, -0.2702484130859375, -0.257720947265625, -0.2451934814453125, -0.232666015625, -0.2201385498046875, -0.207611083984375, -0.1950836181640625, -0.18255615234375, -0.1700286865234375, -0.157501220703125, -0.1449737548828125, -0.1324462890625, -0.1199188232421875, -0.107391357421875, -0.0948638916015625, -0.08233642578125, -0.0698089599609375, -0.057281494140625, -0.0447540283203125, -0.0322265625, -0.0196990966796875, -0.007171630859375, 0.0053558349609375, 0.01788330078125, 0.0304107666015625, 0.042938232421875, 0.0554656982421875, 0.0679931640625, 0.0805206298828125, 0.093048095703125, 0.1055755615234375, 0.11810302734375, 0.1306304931640625, 0.143157958984375, 0.1556854248046875, 0.168212890625, 0.1807403564453125, 0.193267822265625, 0.2057952880859375, 0.21832275390625, 0.2308502197265625, 0.243377685546875, 0.2559051513671875, 0.2684326171875, 0.2809600830078125, 0.293487548828125, 0.3060150146484375, 0.31854248046875, 0.3310699462890625, 0.343597412109375, 0.3561248779296875, 0.36865234375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 12.0, 5.0, 10.0, 12.0, 18.0, 37.0, 25.0, 36.0, 43.0, 65.0, 63.0, 74.0, 80.0, 64.0, 70.0, 66.0, 75.0, 59.0, 32.0, 41.0, 30.0, 16.0, 21.0, 14.0, 15.0, 5.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.239013671875, -0.2313690185546875, -0.223724365234375, -0.2160797119140625, -0.20843505859375, -0.2007904052734375, -0.193145751953125, -0.1855010986328125, -0.1778564453125, -0.1702117919921875, -0.162567138671875, -0.1549224853515625, -0.14727783203125, -0.1396331787109375, -0.131988525390625, -0.1243438720703125, -0.11669921875, -0.1090545654296875, -0.101409912109375, -0.0937652587890625, -0.08612060546875, -0.0784759521484375, -0.070831298828125, -0.0631866455078125, -0.0555419921875, -0.0478973388671875, -0.040252685546875, -0.0326080322265625, -0.02496337890625, -0.0173187255859375, -0.009674072265625, -0.0020294189453125, 0.005615234375, 0.0132598876953125, 0.020904541015625, 0.0285491943359375, 0.03619384765625, 0.0438385009765625, 0.051483154296875, 0.0591278076171875, 0.0667724609375, 0.0744171142578125, 0.082061767578125, 0.0897064208984375, 0.09735107421875, 0.1049957275390625, 0.112640380859375, 0.1202850341796875, 0.1279296875, 0.1355743408203125, 0.143218994140625, 0.1508636474609375, 0.15850830078125, 0.1661529541015625, 0.173797607421875, 0.1814422607421875, 0.1890869140625, 0.1967315673828125, 0.204376220703125, 0.2120208740234375, 0.21966552734375, 0.2273101806640625, 0.234954833984375, 0.2425994873046875, 0.250244140625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 2.0, 5.0, 5.0, 7.0, 16.0, 20.0, 16.0, 33.0, 44.0, 34.0, 76.0, 87.0, 145.0, 208.0, 411.0, 783.0, 2085.0, 8423.0, 52166.0, 573892.0, 356924.0, 42392.0, 7123.0, 1879.0, 708.0, 344.0, 202.0, 150.0, 98.0, 66.0, 61.0, 31.0, 19.0, 20.0, 18.0, 17.0, 13.0, 6.0, 6.0, 6.0, 7.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.33544921875, -0.3230018615722656, -0.31055450439453125, -0.2981071472167969, -0.2856597900390625, -0.2732124328613281, -0.26076507568359375, -0.24831771850585938, -0.235870361328125, -0.22342300415039062, -0.21097564697265625, -0.19852828979492188, -0.1860809326171875, -0.17363357543945312, -0.16118621826171875, -0.14873886108398438, -0.13629150390625, -0.12384414672851562, -0.11139678955078125, -0.09894943237304688, -0.0865020751953125, -0.07405471801757812, -0.06160736083984375, -0.049160003662109375, -0.036712646484375, -0.024265289306640625, -0.01181793212890625, 0.000629425048828125, 0.0130767822265625, 0.025524139404296875, 0.03797149658203125, 0.050418853759765625, 0.0628662109375, 0.07531356811523438, 0.08776092529296875, 0.10020828247070312, 0.1126556396484375, 0.12510299682617188, 0.13755035400390625, 0.14999771118164062, 0.162445068359375, 0.17489242553710938, 0.18733978271484375, 0.19978713989257812, 0.2122344970703125, 0.22468185424804688, 0.23712921142578125, 0.24957656860351562, 0.26202392578125, 0.2744712829589844, 0.28691864013671875, 0.2993659973144531, 0.3118133544921875, 0.3242607116699219, 0.33670806884765625, 0.3491554260253906, 0.361602783203125, 0.3740501403808594, 0.38649749755859375, 0.3989448547363281, 0.4113922119140625, 0.4238395690917969, 0.43628692626953125, 0.4487342834472656, 0.461181640625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 0.0, 8.0, 6.0, 5.0, 9.0, 4.0, 7.0, 6.0, 18.0, 9.0, 14.0, 15.0, 14.0, 23.0, 36.0, 29.0, 32.0, 43.0, 38.0, 47.0, 51.0, 51.0, 49.0, 49.0, 34.0, 42.0, 35.0, 35.0, 40.0, 38.0, 29.0, 29.0, 18.0, 31.0, 19.0, 19.0, 11.0, 13.0, 10.0, 7.0, 8.0, 4.0, 9.0, 6.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.444091796875, -0.4276390075683594, -0.41118621826171875, -0.3947334289550781, -0.3782806396484375, -0.3618278503417969, -0.34537506103515625, -0.3289222717285156, -0.312469482421875, -0.2960166931152344, -0.27956390380859375, -0.2631111145019531, -0.2466583251953125, -0.23020553588867188, -0.21375274658203125, -0.19729995727539062, -0.18084716796875, -0.16439437866210938, -0.14794158935546875, -0.13148880004882812, -0.1150360107421875, -0.09858322143554688, -0.08213043212890625, -0.06567764282226562, -0.049224853515625, -0.032772064208984375, -0.01631927490234375, 0.000133514404296875, 0.0165863037109375, 0.033039093017578125, 0.04949188232421875, 0.06594467163085938, 0.0823974609375, 0.09885025024414062, 0.11530303955078125, 0.13175582885742188, 0.1482086181640625, 0.16466140747070312, 0.18111419677734375, 0.19756698608398438, 0.214019775390625, 0.23047256469726562, 0.24692535400390625, 0.2633781433105469, 0.2798309326171875, 0.2962837219238281, 0.31273651123046875, 0.3291893005371094, 0.34564208984375, 0.3620948791503906, 0.37854766845703125, 0.3950004577636719, 0.4114532470703125, 0.4279060363769531, 0.44435882568359375, 0.4608116149902344, 0.477264404296875, 0.4937171936035156, 0.5101699829101562, 0.5266227722167969, 0.5430755615234375, 0.5595283508300781, 0.5759811401367188, 0.5924339294433594, 0.60888671875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 6.0, 12.0, 15.0, 31.0, 44.0, 70.0, 143.0, 304.0, 997.0, 4611.0, 30459.0, 554426.0, 421533.0, 29786.0, 4446.0, 1005.0, 338.0, 143.0, 75.0, 36.0, 23.0, 13.0, 7.0, 8.0, 1.0, 5.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1944580078125, -0.18947124481201172, -0.18448448181152344, -0.17949771881103516, -0.17451095581054688, -0.1695241928100586, -0.1645374298095703, -0.15955066680908203, -0.15456390380859375, -0.14957714080810547, -0.1445903778076172, -0.1396036148071289, -0.13461685180664062, -0.12963008880615234, -0.12464332580566406, -0.11965656280517578, -0.1146697998046875, -0.10968303680419922, -0.10469627380371094, -0.09970951080322266, -0.09472274780273438, -0.0897359848022461, -0.08474922180175781, -0.07976245880126953, -0.07477569580078125, -0.06978893280029297, -0.06480216979980469, -0.059815406799316406, -0.054828643798828125, -0.049841880798339844, -0.04485511779785156, -0.03986835479736328, -0.034881591796875, -0.02989482879638672, -0.024908065795898438, -0.019921302795410156, -0.014934539794921875, -0.009947776794433594, -0.0049610137939453125, 2.574920654296875e-05, 0.00501251220703125, 0.009999275207519531, 0.014986038208007812, 0.019972801208496094, 0.024959564208984375, 0.029946327209472656, 0.03493309020996094, 0.03991985321044922, 0.0449066162109375, 0.04989337921142578, 0.05488014221191406, 0.059866905212402344, 0.06485366821289062, 0.0698404312133789, 0.07482719421386719, 0.07981395721435547, 0.08480072021484375, 0.08978748321533203, 0.09477424621582031, 0.0997610092163086, 0.10474777221679688, 0.10973453521728516, 0.11472129821777344, 0.11970806121826172, 0.12469482421875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 4.0, 6.0, 7.0, 2.0, 14.0, 17.0, 29.0, 50.0, 60.0, 91.0, 125.0, 137.0, 124.0, 124.0, 70.0, 52.0, 33.0, 25.0, 9.0, 12.0, 5.0, 1.0, 1.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.23464584350586e-05, -6.009731441736221e-05, -5.784817039966583e-05, -5.559902638196945e-05, -5.334988236427307e-05, -5.110073834657669e-05, -4.885159432888031e-05, -4.660245031118393e-05, -4.435330629348755e-05, -4.210416227579117e-05, -3.985501825809479e-05, -3.760587424039841e-05, -3.5356730222702026e-05, -3.3107586205005646e-05, -3.0858442187309265e-05, -2.8609298169612885e-05, -2.6360154151916504e-05, -2.4111010134220123e-05, -2.1861866116523743e-05, -1.9612722098827362e-05, -1.736357808113098e-05, -1.51144340634346e-05, -1.286529004573822e-05, -1.061614602804184e-05, -8.367002010345459e-06, -6.117857992649078e-06, -3.868713974952698e-06, -1.6195699572563171e-06, 6.295740604400635e-07, 2.878718078136444e-06, 5.127862095832825e-06, 7.377006113529205e-06, 9.626150131225586e-06, 1.1875294148921967e-05, 1.4124438166618347e-05, 1.6373582184314728e-05, 1.862272620201111e-05, 2.087187021970749e-05, 2.312101423740387e-05, 2.537015825510025e-05, 2.761930227279663e-05, 2.986844629049301e-05, 3.211759030818939e-05, 3.436673432588577e-05, 3.661587834358215e-05, 3.8865022361278534e-05, 4.1114166378974915e-05, 4.3363310396671295e-05, 4.5612454414367676e-05, 4.7861598432064056e-05, 5.011074244976044e-05, 5.235988646745682e-05, 5.46090304851532e-05, 5.685817450284958e-05, 5.910731852054596e-05, 6.135646253824234e-05, 6.360560655593872e-05, 6.58547505736351e-05, 6.810389459133148e-05, 7.035303860902786e-05, 7.260218262672424e-05, 7.485132664442062e-05, 7.7100470662117e-05, 7.934961467981339e-05, 8.159875869750977e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 9.0, 4.0, 15.0, 16.0, 20.0, 43.0, 80.0, 130.0, 264.0, 775.0, 2737.0, 14508.0, 140450.0, 792281.0, 84067.0, 10035.0, 2004.0, 582.0, 251.0, 104.0, 68.0, 43.0, 26.0, 12.0, 11.0, 7.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2022705078125, -0.19738483428955078, -0.19249916076660156, -0.18761348724365234, -0.18272781372070312, -0.1778421401977539, -0.1729564666748047, -0.16807079315185547, -0.16318511962890625, -0.15829944610595703, -0.1534137725830078, -0.1485280990600586, -0.14364242553710938, -0.13875675201416016, -0.13387107849121094, -0.12898540496826172, -0.1240997314453125, -0.11921405792236328, -0.11432838439941406, -0.10944271087646484, -0.10455703735351562, -0.0996713638305664, -0.09478569030761719, -0.08990001678466797, -0.08501434326171875, -0.08012866973876953, -0.07524299621582031, -0.0703573226928711, -0.06547164916992188, -0.060585975646972656, -0.05570030212402344, -0.05081462860107422, -0.045928955078125, -0.04104328155517578, -0.03615760803222656, -0.031271934509277344, -0.026386260986328125, -0.021500587463378906, -0.016614913940429688, -0.011729240417480469, -0.00684356689453125, -0.0019578933715820312, 0.0029277801513671875, 0.007813453674316406, 0.012699127197265625, 0.017584800720214844, 0.022470474243164062, 0.02735614776611328, 0.0322418212890625, 0.03712749481201172, 0.04201316833496094, 0.046898841857910156, 0.051784515380859375, 0.056670188903808594, 0.06155586242675781, 0.06644153594970703, 0.07132720947265625, 0.07621288299560547, 0.08109855651855469, 0.0859842300415039, 0.09086990356445312, 0.09575557708740234, 0.10064125061035156, 0.10552692413330078, 0.11041259765625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 1.0, 0.0, 8.0, 5.0, 3.0, 9.0, 14.0, 19.0, 27.0, 51.0, 56.0, 82.0, 84.0, 109.0, 133.0, 96.0, 91.0, 59.0, 32.0, 33.0, 36.0, 20.0, 11.0, 8.0, 11.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.134033203125, -0.12943267822265625, -0.1248321533203125, -0.12023162841796875, -0.115631103515625, -0.11103057861328125, -0.1064300537109375, -0.10182952880859375, -0.09722900390625, -0.09262847900390625, -0.0880279541015625, -0.08342742919921875, -0.078826904296875, -0.07422637939453125, -0.0696258544921875, -0.06502532958984375, -0.0604248046875, -0.05582427978515625, -0.0512237548828125, -0.04662322998046875, -0.042022705078125, -0.03742218017578125, -0.0328216552734375, -0.02822113037109375, -0.02362060546875, -0.01902008056640625, -0.0144195556640625, -0.00981903076171875, -0.005218505859375, -0.00061798095703125, 0.0039825439453125, 0.00858306884765625, 0.01318359375, 0.01778411865234375, 0.0223846435546875, 0.02698516845703125, 0.031585693359375, 0.03618621826171875, 0.0407867431640625, 0.04538726806640625, 0.04998779296875, 0.05458831787109375, 0.0591888427734375, 0.06378936767578125, 0.068389892578125, 0.07299041748046875, 0.0775909423828125, 0.08219146728515625, 0.0867919921875, 0.09139251708984375, 0.0959930419921875, 0.10059356689453125, 0.105194091796875, 0.10979461669921875, 0.1143951416015625, 0.11899566650390625, 0.12359619140625, 0.12819671630859375, 0.1327972412109375, 0.13739776611328125, 0.141998291015625, 0.14659881591796875, 0.1511993408203125, 0.15579986572265625, 0.160400390625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 11.0, 5.0, 14.0, 41.0, 119.0, 313.0, 374.0, 82.0, 26.0, 6.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.067654132843018, -6.907448768615723, -6.747243881225586, -6.587038516998291, -6.426833152770996, -6.266628265380859, -6.1064229011535645, -5.9462175369262695, -5.786012649536133, -5.625807285308838, -5.465602397918701, -5.305397033691406, -5.1451921463012695, -4.984986782073975, -4.82478141784668, -4.664576530456543, -4.504371166229248, -4.344165802001953, -4.183960914611816, -4.0237555503845215, -3.8635504245758057, -3.70334529876709, -3.543139934539795, -3.382934808731079, -3.2227296829223633, -3.0625245571136475, -2.9023194313049316, -2.7421140670776367, -2.581908941268921, -2.421703815460205, -2.26149845123291, -2.1012933254241943, -1.9410877227783203, -1.7808825969696045, -1.6206773519515991, -1.4604721069335938, -1.300266981124878, -1.140061855316162, -0.9798566102981567, -0.8196513652801514, -0.6594462394714355, -0.49924105405807495, -0.33903586864471436, -0.17883068323135376, -0.018625497817993164, 0.14157968759536743, 0.301784873008728, 0.4619901180267334, 0.6221952438354492, 0.7824004292488098, 0.9426056146621704, 1.1028108596801758, 1.2630159854888916, 1.4232211112976074, 1.5834263563156128, 1.7436316013336182, 1.903836727142334, 2.06404185295105, 2.2242469787597656, 2.3844523429870605, 2.5446574687957764, 2.704862594604492, 2.865067958831787, 3.025273084640503, 3.1854782104492188]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 6.0, 6.0, 7.0, 8.0, 11.0, 9.0, 7.0, 18.0, 24.0, 18.0, 12.0, 31.0, 28.0, 29.0, 35.0, 28.0, 35.0, 58.0, 62.0, 81.0, 78.0, 54.0, 42.0, 42.0, 24.0, 33.0, 27.0, 35.0, 26.0, 22.0, 16.0, 17.0, 12.0, 17.0, 10.0, 6.0, 7.0, 3.0, 6.0, 5.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9093279838562012, -1.8437790870666504, -1.7782301902770996, -1.7126811742782593, -1.6471322774887085, -1.5815833806991577, -1.5160343647003174, -1.4504854679107666, -1.3849365711212158, -1.319387674331665, -1.2538387775421143, -1.188289761543274, -1.1227408647537231, -1.0571919679641724, -0.9916430115699768, -0.9260940551757812, -0.8605451583862305, -0.7949962615966797, -0.7294473052024841, -0.6638983488082886, -0.5983494520187378, -0.532800555229187, -0.46725159883499146, -0.4017026722431183, -0.3361537456512451, -0.27060481905937195, -0.20505589246749878, -0.1395069658756256, -0.07395803928375244, -0.008409112691879272, 0.057139813899993896, 0.12268874049186707, 0.18823742866516113, 0.2537863552570343, 0.31933528184890747, 0.38488420844078064, 0.4504331350326538, 0.5159820318222046, 0.5815309882164001, 0.6470799446105957, 0.7126288414001465, 0.7781777381896973, 0.8437266945838928, 0.9092756509780884, 0.9748245477676392, 1.04037344455719, 1.1059224605560303, 1.171471357345581, 1.2370202541351318, 1.3025691509246826, 1.3681180477142334, 1.4336670637130737, 1.4992159605026245, 1.5647648572921753, 1.6303138732910156, 1.6958627700805664, 1.7614116668701172, 1.826960563659668, 1.8925094604492188, 1.958058476448059, 2.0236072540283203, 2.08915638923645, 2.154705286026001, 2.2202541828155518, 2.2858030796051025]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 6.0, 4.0, 6.0, 5.0, 10.0, 5.0, 12.0, 23.0, 35.0, 43.0, 70.0, 142.0, 250.0, 538.0, 1440.0, 4490.0, 19139.0, 192557.0, 2501049.0, 1368568.0, 89454.0, 11532.0, 3000.0, 1032.0, 395.0, 183.0, 110.0, 61.0, 33.0, 26.0, 18.0, 7.0, 11.0, 6.0, 7.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.24609375, -0.23836708068847656, -0.23064041137695312, -0.2229137420654297, -0.21518707275390625, -0.2074604034423828, -0.19973373413085938, -0.19200706481933594, -0.1842803955078125, -0.17655372619628906, -0.16882705688476562, -0.1611003875732422, -0.15337371826171875, -0.1456470489501953, -0.13792037963867188, -0.13019371032714844, -0.122467041015625, -0.11474037170410156, -0.10701370239257812, -0.09928703308105469, -0.09156036376953125, -0.08383369445800781, -0.07610702514648438, -0.06838035583496094, -0.0606536865234375, -0.05292701721191406, -0.045200347900390625, -0.03747367858886719, -0.02974700927734375, -0.022020339965820312, -0.014293670654296875, -0.0065670013427734375, 0.00115966796875, 0.008886337280273438, 0.016613006591796875, 0.024339675903320312, 0.03206634521484375, 0.03979301452636719, 0.047519683837890625, 0.05524635314941406, 0.0629730224609375, 0.07069969177246094, 0.07842636108398438, 0.08615303039550781, 0.09387969970703125, 0.10160636901855469, 0.10933303833007812, 0.11705970764160156, 0.124786376953125, 0.13251304626464844, 0.14023971557617188, 0.1479663848876953, 0.15569305419921875, 0.1634197235107422, 0.17114639282226562, 0.17887306213378906, 0.1865997314453125, 0.19432640075683594, 0.20205307006835938, 0.2097797393798828, 0.21750640869140625, 0.2252330780029297, 0.23295974731445312, 0.24068641662597656, 0.2484130859375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 2.0, 5.0, 7.0, 6.0, 13.0, 11.0, 18.0, 22.0, 32.0, 40.0, 45.0, 66.0, 55.0, 89.0, 70.0, 71.0, 68.0, 86.0, 64.0, 56.0, 29.0, 34.0, 42.0, 28.0, 13.0, 11.0, 10.0, 6.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2464599609375, -0.2388324737548828, -0.23120498657226562, -0.22357749938964844, -0.21595001220703125, -0.20832252502441406, -0.20069503784179688, -0.1930675506591797, -0.1854400634765625, -0.1778125762939453, -0.17018508911132812, -0.16255760192871094, -0.15493011474609375, -0.14730262756347656, -0.13967514038085938, -0.1320476531982422, -0.124420166015625, -0.11679267883300781, -0.10916519165039062, -0.10153770446777344, -0.09391021728515625, -0.08628273010253906, -0.07865524291992188, -0.07102775573730469, -0.0634002685546875, -0.05577278137207031, -0.048145294189453125, -0.04051780700683594, -0.03289031982421875, -0.025262832641601562, -0.017635345458984375, -0.010007858276367188, -0.00238037109375, 0.0052471160888671875, 0.012874603271484375, 0.020502090454101562, 0.02812957763671875, 0.03575706481933594, 0.043384552001953125, 0.05101203918457031, 0.0586395263671875, 0.06626701354980469, 0.07389450073242188, 0.08152198791503906, 0.08914947509765625, 0.09677696228027344, 0.10440444946289062, 0.11203193664550781, 0.119659423828125, 0.1272869110107422, 0.13491439819335938, 0.14254188537597656, 0.15016937255859375, 0.15779685974121094, 0.16542434692382812, 0.1730518341064453, 0.1806793212890625, 0.1883068084716797, 0.19593429565429688, 0.20356178283691406, 0.21118927001953125, 0.21881675720214844, 0.22644424438476562, 0.2340717315673828, 0.24169921875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 7.0, 3.0, 5.0, 7.0, 7.0, 14.0, 22.0, 35.0, 44.0, 63.0, 107.0, 195.0, 393.0, 851.0, 2787.0, 11995.0, 98028.0, 2926017.0, 1096862.0, 45979.0, 7392.0, 1981.0, 699.0, 344.0, 153.0, 89.0, 61.0, 42.0, 28.0, 20.0, 17.0, 7.0, 9.0, 4.0, 5.0, 4.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.2646484375, -0.2554740905761719, -0.24629974365234375, -0.23712539672851562, -0.2279510498046875, -0.21877670288085938, -0.20960235595703125, -0.20042800903320312, -0.191253662109375, -0.18207931518554688, -0.17290496826171875, -0.16373062133789062, -0.1545562744140625, -0.14538192749023438, -0.13620758056640625, -0.12703323364257812, -0.11785888671875, -0.10868453979492188, -0.09951019287109375, -0.09033584594726562, -0.0811614990234375, -0.07198715209960938, -0.06281280517578125, -0.053638458251953125, -0.044464111328125, -0.035289764404296875, -0.02611541748046875, -0.016941070556640625, -0.0077667236328125, 0.001407623291015625, 0.01058197021484375, 0.019756317138671875, 0.0289306640625, 0.038105010986328125, 0.04727935791015625, 0.056453704833984375, 0.0656280517578125, 0.07480239868164062, 0.08397674560546875, 0.09315109252929688, 0.102325439453125, 0.11149978637695312, 0.12067413330078125, 0.12984848022460938, 0.1390228271484375, 0.14819717407226562, 0.15737152099609375, 0.16654586791992188, 0.17572021484375, 0.18489456176757812, 0.19406890869140625, 0.20324325561523438, 0.2124176025390625, 0.22159194946289062, 0.23076629638671875, 0.23994064331054688, 0.249114990234375, 0.2582893371582031, 0.26746368408203125, 0.2766380310058594, 0.2858123779296875, 0.2949867248535156, 0.30416107177734375, 0.3133354187011719, 0.322509765625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 6.0, 9.0, 6.0, 10.0, 18.0, 17.0, 28.0, 40.0, 77.0, 105.0, 165.0, 293.0, 426.0, 620.0, 650.0, 567.0, 389.0, 226.0, 140.0, 89.0, 54.0, 27.0, 35.0, 19.0, 18.0, 9.0, 7.0, 9.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2393798828125, -0.2312297821044922, -0.22307968139648438, -0.21492958068847656, -0.20677947998046875, -0.19862937927246094, -0.19047927856445312, -0.1823291778564453, -0.1741790771484375, -0.1660289764404297, -0.15787887573242188, -0.14972877502441406, -0.14157867431640625, -0.13342857360839844, -0.12527847290039062, -0.11712837219238281, -0.108978271484375, -0.10082817077636719, -0.09267807006835938, -0.08452796936035156, -0.07637786865234375, -0.06822776794433594, -0.060077667236328125, -0.05192756652832031, -0.0437774658203125, -0.03562736511230469, -0.027477264404296875, -0.019327163696289062, -0.01117706298828125, -0.0030269622802734375, 0.005123138427734375, 0.013273239135742188, 0.02142333984375, 0.029573440551757812, 0.037723541259765625, 0.04587364196777344, 0.05402374267578125, 0.06217384338378906, 0.07032394409179688, 0.07847404479980469, 0.0866241455078125, 0.09477424621582031, 0.10292434692382812, 0.11107444763183594, 0.11922454833984375, 0.12737464904785156, 0.13552474975585938, 0.1436748504638672, 0.151824951171875, 0.1599750518798828, 0.16812515258789062, 0.17627525329589844, 0.18442535400390625, 0.19257545471191406, 0.20072555541992188, 0.2088756561279297, 0.2170257568359375, 0.2251758575439453, 0.23332595825195312, 0.24147605895996094, 0.24962615966796875, 0.25777626037597656, 0.2659263610839844, 0.2740764617919922, 0.2822265625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 7.0, 17.0, 18.0, 32.0, 66.0, 111.0, 146.0, 175.0, 161.0, 109.0, 83.0, 34.0, 18.0, 6.0, 8.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3326082229614258, -1.2683184146881104, -1.204028606414795, -1.1397387981414795, -1.075448989868164, -1.0111591815948486, -0.9468694925308228, -0.8825796842575073, -0.8182898759841919, -0.7540000677108765, -0.689710259437561, -0.6254205107688904, -0.561130702495575, -0.4968408942222595, -0.4325511157512665, -0.36826133728027344, -0.303971529006958, -0.23968173563480377, -0.17539194226264954, -0.1111021488904953, -0.046812355518341064, 0.017477452754974365, 0.08176723122596741, 0.14605700969696045, 0.21034681797027588, 0.2746366262435913, 0.33892640471458435, 0.4032161831855774, 0.4675059914588928, 0.5317957997322083, 0.5960855484008789, 0.6603753566741943, 0.7246651649475098, 0.7889549732208252, 0.8532447814941406, 0.9175345301628113, 0.9818243384361267, 1.046114206314087, 1.1104038953781128, 1.1746937036514282, 1.2389835119247437, 1.303273320198059, 1.3675631284713745, 1.43185293674469, 1.4961426258087158, 1.5604324340820312, 1.6247222423553467, 1.689012050628662, 1.7533018589019775, 1.817591667175293, 1.8818814754486084, 1.9461712837219238, 2.0104610919952393, 2.0747509002685547, 2.13904070854187, 2.2033305168151855, 2.267620086669922, 2.3319098949432373, 2.3961997032165527, 2.460489511489868, 2.5247793197631836, 2.589069128036499, 2.6533589363098145, 2.717648506164551, 2.7819385528564453]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 6.0, 2.0, 7.0, 6.0, 6.0, 13.0, 14.0, 20.0, 16.0, 23.0, 28.0, 30.0, 32.0, 49.0, 51.0, 47.0, 49.0, 66.0, 62.0, 60.0, 50.0, 60.0, 41.0, 37.0, 38.0, 43.0, 39.0, 28.0, 21.0, 17.0, 18.0, 13.0, 2.0, 5.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-1.6954822540283203, -1.6533327102661133, -1.6111831665039062, -1.5690336227416992, -1.5268839597702026, -1.4847344160079956, -1.4425848722457886, -1.4004353284835815, -1.358285665512085, -1.316136121749878, -1.273986577987671, -1.2318370342254639, -1.1896873712539673, -1.1475378274917603, -1.1053882837295532, -1.0632387399673462, -1.0210891962051392, -0.9789396524429321, -0.9367900490760803, -0.8946405053138733, -0.8524909019470215, -0.8103413581848145, -0.7681918144226074, -0.7260422706604004, -0.6838926672935486, -0.6417431235313416, -0.5995935201644897, -0.5574439764022827, -0.5152944326400757, -0.4731448292732239, -0.43099528551101685, -0.3888457119464874, -0.346696138381958, -0.3045465648174286, -0.26239699125289917, -0.22024744749069214, -0.17809787392616272, -0.1359483003616333, -0.09379875659942627, -0.05164918303489685, -0.009499609470367432, 0.03264995664358139, 0.07479952275753021, 0.11694908142089844, 0.15909865498542786, 0.20124822854995728, 0.2433977723121643, 0.2855473458766937, 0.32769691944122314, 0.36984649300575256, 0.411996066570282, 0.454145610332489, 0.49629518389701843, 0.5384447574615479, 0.5805943012237549, 0.6227438449859619, 0.6648934483528137, 0.7070429921150208, 0.7491925954818726, 0.7913421392440796, 0.8334916830062866, 0.8756412863731384, 0.9177908301353455, 0.9599404335021973, 1.0020899772644043]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 4.0, 8.0, 15.0, 23.0, 35.0, 42.0, 107.0, 151.0, 298.0, 597.0, 1639.0, 5855.0, 30378.0, 218258.0, 632949.0, 131852.0, 19857.0, 4093.0, 1249.0, 514.0, 276.0, 156.0, 70.0, 50.0, 28.0, 17.0, 9.0, 5.0, 4.0, 3.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.405517578125, -0.3946685791015625, -0.383819580078125, -0.3729705810546875, -0.36212158203125, -0.3512725830078125, -0.340423583984375, -0.3295745849609375, -0.3187255859375, -0.3078765869140625, -0.297027587890625, -0.2861785888671875, -0.27532958984375, -0.2644805908203125, -0.253631591796875, -0.2427825927734375, -0.23193359375, -0.2210845947265625, -0.210235595703125, -0.1993865966796875, -0.18853759765625, -0.1776885986328125, -0.166839599609375, -0.1559906005859375, -0.1451416015625, -0.1342926025390625, -0.123443603515625, -0.1125946044921875, -0.10174560546875, -0.0908966064453125, -0.080047607421875, -0.0691986083984375, -0.058349609375, -0.0475006103515625, -0.036651611328125, -0.0258026123046875, -0.01495361328125, -0.0041046142578125, 0.006744384765625, 0.0175933837890625, 0.0284423828125, 0.0392913818359375, 0.050140380859375, 0.0609893798828125, 0.07183837890625, 0.0826873779296875, 0.093536376953125, 0.1043853759765625, 0.115234375, 0.1260833740234375, 0.136932373046875, 0.1477813720703125, 0.15863037109375, 0.1694793701171875, 0.180328369140625, 0.1911773681640625, 0.2020263671875, 0.2128753662109375, 0.223724365234375, 0.2345733642578125, 0.24542236328125, 0.2562713623046875, 0.267120361328125, 0.2779693603515625, 0.288818359375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 3.0, 4.0, 3.0, 10.0, 16.0, 16.0, 24.0, 36.0, 41.0, 56.0, 51.0, 64.0, 74.0, 77.0, 84.0, 63.0, 73.0, 69.0, 53.0, 32.0, 37.0, 32.0, 28.0, 25.0, 13.0, 3.0, 5.0, 6.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2481689453125, -0.2405071258544922, -0.23284530639648438, -0.22518348693847656, -0.21752166748046875, -0.20985984802246094, -0.20219802856445312, -0.1945362091064453, -0.1868743896484375, -0.1792125701904297, -0.17155075073242188, -0.16388893127441406, -0.15622711181640625, -0.14856529235839844, -0.14090347290039062, -0.1332416534423828, -0.125579833984375, -0.11791801452636719, -0.11025619506835938, -0.10259437561035156, -0.09493255615234375, -0.08727073669433594, -0.07960891723632812, -0.07194709777832031, -0.0642852783203125, -0.05662345886230469, -0.048961639404296875, -0.04129981994628906, -0.03363800048828125, -0.025976181030273438, -0.018314361572265625, -0.010652542114257812, -0.00299072265625, 0.0046710968017578125, 0.012332916259765625, 0.019994735717773438, 0.02765655517578125, 0.03531837463378906, 0.042980194091796875, 0.05064201354980469, 0.0583038330078125, 0.06596565246582031, 0.07362747192382812, 0.08128929138183594, 0.08895111083984375, 0.09661293029785156, 0.10427474975585938, 0.11193656921386719, 0.119598388671875, 0.1272602081298828, 0.13492202758789062, 0.14258384704589844, 0.15024566650390625, 0.15790748596191406, 0.16556930541992188, 0.1732311248779297, 0.1808929443359375, 0.1885547637939453, 0.19621658325195312, 0.20387840270996094, 0.21154022216796875, 0.21920204162597656, 0.22686386108398438, 0.2345256805419922, 0.2421875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 5.0, 9.0, 13.0, 12.0, 27.0, 32.0, 40.0, 60.0, 73.0, 83.0, 139.0, 182.0, 260.0, 379.0, 664.0, 1171.0, 3018.0, 14622.0, 134781.0, 787043.0, 89598.0, 10775.0, 2605.0, 1056.0, 569.0, 407.0, 282.0, 166.0, 117.0, 82.0, 62.0, 68.0, 34.0, 27.0, 25.0, 17.0, 13.0, 9.0, 6.0, 3.0, 6.0, 2.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.415283203125, -0.40247344970703125, -0.3896636962890625, -0.37685394287109375, -0.364044189453125, -0.35123443603515625, -0.3384246826171875, -0.32561492919921875, -0.31280517578125, -0.29999542236328125, -0.2871856689453125, -0.27437591552734375, -0.261566162109375, -0.24875640869140625, -0.2359466552734375, -0.22313690185546875, -0.2103271484375, -0.19751739501953125, -0.1847076416015625, -0.17189788818359375, -0.159088134765625, -0.14627838134765625, -0.1334686279296875, -0.12065887451171875, -0.10784912109375, -0.09503936767578125, -0.0822296142578125, -0.06941986083984375, -0.056610107421875, -0.04380035400390625, -0.0309906005859375, -0.01818084716796875, -0.00537109375, 0.00743865966796875, 0.0202484130859375, 0.03305816650390625, 0.045867919921875, 0.05867767333984375, 0.0714874267578125, 0.08429718017578125, 0.09710693359375, 0.10991668701171875, 0.1227264404296875, 0.13553619384765625, 0.148345947265625, 0.16115570068359375, 0.1739654541015625, 0.18677520751953125, 0.1995849609375, 0.21239471435546875, 0.2252044677734375, 0.23801422119140625, 0.250823974609375, 0.26363372802734375, 0.2764434814453125, 0.28925323486328125, 0.30206298828125, 0.31487274169921875, 0.3276824951171875, 0.34049224853515625, 0.353302001953125, 0.36611175537109375, 0.3789215087890625, 0.39173126220703125, 0.404541015625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 4.0, 1.0, 3.0, 4.0, 15.0, 5.0, 12.0, 15.0, 15.0, 21.0, 41.0, 22.0, 39.0, 42.0, 57.0, 43.0, 58.0, 66.0, 67.0, 71.0, 63.0, 53.0, 41.0, 40.0, 36.0, 29.0, 35.0, 37.0, 16.0, 9.0, 7.0, 11.0, 6.0, 3.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.625, -0.6049728393554688, -0.5849456787109375, -0.5649185180664062, -0.544891357421875, -0.5248641967773438, -0.5048370361328125, -0.48480987548828125, -0.46478271484375, -0.44475555419921875, -0.4247283935546875, -0.40470123291015625, -0.384674072265625, -0.36464691162109375, -0.3446197509765625, -0.32459259033203125, -0.3045654296875, -0.28453826904296875, -0.2645111083984375, -0.24448394775390625, -0.224456787109375, -0.20442962646484375, -0.1844024658203125, -0.16437530517578125, -0.14434814453125, -0.12432098388671875, -0.1042938232421875, -0.08426666259765625, -0.064239501953125, -0.04421234130859375, -0.0241851806640625, -0.00415802001953125, 0.015869140625, 0.03589630126953125, 0.0559234619140625, 0.07595062255859375, 0.095977783203125, 0.11600494384765625, 0.1360321044921875, 0.15605926513671875, 0.17608642578125, 0.19611358642578125, 0.2161407470703125, 0.23616790771484375, 0.256195068359375, 0.27622222900390625, 0.2962493896484375, 0.31627655029296875, 0.3363037109375, 0.35633087158203125, 0.3763580322265625, 0.39638519287109375, 0.416412353515625, 0.43643951416015625, 0.4564666748046875, 0.47649383544921875, 0.49652099609375, 0.5165481567382812, 0.5365753173828125, 0.5566024780273438, 0.576629638671875, 0.5966567993164062, 0.6166839599609375, 0.6367111206054688, 0.65673828125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 6.0, 5.0, 16.0, 28.0, 44.0, 62.0, 163.0, 287.0, 821.0, 2963.0, 16922.0, 191790.0, 786343.0, 41169.0, 5681.0, 1324.0, 463.0, 207.0, 98.0, 62.0, 30.0, 15.0, 15.0, 8.0, 8.0, 2.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1942138671875, -0.18938350677490234, -0.1845531463623047, -0.17972278594970703, -0.17489242553710938, -0.17006206512451172, -0.16523170471191406, -0.1604013442993164, -0.15557098388671875, -0.1507406234741211, -0.14591026306152344, -0.14107990264892578, -0.13624954223632812, -0.13141918182373047, -0.1265888214111328, -0.12175846099853516, -0.1169281005859375, -0.11209774017333984, -0.10726737976074219, -0.10243701934814453, -0.09760665893554688, -0.09277629852294922, -0.08794593811035156, -0.0831155776977539, -0.07828521728515625, -0.0734548568725586, -0.06862449645996094, -0.06379413604736328, -0.058963775634765625, -0.05413341522216797, -0.04930305480957031, -0.044472694396972656, -0.039642333984375, -0.034811973571777344, -0.029981613159179688, -0.02515125274658203, -0.020320892333984375, -0.015490531921386719, -0.010660171508789062, -0.005829811096191406, -0.00099945068359375, 0.0038309097290039062, 0.008661270141601562, 0.013491630554199219, 0.018321990966796875, 0.02315235137939453, 0.027982711791992188, 0.032813072204589844, 0.0376434326171875, 0.042473793029785156, 0.04730415344238281, 0.05213451385498047, 0.056964874267578125, 0.06179523468017578, 0.06662559509277344, 0.0714559555053711, 0.07628631591796875, 0.0811166763305664, 0.08594703674316406, 0.09077739715576172, 0.09560775756835938, 0.10043811798095703, 0.10526847839355469, 0.11009883880615234, 0.11492919921875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 1.0, 2.0, 5.0, 1.0, 5.0, 4.0, 2.0, 14.0, 11.0, 13.0, 21.0, 23.0, 26.0, 61.0, 86.0, 95.0, 84.0, 115.0, 89.0, 68.0, 64.0, 48.0, 51.0, 23.0, 20.0, 19.0, 19.0, 7.0, 7.0, 8.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3882598876953125e-05, -5.235709249973297e-05, -5.083158612251282e-05, -4.9306079745292664e-05, -4.778057336807251e-05, -4.6255066990852356e-05, -4.47295606136322e-05, -4.320405423641205e-05, -4.1678547859191895e-05, -4.015304148197174e-05, -3.862753510475159e-05, -3.710202872753143e-05, -3.557652235031128e-05, -3.4051015973091125e-05, -3.252550959587097e-05, -3.100000321865082e-05, -2.9474496841430664e-05, -2.794899046421051e-05, -2.6423484086990356e-05, -2.4897977709770203e-05, -2.337247133255005e-05, -2.1846964955329895e-05, -2.032145857810974e-05, -1.8795952200889587e-05, -1.7270445823669434e-05, -1.574493944644928e-05, -1.4219433069229126e-05, -1.2693926692008972e-05, -1.1168420314788818e-05, -9.642913937568665e-06, -8.11740756034851e-06, -6.591901183128357e-06, -5.066394805908203e-06, -3.5408884286880493e-06, -2.0153820514678955e-06, -4.898756742477417e-07, 1.0356307029724121e-06, 2.561137080192566e-06, 4.08664345741272e-06, 5.6121498346328735e-06, 7.137656211853027e-06, 8.663162589073181e-06, 1.0188668966293335e-05, 1.1714175343513489e-05, 1.3239681720733643e-05, 1.4765188097953796e-05, 1.629069447517395e-05, 1.7816200852394104e-05, 1.9341707229614258e-05, 2.086721360683441e-05, 2.2392719984054565e-05, 2.391822636127472e-05, 2.5443732738494873e-05, 2.6969239115715027e-05, 2.849474549293518e-05, 3.0020251870155334e-05, 3.154575824737549e-05, 3.307126462459564e-05, 3.4596771001815796e-05, 3.612227737903595e-05, 3.7647783756256104e-05, 3.917329013347626e-05, 4.069879651069641e-05, 4.2224302887916565e-05, 4.374980926513672e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 11.0, 3.0, 3.0, 15.0, 9.0, 23.0, 24.0, 32.0, 43.0, 74.0, 105.0, 152.0, 214.0, 368.0, 639.0, 1365.0, 3134.0, 8486.0, 28872.0, 125412.0, 687716.0, 143615.0, 32135.0, 9405.0, 3405.0, 1445.0, 713.0, 379.0, 233.0, 155.0, 93.0, 70.0, 62.0, 38.0, 30.0, 22.0, 12.0, 11.0, 10.0, 10.0, 7.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0836181640625, -0.08096694946289062, -0.07831573486328125, -0.07566452026367188, -0.0730133056640625, -0.07036209106445312, -0.06771087646484375, -0.06505966186523438, -0.062408447265625, -0.059757232666015625, -0.05710601806640625, -0.054454803466796875, -0.0518035888671875, -0.049152374267578125, -0.04650115966796875, -0.043849945068359375, -0.04119873046875, -0.038547515869140625, -0.03589630126953125, -0.033245086669921875, -0.0305938720703125, -0.027942657470703125, -0.02529144287109375, -0.022640228271484375, -0.019989013671875, -0.017337799072265625, -0.01468658447265625, -0.012035369873046875, -0.0093841552734375, -0.006732940673828125, -0.00408172607421875, -0.001430511474609375, 0.001220703125, 0.003871917724609375, 0.00652313232421875, 0.009174346923828125, 0.0118255615234375, 0.014476776123046875, 0.01712799072265625, 0.019779205322265625, 0.022430419921875, 0.025081634521484375, 0.02773284912109375, 0.030384063720703125, 0.0330352783203125, 0.035686492919921875, 0.03833770751953125, 0.040988922119140625, 0.04364013671875, 0.046291351318359375, 0.04894256591796875, 0.051593780517578125, 0.0542449951171875, 0.056896209716796875, 0.05954742431640625, 0.062198638916015625, 0.064849853515625, 0.06750106811523438, 0.07015228271484375, 0.07280349731445312, 0.0754547119140625, 0.07810592651367188, 0.08075714111328125, 0.08340835571289062, 0.0860595703125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 8.0, 8.0, 11.0, 12.0, 19.0, 17.0, 21.0, 21.0, 43.0, 56.0, 77.0, 91.0, 100.0, 98.0, 98.0, 72.0, 49.0, 42.0, 40.0, 27.0, 25.0, 18.0, 8.0, 10.0, 3.0, 3.0, 8.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09320068359375, -0.09019088745117188, -0.08718109130859375, -0.08417129516601562, -0.0811614990234375, -0.07815170288085938, -0.07514190673828125, -0.07213211059570312, -0.069122314453125, -0.06611251831054688, -0.06310272216796875, -0.060092926025390625, -0.0570831298828125, -0.054073333740234375, -0.05106353759765625, -0.048053741455078125, -0.0450439453125, -0.042034149169921875, -0.03902435302734375, -0.036014556884765625, -0.0330047607421875, -0.029994964599609375, -0.02698516845703125, -0.023975372314453125, -0.020965576171875, -0.017955780029296875, -0.01494598388671875, -0.011936187744140625, -0.0089263916015625, -0.005916595458984375, -0.00290679931640625, 0.000102996826171875, 0.00311279296875, 0.006122589111328125, 0.00913238525390625, 0.012142181396484375, 0.0151519775390625, 0.018161773681640625, 0.02117156982421875, 0.024181365966796875, 0.027191162109375, 0.030200958251953125, 0.03321075439453125, 0.036220550537109375, 0.0392303466796875, 0.042240142822265625, 0.04524993896484375, 0.048259735107421875, 0.05126953125, 0.054279327392578125, 0.05728912353515625, 0.060298919677734375, 0.0633087158203125, 0.06631851196289062, 0.06932830810546875, 0.07233810424804688, 0.075347900390625, 0.07835769653320312, 0.08136749267578125, 0.08437728881835938, 0.0873870849609375, 0.09039688110351562, 0.09340667724609375, 0.09641647338867188, 0.09942626953125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 6.0, 12.0, 29.0, 133.0, 494.0, 239.0, 58.0, 15.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.761096477508545, -7.583735466003418, -7.406374931335449, -7.229013919830322, -7.051652908325195, -6.874292373657227, -6.6969313621521, -6.519570350646973, -6.342209815979004, -6.164848804473877, -5.987488269805908, -5.810127258300781, -5.6327667236328125, -5.4554057121276855, -5.278044700622559, -5.10068416595459, -4.923323154449463, -4.745962142944336, -4.568601608276367, -4.39124059677124, -4.213879585266113, -4.0365190505981445, -3.8591580390930176, -3.6817972660064697, -3.504436492919922, -3.327075719833374, -3.149714946746826, -2.972353935241699, -2.7949931621551514, -2.6176323890686035, -2.4402713775634766, -2.2629106044769287, -2.085550308227539, -1.9081895351409912, -1.7308286428451538, -1.5534677505493164, -1.3761069774627686, -1.1987462043762207, -1.0213853120803833, -0.8440244197845459, -0.666663646697998, -0.4893028140068054, -0.3119419813156128, -0.13458114862442017, 0.04277968406677246, 0.2201405167579651, 0.3975013494491577, 0.5748622417449951, 0.752223014831543, 0.9295838475227356, 1.1069446802139282, 1.2843055725097656, 1.4616663455963135, 1.6390271186828613, 1.8163880109786987, 1.9937489032745361, 2.171109676361084, 2.348470449447632, 2.5258312225341797, 2.7031922340393066, 2.8805530071258545, 3.0579137802124023, 3.2352747917175293, 3.412635564804077, 3.589996337890625]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 5.0, 3.0, 5.0, 5.0, 7.0, 3.0, 5.0, 5.0, 7.0, 10.0, 10.0, 14.0, 11.0, 18.0, 19.0, 13.0, 24.0, 31.0, 29.0, 32.0, 39.0, 52.0, 56.0, 99.0, 83.0, 72.0, 47.0, 34.0, 33.0, 29.0, 26.0, 24.0, 14.0, 23.0, 16.0, 16.0, 16.0, 12.0, 13.0, 9.0, 12.0, 6.0, 3.0, 3.0, 2.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6487575769424438, -1.5938482284545898, -1.5389389991760254, -1.4840296506881714, -1.4291203022003174, -1.374211072921753, -1.319301724433899, -1.264392375946045, -1.2094831466674805, -1.1545737981796265, -1.099664568901062, -1.044755220413208, -0.9898459315299988, -0.9349366426467896, -0.8800272941589355, -0.8251180052757263, -0.7702087163925171, -0.7152994275093079, -0.6603901386260986, -0.6054807901382446, -0.5505715012550354, -0.49566221237182617, -0.44075289368629456, -0.38584357500076294, -0.3309342861175537, -0.2760249972343445, -0.22111567854881287, -0.16620637476444244, -0.11129707098007202, -0.05638778209686279, -0.0014784634113311768, 0.05343085527420044, 0.10834002494812012, 0.16324932873249054, 0.21815863251686096, 0.2730679512023926, 0.3279772400856018, 0.38288652896881104, 0.43779584765434265, 0.49270516633987427, 0.5476144552230835, 0.6025237441062927, 0.657433032989502, 0.712342381477356, 0.7672516703605652, 0.8221609592437744, 0.8770703077316284, 0.9319795966148376, 0.9868888854980469, 1.0417982339859009, 1.0967074632644653, 1.1516168117523193, 1.2065260410308838, 1.2614353895187378, 1.3163447380065918, 1.3712539672851562, 1.4261633157730103, 1.4810726642608643, 1.5359818935394287, 1.5908912420272827, 1.6458005905151367, 1.7007098197937012, 1.7556191682815552, 1.8105285167694092, 1.8654377460479736]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 7.0, 2.0, 3.0, 10.0, 14.0, 14.0, 25.0, 39.0, 59.0, 104.0, 194.0, 464.0, 1032.0, 3548.0, 19709.0, 313356.0, 3271640.0, 550302.0, 26952.0, 4550.0, 1224.0, 463.0, 243.0, 122.0, 73.0, 35.0, 30.0, 26.0, 7.0, 13.0, 8.0, 6.0, 3.0, 8.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26123046875, -0.25140380859375, -0.2415771484375, -0.23175048828125, -0.221923828125, -0.21209716796875, -0.2022705078125, -0.19244384765625, -0.1826171875, -0.17279052734375, -0.1629638671875, -0.15313720703125, -0.143310546875, -0.13348388671875, -0.1236572265625, -0.11383056640625, -0.10400390625, -0.09417724609375, -0.0843505859375, -0.07452392578125, -0.064697265625, -0.05487060546875, -0.0450439453125, -0.03521728515625, -0.025390625, -0.01556396484375, -0.0057373046875, 0.00408935546875, 0.013916015625, 0.02374267578125, 0.0335693359375, 0.04339599609375, 0.05322265625, 0.06304931640625, 0.0728759765625, 0.08270263671875, 0.092529296875, 0.10235595703125, 0.1121826171875, 0.12200927734375, 0.1318359375, 0.14166259765625, 0.1514892578125, 0.16131591796875, 0.171142578125, 0.18096923828125, 0.1907958984375, 0.20062255859375, 0.21044921875, 0.22027587890625, 0.2301025390625, 0.23992919921875, 0.249755859375, 0.25958251953125, 0.2694091796875, 0.27923583984375, 0.2890625, 0.29888916015625, 0.3087158203125, 0.31854248046875, 0.328369140625, 0.33819580078125, 0.3480224609375, 0.35784912109375, 0.36767578125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 7.0, 5.0, 3.0, 7.0, 9.0, 14.0, 30.0, 30.0, 50.0, 62.0, 62.0, 66.0, 76.0, 89.0, 72.0, 61.0, 73.0, 81.0, 46.0, 42.0, 30.0, 29.0, 17.0, 19.0, 10.0, 8.0, 3.0, 4.0, 4.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.256591796875, -0.24883651733398438, -0.24108123779296875, -0.23332595825195312, -0.2255706787109375, -0.21781539916992188, -0.21006011962890625, -0.20230484008789062, -0.194549560546875, -0.18679428100585938, -0.17903900146484375, -0.17128372192382812, -0.1635284423828125, -0.15577316284179688, -0.14801788330078125, -0.14026260375976562, -0.13250732421875, -0.12475204467773438, -0.11699676513671875, -0.10924148559570312, -0.1014862060546875, -0.09373092651367188, -0.08597564697265625, -0.07822036743164062, -0.070465087890625, -0.06270980834960938, -0.05495452880859375, -0.047199249267578125, -0.0394439697265625, -0.031688690185546875, -0.02393341064453125, -0.016178131103515625, -0.0084228515625, -0.000667572021484375, 0.00708770751953125, 0.014842987060546875, 0.0225982666015625, 0.030353546142578125, 0.03810882568359375, 0.045864105224609375, 0.053619384765625, 0.061374664306640625, 0.06912994384765625, 0.07688522338867188, 0.0846405029296875, 0.09239578247070312, 0.10015106201171875, 0.10790634155273438, 0.11566162109375, 0.12341690063476562, 0.13117218017578125, 0.13892745971679688, 0.1466827392578125, 0.15443801879882812, 0.16219329833984375, 0.16994857788085938, 0.177703857421875, 0.18545913696289062, 0.19321441650390625, 0.20096969604492188, 0.2087249755859375, 0.21648025512695312, 0.22423553466796875, 0.23199081420898438, 0.23974609375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 11.0, 12.0, 10.0, 20.0, 18.0, 41.0, 66.0, 110.0, 235.0, 479.0, 1212.0, 4839.0, 40969.0, 2280726.0, 1823874.0, 35341.0, 4308.0, 1067.0, 439.0, 207.0, 101.0, 74.0, 35.0, 33.0, 19.0, 9.0, 4.0, 7.0, 2.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.330810546875, -0.3189849853515625, -0.307159423828125, -0.2953338623046875, -0.28350830078125, -0.2716827392578125, -0.259857177734375, -0.2480316162109375, -0.2362060546875, -0.2243804931640625, -0.212554931640625, -0.2007293701171875, -0.18890380859375, -0.1770782470703125, -0.165252685546875, -0.1534271240234375, -0.1416015625, -0.1297760009765625, -0.117950439453125, -0.1061248779296875, -0.09429931640625, -0.0824737548828125, -0.070648193359375, -0.0588226318359375, -0.0469970703125, -0.0351715087890625, -0.023345947265625, -0.0115203857421875, 0.00030517578125, 0.0121307373046875, 0.023956298828125, 0.0357818603515625, 0.047607421875, 0.0594329833984375, 0.071258544921875, 0.0830841064453125, 0.09490966796875, 0.1067352294921875, 0.118560791015625, 0.1303863525390625, 0.1422119140625, 0.1540374755859375, 0.165863037109375, 0.1776885986328125, 0.18951416015625, 0.2013397216796875, 0.213165283203125, 0.2249908447265625, 0.23681640625, 0.2486419677734375, 0.260467529296875, 0.2722930908203125, 0.28411865234375, 0.2959442138671875, 0.307769775390625, 0.3195953369140625, 0.3314208984375, 0.3432464599609375, 0.355072021484375, 0.3668975830078125, 0.37872314453125, 0.3905487060546875, 0.402374267578125, 0.4141998291015625, 0.426025390625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 4.0, 7.0, 4.0, 6.0, 18.0, 17.0, 25.0, 31.0, 42.0, 56.0, 72.0, 131.0, 239.0, 371.0, 460.0, 594.0, 543.0, 462.0, 342.0, 207.0, 150.0, 94.0, 54.0, 25.0, 29.0, 30.0, 22.0, 12.0, 4.0, 5.0, 3.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.238525390625, -0.23054885864257812, -0.22257232666015625, -0.21459579467773438, -0.2066192626953125, -0.19864273071289062, -0.19066619873046875, -0.18268966674804688, -0.174713134765625, -0.16673660278320312, -0.15876007080078125, -0.15078353881835938, -0.1428070068359375, -0.13483047485351562, -0.12685394287109375, -0.11887741088867188, -0.11090087890625, -0.10292434692382812, -0.09494781494140625, -0.08697128295898438, -0.0789947509765625, -0.07101821899414062, -0.06304168701171875, -0.055065155029296875, -0.047088623046875, -0.039112091064453125, -0.03113555908203125, -0.023159027099609375, -0.0151824951171875, -0.007205963134765625, 0.00077056884765625, 0.008747100830078125, 0.0167236328125, 0.024700164794921875, 0.03267669677734375, 0.040653228759765625, 0.0486297607421875, 0.056606292724609375, 0.06458282470703125, 0.07255935668945312, 0.080535888671875, 0.08851242065429688, 0.09648895263671875, 0.10446548461914062, 0.1124420166015625, 0.12041854858398438, 0.12839508056640625, 0.13637161254882812, 0.14434814453125, 0.15232467651367188, 0.16030120849609375, 0.16827774047851562, 0.1762542724609375, 0.18423080444335938, 0.19220733642578125, 0.20018386840820312, 0.208160400390625, 0.21613693237304688, 0.22411346435546875, 0.23208999633789062, 0.2400665283203125, 0.24804306030273438, 0.25601959228515625, 0.2639961242675781, 0.27197265625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 11.0, 12.0, 62.0, 142.0, 282.0, 255.0, 138.0, 63.0, 21.0, 7.0, 4.0, 5.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2180449962615967, -3.0988314151763916, -2.9796178340911865, -2.8604042530059814, -2.7411906719207764, -2.6219770908355713, -2.502763271331787, -2.383549690246582, -2.264336109161377, -2.145122528076172, -2.025908946990967, -1.9066953659057617, -1.7874817848205566, -1.6682682037353516, -1.549054503440857, -1.4298409223556519, -1.3106274604797363, -1.1914138793945312, -1.0722002983093262, -0.9529866576194763, -0.8337730765342712, -0.7145594954490662, -0.5953458547592163, -0.47613227367401123, -0.35691869258880615, -0.23770509660243988, -0.11849150061607361, 0.0007221102714538574, 0.11993569135665894, 0.239149272441864, 0.35836291313171387, 0.47757649421691895, 0.5967898368835449, 0.71600341796875, 0.8352169990539551, 0.9544306397438049, 1.0736441612243652, 1.1928577423095703, 1.312071442604065, 1.43128502368927, 1.550498604774475, 1.6697121858596802, 1.7889257669448853, 1.9081394672393799, 2.027353048324585, 2.14656662940979, 2.265780210494995, 2.3849937915802, 2.5042073726654053, 2.6234209537506104, 2.7426345348358154, 2.8618481159210205, 2.9810616970062256, 3.1002752780914307, 3.219489097595215, 3.33870267868042, 3.457916259765625, 3.57712984085083, 3.696343421936035, 3.8155570030212402, 3.9347705841064453, 4.05398416519165, 4.1731977462768555, 4.2924113273620605, 4.411624908447266]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 10.0, 10.0, 12.0, 8.0, 14.0, 19.0, 26.0, 21.0, 33.0, 44.0, 29.0, 46.0, 60.0, 54.0, 72.0, 73.0, 74.0, 63.0, 53.0, 36.0, 58.0, 27.0, 28.0, 26.0, 21.0, 17.0, 14.0, 12.0, 10.0, 9.0, 6.0, 2.0, 6.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.88785982131958, -1.8361716270446777, -1.784483551979065, -1.7327953577041626, -1.6811072826385498, -1.6294190883636475, -1.5777310132980347, -1.5260428190231323, -1.4743547439575195, -1.4226665496826172, -1.3709784746170044, -1.319290280342102, -1.2676022052764893, -1.215914011001587, -1.1642259359359741, -1.1125377416610718, -1.060849666595459, -1.0091614723205566, -0.9574733972549438, -0.9057852625846863, -0.8540971279144287, -0.8024089336395264, -0.7507208585739136, -0.6990326642990112, -0.6473444700241089, -0.5956563353538513, -0.5439682006835938, -0.4922800660133362, -0.4405919313430786, -0.38890376687049866, -0.3372156322002411, -0.2855274975299835, -0.23383939266204834, -0.18215125799179077, -0.1304631233215332, -0.07877497375011444, -0.027086839079856873, 0.02460131049156189, 0.07628944516181946, 0.12797757983207703, 0.1796657145023346, 0.23135384917259216, 0.28304198384284973, 0.3347301483154297, 0.38641828298568726, 0.4381064176559448, 0.4897945523262024, 0.54148268699646, 0.5931708216667175, 0.6448589563369751, 0.6965470910072327, 0.7482352256774902, 0.7999233603477478, 0.8516114950180054, 0.9032996892929077, 0.9549877643585205, 1.0066759586334229, 1.0583641529083252, 1.110052227973938, 1.1617404222488403, 1.2134284973144531, 1.2651166915893555, 1.3168047666549683, 1.3684929609298706, 1.4201810359954834]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 5.0, 4.0, 7.0, 24.0, 30.0, 32.0, 40.0, 92.0, 151.0, 241.0, 533.0, 1055.0, 2456.0, 6481.0, 22572.0, 115701.0, 600395.0, 242838.0, 39423.0, 10201.0, 3381.0, 1394.0, 684.0, 345.0, 181.0, 103.0, 76.0, 41.0, 26.0, 17.0, 8.0, 8.0, 4.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.41552734375, -0.4042015075683594, -0.39287567138671875, -0.3815498352050781, -0.3702239990234375, -0.3588981628417969, -0.34757232666015625, -0.3362464904785156, -0.324920654296875, -0.3135948181152344, -0.30226898193359375, -0.2909431457519531, -0.2796173095703125, -0.2682914733886719, -0.25696563720703125, -0.24563980102539062, -0.23431396484375, -0.22298812866210938, -0.21166229248046875, -0.20033645629882812, -0.1890106201171875, -0.17768478393554688, -0.16635894775390625, -0.15503311157226562, -0.143707275390625, -0.13238143920898438, -0.12105560302734375, -0.10972976684570312, -0.0984039306640625, -0.08707809448242188, -0.07575225830078125, -0.06442642211914062, -0.0531005859375, -0.041774749755859375, -0.03044891357421875, -0.019123077392578125, -0.0077972412109375, 0.003528594970703125, 0.01485443115234375, 0.026180267333984375, 0.037506103515625, 0.048831939697265625, 0.06015777587890625, 0.07148361206054688, 0.0828094482421875, 0.09413528442382812, 0.10546112060546875, 0.11678695678710938, 0.12811279296875, 0.13943862915039062, 0.15076446533203125, 0.16209030151367188, 0.1734161376953125, 0.18474197387695312, 0.19606781005859375, 0.20739364624023438, 0.218719482421875, 0.23004531860351562, 0.24137115478515625, 0.2526969909667969, 0.2640228271484375, 0.2753486633300781, 0.28667449951171875, 0.2980003356933594, 0.309326171875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 2.0, 6.0, 11.0, 12.0, 16.0, 29.0, 36.0, 53.0, 54.0, 77.0, 66.0, 80.0, 64.0, 80.0, 83.0, 73.0, 59.0, 54.0, 31.0, 42.0, 18.0, 8.0, 15.0, 10.0, 10.0, 4.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.255859375, -0.248046875, -0.240234375, -0.232421875, -0.224609375, -0.216796875, -0.208984375, -0.201171875, -0.193359375, -0.185546875, -0.177734375, -0.169921875, -0.162109375, -0.154296875, -0.146484375, -0.138671875, -0.130859375, -0.123046875, -0.115234375, -0.107421875, -0.099609375, -0.091796875, -0.083984375, -0.076171875, -0.068359375, -0.060546875, -0.052734375, -0.044921875, -0.037109375, -0.029296875, -0.021484375, -0.013671875, -0.005859375, 0.001953125, 0.009765625, 0.017578125, 0.025390625, 0.033203125, 0.041015625, 0.048828125, 0.056640625, 0.064453125, 0.072265625, 0.080078125, 0.087890625, 0.095703125, 0.103515625, 0.111328125, 0.119140625, 0.126953125, 0.134765625, 0.142578125, 0.150390625, 0.158203125, 0.166015625, 0.173828125, 0.181640625, 0.189453125, 0.197265625, 0.205078125, 0.212890625, 0.220703125, 0.228515625, 0.236328125, 0.244140625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 6.0, 13.0, 14.0, 14.0, 28.0, 39.0, 62.0, 79.0, 117.0, 191.0, 256.0, 452.0, 768.0, 1545.0, 4550.0, 50053.0, 928984.0, 53125.0, 4647.0, 1550.0, 750.0, 474.0, 266.0, 179.0, 123.0, 73.0, 62.0, 40.0, 30.0, 20.0, 10.0, 13.0, 6.0, 5.0, 3.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7041015625, -0.6842727661132812, -0.6644439697265625, -0.6446151733398438, -0.624786376953125, -0.6049575805664062, -0.5851287841796875, -0.5652999877929688, -0.54547119140625, -0.5256423950195312, -0.5058135986328125, -0.48598480224609375, -0.466156005859375, -0.44632720947265625, -0.4264984130859375, -0.40666961669921875, -0.3868408203125, -0.36701202392578125, -0.3471832275390625, -0.32735443115234375, -0.307525634765625, -0.28769683837890625, -0.2678680419921875, -0.24803924560546875, -0.22821044921875, -0.20838165283203125, -0.1885528564453125, -0.16872406005859375, -0.148895263671875, -0.12906646728515625, -0.1092376708984375, -0.08940887451171875, -0.069580078125, -0.04975128173828125, -0.0299224853515625, -0.01009368896484375, 0.009735107421875, 0.02956390380859375, 0.0493927001953125, 0.06922149658203125, 0.08905029296875, 0.10887908935546875, 0.1287078857421875, 0.14853668212890625, 0.168365478515625, 0.18819427490234375, 0.2080230712890625, 0.22785186767578125, 0.2476806640625, 0.26750946044921875, 0.2873382568359375, 0.30716705322265625, 0.326995849609375, 0.34682464599609375, 0.3666534423828125, 0.38648223876953125, 0.40631103515625, 0.42613983154296875, 0.4459686279296875, 0.46579742431640625, 0.485626220703125, 0.5054550170898438, 0.5252838134765625, 0.5451126098632812, 0.56494140625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 5.0, 3.0, 4.0, 6.0, 8.0, 12.0, 14.0, 14.0, 33.0, 32.0, 38.0, 46.0, 52.0, 57.0, 51.0, 71.0, 82.0, 70.0, 77.0, 52.0, 60.0, 35.0, 37.0, 35.0, 23.0, 22.0, 17.0, 13.0, 8.0, 8.0, 10.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58544921875, -0.5635757446289062, -0.5417022705078125, -0.5198287963867188, -0.497955322265625, -0.47608184814453125, -0.4542083740234375, -0.43233489990234375, -0.41046142578125, -0.38858795166015625, -0.3667144775390625, -0.34484100341796875, -0.322967529296875, -0.30109405517578125, -0.2792205810546875, -0.25734710693359375, -0.2354736328125, -0.21360015869140625, -0.1917266845703125, -0.16985321044921875, -0.147979736328125, -0.12610626220703125, -0.1042327880859375, -0.08235931396484375, -0.06048583984375, -0.03861236572265625, -0.0167388916015625, 0.00513458251953125, 0.027008056640625, 0.04888153076171875, 0.0707550048828125, 0.09262847900390625, 0.114501953125, 0.13637542724609375, 0.1582489013671875, 0.18012237548828125, 0.201995849609375, 0.22386932373046875, 0.2457427978515625, 0.26761627197265625, 0.28948974609375, 0.31136322021484375, 0.3332366943359375, 0.35511016845703125, 0.376983642578125, 0.39885711669921875, 0.4207305908203125, 0.44260406494140625, 0.4644775390625, 0.48635101318359375, 0.5082244873046875, 0.5300979614257812, 0.551971435546875, 0.5738449096679688, 0.5957183837890625, 0.6175918579101562, 0.63946533203125, 0.6613388061523438, 0.6832122802734375, 0.7050857543945312, 0.726959228515625, 0.7488327026367188, 0.7707061767578125, 0.7925796508789062, 0.814453125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 0.0, 3.0, 2.0, 2.0, 1.0, 5.0, 4.0, 1.0, 0.0, 5.0, 5.0, 2.0, 4.0, 12.0, 8.0, 6.0, 7.0, 19.0, 22.0, 26.0, 36.0, 66.0, 106.0, 156.0, 277.0, 630.0, 1945.0, 10421.0, 323096.0, 696171.0, 11843.0, 2168.0, 750.0, 301.0, 155.0, 80.0, 60.0, 52.0, 28.0, 19.0, 17.0, 7.0, 10.0, 7.0, 3.0, 5.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.2138671875, -0.20718955993652344, -0.20051193237304688, -0.1938343048095703, -0.18715667724609375, -0.1804790496826172, -0.17380142211914062, -0.16712379455566406, -0.1604461669921875, -0.15376853942871094, -0.14709091186523438, -0.1404132843017578, -0.13373565673828125, -0.1270580291748047, -0.12038040161132812, -0.11370277404785156, -0.107025146484375, -0.10034751892089844, -0.09366989135742188, -0.08699226379394531, -0.08031463623046875, -0.07363700866699219, -0.06695938110351562, -0.06028175354003906, -0.0536041259765625, -0.04692649841308594, -0.040248870849609375, -0.03357124328613281, -0.02689361572265625, -0.020215988159179688, -0.013538360595703125, -0.0068607330322265625, -0.00018310546875, 0.0064945220947265625, 0.013172149658203125, 0.019849777221679688, 0.02652740478515625, 0.03320503234863281, 0.039882659912109375, 0.04656028747558594, 0.0532379150390625, 0.05991554260253906, 0.06659317016601562, 0.07327079772949219, 0.07994842529296875, 0.08662605285644531, 0.09330368041992188, 0.09998130798339844, 0.106658935546875, 0.11333656311035156, 0.12001419067382812, 0.1266918182373047, 0.13336944580078125, 0.1400470733642578, 0.14672470092773438, 0.15340232849121094, 0.1600799560546875, 0.16675758361816406, 0.17343521118164062, 0.1801128387451172, 0.18679046630859375, 0.1934680938720703, 0.20014572143554688, 0.20682334899902344, 0.2135009765625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 3.0, 13.0, 4.0, 7.0, 10.0, 9.0, 13.0, 19.0, 28.0, 28.0, 41.0, 70.0, 97.0, 121.0, 126.0, 101.0, 84.0, 60.0, 36.0, 22.0, 25.0, 14.0, 10.0, 14.0, 10.0, 7.0, 7.0, 7.0, 2.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-8.70823860168457e-05, -8.492451161146164e-05, -8.276663720607758e-05, -8.060876280069351e-05, -7.845088839530945e-05, -7.629301398992538e-05, -7.413513958454132e-05, -7.197726517915726e-05, -6.98193907737732e-05, -6.766151636838913e-05, -6.550364196300507e-05, -6.3345767557621e-05, -6.118789315223694e-05, -5.9030018746852875e-05, -5.687214434146881e-05, -5.471426993608475e-05, -5.2556395530700684e-05, -5.039852112531662e-05, -4.8240646719932556e-05, -4.608277231454849e-05, -4.392489790916443e-05, -4.1767023503780365e-05, -3.96091490983963e-05, -3.745127469301224e-05, -3.5293400287628174e-05, -3.313552588224411e-05, -3.0977651476860046e-05, -2.8819777071475983e-05, -2.666190266609192e-05, -2.4504028260707855e-05, -2.234615385532379e-05, -2.0188279449939728e-05, -1.8030405044555664e-05, -1.58725306391716e-05, -1.3714656233787537e-05, -1.1556781828403473e-05, -9.39890742301941e-06, -7.2410330176353455e-06, -5.083158612251282e-06, -2.925284206867218e-06, -7.674098014831543e-07, 1.3904646039009094e-06, 3.548339009284973e-06, 5.706213414669037e-06, 7.8640878200531e-06, 1.0021962225437164e-05, 1.2179836630821228e-05, 1.4337711036205292e-05, 1.6495585441589355e-05, 1.865345984697342e-05, 2.0811334252357483e-05, 2.2969208657741547e-05, 2.512708306312561e-05, 2.7284957468509674e-05, 2.9442831873893738e-05, 3.16007062792778e-05, 3.3758580684661865e-05, 3.591645509004593e-05, 3.807432949542999e-05, 4.0232203900814056e-05, 4.239007830619812e-05, 4.4547952711582184e-05, 4.670582711696625e-05, 4.886370152235031e-05, 5.1021575927734375e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 3.0, 6.0, 7.0, 5.0, 8.0, 13.0, 26.0, 28.0, 32.0, 53.0, 69.0, 107.0, 212.0, 333.0, 766.0, 1861.0, 6638.0, 44071.0, 859691.0, 118687.0, 11114.0, 2738.0, 1017.0, 472.0, 211.0, 121.0, 75.0, 51.0, 19.0, 22.0, 13.0, 17.0, 15.0, 13.0, 16.0, 5.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1497802734375, -0.14533233642578125, -0.1408843994140625, -0.13643646240234375, -0.131988525390625, -0.12754058837890625, -0.1230926513671875, -0.11864471435546875, -0.11419677734375, -0.10974884033203125, -0.1053009033203125, -0.10085296630859375, -0.096405029296875, -0.09195709228515625, -0.0875091552734375, -0.08306121826171875, -0.07861328125, -0.07416534423828125, -0.0697174072265625, -0.06526947021484375, -0.060821533203125, -0.05637359619140625, -0.0519256591796875, -0.04747772216796875, -0.04302978515625, -0.03858184814453125, -0.0341339111328125, -0.02968597412109375, -0.025238037109375, -0.02079010009765625, -0.0163421630859375, -0.01189422607421875, -0.0074462890625, -0.00299835205078125, 0.0014495849609375, 0.00589752197265625, 0.010345458984375, 0.01479339599609375, 0.0192413330078125, 0.02368927001953125, 0.02813720703125, 0.03258514404296875, 0.0370330810546875, 0.04148101806640625, 0.045928955078125, 0.05037689208984375, 0.0548248291015625, 0.05927276611328125, 0.063720703125, 0.06816864013671875, 0.0726165771484375, 0.07706451416015625, 0.081512451171875, 0.08596038818359375, 0.0904083251953125, 0.09485626220703125, 0.09930419921875, 0.10375213623046875, 0.1082000732421875, 0.11264801025390625, 0.117095947265625, 0.12154388427734375, 0.1259918212890625, 0.13043975830078125, 0.1348876953125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 6.0, 12.0, 17.0, 16.0, 27.0, 46.0, 58.0, 95.0, 131.0, 163.0, 116.0, 91.0, 77.0, 34.0, 32.0, 19.0, 7.0, 8.0, 4.0, 7.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.152099609375, -0.14802932739257812, -0.14395904541015625, -0.13988876342773438, -0.1358184814453125, -0.13174819946289062, -0.12767791748046875, -0.12360763549804688, -0.119537353515625, -0.11546707153320312, -0.11139678955078125, -0.10732650756835938, -0.1032562255859375, -0.09918594360351562, -0.09511566162109375, -0.09104537963867188, -0.08697509765625, -0.08290481567382812, -0.07883453369140625, -0.07476425170898438, -0.0706939697265625, -0.06662368774414062, -0.06255340576171875, -0.058483123779296875, -0.054412841796875, -0.050342559814453125, -0.04627227783203125, -0.042201995849609375, -0.0381317138671875, -0.034061431884765625, -0.02999114990234375, -0.025920867919921875, -0.0218505859375, -0.017780303955078125, -0.01371002197265625, -0.009639739990234375, -0.0055694580078125, -0.001499176025390625, 0.00257110595703125, 0.006641387939453125, 0.010711669921875, 0.014781951904296875, 0.01885223388671875, 0.022922515869140625, 0.0269927978515625, 0.031063079833984375, 0.03513336181640625, 0.039203643798828125, 0.04327392578125, 0.047344207763671875, 0.05141448974609375, 0.055484771728515625, 0.0595550537109375, 0.06362533569335938, 0.06769561767578125, 0.07176589965820312, 0.075836181640625, 0.07990646362304688, 0.08397674560546875, 0.08804702758789062, 0.0921173095703125, 0.09618759155273438, 0.10025787353515625, 0.10432815551757812, 0.1083984375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 8.0, 38.0, 269.0, 605.0, 54.0, 11.0, 4.0, 6.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.463346481323242, -11.2151460647583, -10.96694564819336, -10.718745231628418, -10.470544815063477, -10.222344398498535, -9.974143981933594, -9.725943565368652, -9.477743148803711, -9.22954273223877, -8.981342315673828, -8.733141899108887, -8.484941482543945, -8.236741065979004, -7.9885406494140625, -7.740340232849121, -7.49213981628418, -7.243939399719238, -6.995738983154297, -6.7475385665893555, -6.499338150024414, -6.251137733459473, -6.002937316894531, -5.75473690032959, -5.50653600692749, -5.258335590362549, -5.010135173797607, -4.761934757232666, -4.513734340667725, -4.265533924102783, -4.017333507537842, -3.7691330909729004, -3.520932674407959, -3.2727322578430176, -3.024531841278076, -2.7763314247131348, -2.5281310081481934, -2.279930591583252, -2.0317301750183105, -1.7835296392440796, -1.5353292226791382, -1.2871288061141968, -1.0389283895492554, -0.7907279133796692, -0.5425274968147278, -0.2943270206451416, -0.046126604080200195, 0.2020738124847412, 0.4502742290496826, 0.698474645614624, 0.9466750621795654, 1.1948754787445068, 1.4430758953094482, 1.6912764310836792, 1.9394768476486206, 2.1876773834228516, 2.435877799987793, 2.6840782165527344, 2.932278633117676, 3.180479049682617, 3.4286794662475586, 3.6768798828125, 3.9250802993774414, 4.173280715942383, 4.421481132507324]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 1.0, 4.0, 6.0, 4.0, 7.0, 10.0, 13.0, 7.0, 14.0, 13.0, 20.0, 22.0, 26.0, 28.0, 36.0, 51.0, 41.0, 90.0, 183.0, 104.0, 44.0, 45.0, 38.0, 30.0, 32.0, 28.0, 25.0, 15.0, 10.0, 18.0, 7.0, 10.0, 9.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0799918174743652, -2.0016672611236572, -1.9233425855636597, -1.845017910003662, -1.766693353652954, -1.688368797302246, -1.6100441217422485, -1.531719446182251, -1.453394889831543, -1.375070333480835, -1.2967456579208374, -1.2184209823608398, -1.1400964260101318, -1.0617718696594238, -0.9834471940994263, -0.9051225781440735, -0.8267979621887207, -0.7484733462333679, -0.6701487302780151, -0.5918241143226624, -0.5134994983673096, -0.4351748824119568, -0.356850266456604, -0.2785256505012512, -0.20020103454589844, -0.12187641859054565, -0.04355180263519287, 0.03477281332015991, 0.1130974292755127, 0.19142204523086548, 0.26974666118621826, 0.34807127714157104, 0.4263956546783447, 0.5047202706336975, 0.5830448865890503, 0.6613695025444031, 0.7396941184997559, 0.8180187344551086, 0.8963433504104614, 0.9746679663658142, 1.052992582321167, 1.131317138671875, 1.2096418142318726, 1.2879664897918701, 1.3662910461425781, 1.4446156024932861, 1.5229402780532837, 1.6012649536132812, 1.6795895099639893, 1.7579140663146973, 1.8362387418746948, 1.9145634174346924, 1.9928879737854004, 2.0712125301361084, 2.1495370864868164, 2.2278618812561035, 2.3061864376068115, 2.3845109939575195, 2.4628357887268066, 2.5411603450775146, 2.6194849014282227, 2.6978094577789307, 2.7761340141296387, 2.854458808898926, 2.932783365249634]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 4.0, 12.0, 11.0, 32.0, 30.0, 49.0, 86.0, 173.0, 290.0, 606.0, 1249.0, 3444.0, 12647.0, 87590.0, 1131623.0, 2569648.0, 346927.0, 29322.0, 6534.0, 2161.0, 895.0, 385.0, 215.0, 128.0, 69.0, 40.0, 30.0, 29.0, 13.0, 7.0, 3.0, 7.0, 8.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.269775390625, -0.25988006591796875, -0.2499847412109375, -0.24008941650390625, -0.230194091796875, -0.22029876708984375, -0.2104034423828125, -0.20050811767578125, -0.19061279296875, -0.18071746826171875, -0.1708221435546875, -0.16092681884765625, -0.151031494140625, -0.14113616943359375, -0.1312408447265625, -0.12134552001953125, -0.1114501953125, -0.10155487060546875, -0.0916595458984375, -0.08176422119140625, -0.071868896484375, -0.06197357177734375, -0.0520782470703125, -0.04218292236328125, -0.03228759765625, -0.02239227294921875, -0.0124969482421875, -0.00260162353515625, 0.007293701171875, 0.01718902587890625, 0.0270843505859375, 0.03697967529296875, 0.046875, 0.05677032470703125, 0.0666656494140625, 0.07656097412109375, 0.086456298828125, 0.09635162353515625, 0.1062469482421875, 0.11614227294921875, 0.12603759765625, 0.13593292236328125, 0.1458282470703125, 0.15572357177734375, 0.165618896484375, 0.17551422119140625, 0.1854095458984375, 0.19530487060546875, 0.2052001953125, 0.21509552001953125, 0.2249908447265625, 0.23488616943359375, 0.244781494140625, 0.25467681884765625, 0.2645721435546875, 0.27446746826171875, 0.28436279296875, 0.29425811767578125, 0.3041534423828125, 0.31404876708984375, 0.323944091796875, 0.33383941650390625, 0.3437347412109375, 0.35363006591796875, 0.363525390625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 5.0, 9.0, 9.0, 15.0, 20.0, 31.0, 37.0, 52.0, 59.0, 74.0, 70.0, 70.0, 82.0, 88.0, 84.0, 72.0, 55.0, 38.0, 43.0, 22.0, 18.0, 9.0, 11.0, 12.0, 5.0, 2.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2568359375, -0.24914169311523438, -0.24144744873046875, -0.23375320434570312, -0.2260589599609375, -0.21836471557617188, -0.21067047119140625, -0.20297622680664062, -0.195281982421875, -0.18758773803710938, -0.17989349365234375, -0.17219924926757812, -0.1645050048828125, -0.15681076049804688, -0.14911651611328125, -0.14142227172851562, -0.13372802734375, -0.12603378295898438, -0.11833953857421875, -0.11064529418945312, -0.1029510498046875, -0.09525680541992188, -0.08756256103515625, -0.07986831665039062, -0.072174072265625, -0.06447982788085938, -0.05678558349609375, -0.049091339111328125, -0.0413970947265625, -0.033702850341796875, -0.02600860595703125, -0.018314361572265625, -0.0106201171875, -0.002925872802734375, 0.00476837158203125, 0.012462615966796875, 0.0201568603515625, 0.027851104736328125, 0.03554534912109375, 0.043239593505859375, 0.050933837890625, 0.058628082275390625, 0.06632232666015625, 0.07401657104492188, 0.0817108154296875, 0.08940505981445312, 0.09709930419921875, 0.10479354858398438, 0.11248779296875, 0.12018203735351562, 0.12787628173828125, 0.13557052612304688, 0.1432647705078125, 0.15095901489257812, 0.15865325927734375, 0.16634750366210938, 0.174041748046875, 0.18173599243164062, 0.18943023681640625, 0.19712448120117188, 0.2048187255859375, 0.21251296997070312, 0.22020721435546875, 0.22790145874023438, 0.235595703125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 6.0, 0.0, 4.0, 5.0, 10.0, 7.0, 13.0, 29.0, 40.0, 53.0, 85.0, 150.0, 337.0, 796.0, 2110.0, 12138.0, 3662971.0, 503794.0, 8334.0, 1941.0, 703.0, 342.0, 162.0, 97.0, 52.0, 39.0, 22.0, 15.0, 13.0, 3.0, 7.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0703125, -1.0367279052734375, -1.003143310546875, -0.9695587158203125, -0.93597412109375, -0.9023895263671875, -0.868804931640625, -0.8352203369140625, -0.8016357421875, -0.7680511474609375, -0.734466552734375, -0.7008819580078125, -0.66729736328125, -0.6337127685546875, -0.600128173828125, -0.5665435791015625, -0.532958984375, -0.4993743896484375, -0.465789794921875, -0.4322052001953125, -0.39862060546875, -0.3650360107421875, -0.331451416015625, -0.2978668212890625, -0.2642822265625, -0.2306976318359375, -0.197113037109375, -0.1635284423828125, -0.12994384765625, -0.0963592529296875, -0.062774658203125, -0.0291900634765625, 0.00439453125, 0.0379791259765625, 0.071563720703125, 0.1051483154296875, 0.13873291015625, 0.1723175048828125, 0.205902099609375, 0.2394866943359375, 0.2730712890625, 0.3066558837890625, 0.340240478515625, 0.3738250732421875, 0.40740966796875, 0.4409942626953125, 0.474578857421875, 0.5081634521484375, 0.541748046875, 0.5753326416015625, 0.608917236328125, 0.6425018310546875, 0.67608642578125, 0.7096710205078125, 0.743255615234375, 0.7768402099609375, 0.8104248046875, 0.8440093994140625, 0.877593994140625, 0.9111785888671875, 0.94476318359375, 0.9783477783203125, 1.011932373046875, 1.0455169677734375, 1.0791015625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 6.0, 3.0, 5.0, 12.0, 31.0, 68.0, 107.0, 193.0, 379.0, 755.0, 919.0, 674.0, 400.0, 198.0, 118.0, 70.0, 39.0, 30.0, 20.0, 18.0, 6.0, 5.0, 5.0, 5.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60693359375, -0.5830078125, -0.55908203125, -0.53515625, -0.51123046875, -0.4873046875, -0.46337890625, -0.439453125, -0.41552734375, -0.3916015625, -0.36767578125, -0.34375, -0.31982421875, -0.2958984375, -0.27197265625, -0.248046875, -0.22412109375, -0.2001953125, -0.17626953125, -0.15234375, -0.12841796875, -0.1044921875, -0.08056640625, -0.056640625, -0.03271484375, -0.0087890625, 0.01513671875, 0.0390625, 0.06298828125, 0.0869140625, 0.11083984375, 0.134765625, 0.15869140625, 0.1826171875, 0.20654296875, 0.23046875, 0.25439453125, 0.2783203125, 0.30224609375, 0.326171875, 0.35009765625, 0.3740234375, 0.39794921875, 0.421875, 0.44580078125, 0.4697265625, 0.49365234375, 0.517578125, 0.54150390625, 0.5654296875, 0.58935546875, 0.61328125, 0.63720703125, 0.6611328125, 0.68505859375, 0.708984375, 0.73291015625, 0.7568359375, 0.78076171875, 0.8046875, 0.82861328125, 0.8525390625, 0.87646484375, 0.900390625, 0.92431640625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 9.0, 19.0, 41.0, 184.0, 400.0, 207.0, 71.0, 27.0, 14.0, 9.0, 5.0, 3.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.7272138595581055, -3.363909959793091, -3.000606060028076, -2.6373021602630615, -2.273998260498047, -1.9106943607330322, -1.5473904609680176, -1.184086561203003, -0.8207826614379883, -0.45747876167297363, -0.09417486190795898, 0.26912903785705566, 0.6324329376220703, 0.995736837387085, 1.3590407371520996, 1.7223446369171143, 2.085648536682129, 2.4489524364471436, 2.812256336212158, 3.175560235977173, 3.5388641357421875, 3.902168035507202, 4.265471935272217, 4.628775596618652, 4.992079734802246, 5.35538387298584, 5.718687534332275, 6.081991195678711, 6.445295333862305, 6.808599472045898, 7.171903133392334, 7.5352067947387695, 7.898509979248047, 8.26181411743164, 8.625118255615234, 8.988421440124512, 9.351725578308105, 9.7150297164917, 10.078332901000977, 10.44163703918457, 10.804941177368164, 11.168245315551758, 11.531549453735352, 11.894852638244629, 12.258156776428223, 12.621460914611816, 12.984764099121094, 13.348068237304688, 13.711372375488281, 14.074676513671875, 14.437980651855469, 14.801283836364746, 15.16458797454834, 15.527892112731934, 15.891195297241211, 16.254499435424805, 16.6178035736084, 16.981107711791992, 17.344411849975586, 17.70771598815918, 18.07101821899414, 18.434322357177734, 18.797626495361328, 19.160930633544922, 19.524234771728516]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 8.0, 1.0, 2.0, 7.0, 6.0, 12.0, 10.0, 14.0, 24.0, 42.0, 40.0, 41.0, 62.0, 53.0, 85.0, 85.0, 89.0, 100.0, 71.0, 49.0, 48.0, 39.0, 32.0, 18.0, 12.0, 16.0, 15.0, 8.0, 5.0, 8.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.228280067443848, -4.069037437438965, -3.909795045852661, -3.7505526542663574, -3.5913100242614746, -3.432067394256592, -3.272825002670288, -3.1135826110839844, -2.9543399810791016, -2.7950973510742188, -2.635854959487915, -2.4766125679016113, -2.3173699378967285, -2.1581273078918457, -1.998884916305542, -1.8396424055099487, -1.6803998947143555, -1.5211573839187622, -1.361914873123169, -1.2026723623275757, -1.0434298515319824, -0.8841873407363892, -0.7249448299407959, -0.5657023191452026, -0.4064598083496094, -0.2472172975540161, -0.08797478675842285, 0.07126772403717041, 0.23051023483276367, 0.38975274562835693, 0.5489952564239502, 0.7082377672195435, 0.8674802780151367, 1.02672278881073, 1.1859652996063232, 1.3452078104019165, 1.5044503211975098, 1.663692831993103, 1.8229353427886963, 1.9821778535842896, 2.141420364379883, 2.3006629943847656, 2.4599053859710693, 2.619147777557373, 2.778390407562256, 2.9376330375671387, 3.0968754291534424, 3.256117820739746, 3.415360450744629, 3.5746030807495117, 3.7338454723358154, 3.893087863922119, 4.052330493927002, 4.211573123931885, 4.370815277099609, 4.530057907104492, 4.689300537109375, 4.848543167114258, 5.007785797119141, 5.167027950286865, 5.326270580291748, 5.485513210296631, 5.6447553634643555, 5.803997993469238, 5.963240623474121]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 4.0, 5.0, 5.0, 7.0, 16.0, 24.0, 52.0, 71.0, 91.0, 181.0, 292.0, 603.0, 1397.0, 3445.0, 9769.0, 38503.0, 286642.0, 623168.0, 62477.0, 13858.0, 4615.0, 1715.0, 731.0, 375.0, 176.0, 109.0, 87.0, 40.0, 25.0, 22.0, 12.0, 9.0, 4.0, 12.0, 4.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3310546875, -0.3207550048828125, -0.310455322265625, -0.3001556396484375, -0.28985595703125, -0.2795562744140625, -0.269256591796875, -0.2589569091796875, -0.2486572265625, -0.2383575439453125, -0.228057861328125, -0.2177581787109375, -0.20745849609375, -0.1971588134765625, -0.186859130859375, -0.1765594482421875, -0.166259765625, -0.1559600830078125, -0.145660400390625, -0.1353607177734375, -0.12506103515625, -0.1147613525390625, -0.104461669921875, -0.0941619873046875, -0.0838623046875, -0.0735626220703125, -0.063262939453125, -0.0529632568359375, -0.04266357421875, -0.0323638916015625, -0.022064208984375, -0.0117645263671875, -0.00146484375, 0.0088348388671875, 0.019134521484375, 0.0294342041015625, 0.03973388671875, 0.0500335693359375, 0.060333251953125, 0.0706329345703125, 0.0809326171875, 0.0912322998046875, 0.101531982421875, 0.1118316650390625, 0.12213134765625, 0.1324310302734375, 0.142730712890625, 0.1530303955078125, 0.163330078125, 0.1736297607421875, 0.183929443359375, 0.1942291259765625, 0.20452880859375, 0.2148284912109375, 0.225128173828125, 0.2354278564453125, 0.2457275390625, 0.2560272216796875, 0.266326904296875, 0.2766265869140625, 0.28692626953125, 0.2972259521484375, 0.307525634765625, 0.3178253173828125, 0.328125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 6.0, 9.0, 13.0, 24.0, 32.0, 35.0, 57.0, 63.0, 82.0, 76.0, 92.0, 87.0, 83.0, 68.0, 71.0, 45.0, 52.0, 43.0, 20.0, 12.0, 7.0, 8.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25146484375, -0.24055862426757812, -0.22965240478515625, -0.21874618530273438, -0.2078399658203125, -0.19693374633789062, -0.18602752685546875, -0.17512130737304688, -0.164215087890625, -0.15330886840820312, -0.14240264892578125, -0.13149642944335938, -0.1205902099609375, -0.10968399047851562, -0.09877777099609375, -0.08787155151367188, -0.07696533203125, -0.06605911254882812, -0.05515289306640625, -0.044246673583984375, -0.0333404541015625, -0.022434234619140625, -0.01152801513671875, -0.000621795654296875, 0.010284423828125, 0.021190643310546875, 0.03209686279296875, 0.043003082275390625, 0.0539093017578125, 0.06481552124023438, 0.07572174072265625, 0.08662796020507812, 0.0975341796875, 0.10844039916992188, 0.11934661865234375, 0.13025283813476562, 0.1411590576171875, 0.15206527709960938, 0.16297149658203125, 0.17387771606445312, 0.184783935546875, 0.19569015502929688, 0.20659637451171875, 0.21750259399414062, 0.2284088134765625, 0.23931503295898438, 0.25022125244140625, 0.2611274719238281, 0.27203369140625, 0.2829399108886719, 0.29384613037109375, 0.3047523498535156, 0.3156585693359375, 0.3265647888183594, 0.33747100830078125, 0.3483772277832031, 0.359283447265625, 0.3701896667480469, 0.38109588623046875, 0.3920021057128906, 0.4029083251953125, 0.4138145446777344, 0.42472076416015625, 0.4356269836425781, 0.446533203125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 5.0, 4.0, 8.0, 5.0, 9.0, 21.0, 30.0, 40.0, 59.0, 66.0, 112.0, 158.0, 324.0, 586.0, 1390.0, 5097.0, 48773.0, 943722.0, 40878.0, 4572.0, 1323.0, 521.0, 326.0, 174.0, 117.0, 67.0, 54.0, 45.0, 19.0, 10.0, 10.0, 9.0, 7.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.428955078125, -0.4153251647949219, -0.40169525146484375, -0.3880653381347656, -0.3744354248046875, -0.3608055114746094, -0.34717559814453125, -0.3335456848144531, -0.319915771484375, -0.3062858581542969, -0.29265594482421875, -0.2790260314941406, -0.2653961181640625, -0.2517662048339844, -0.23813629150390625, -0.22450637817382812, -0.21087646484375, -0.19724655151367188, -0.18361663818359375, -0.16998672485351562, -0.1563568115234375, -0.14272689819335938, -0.12909698486328125, -0.11546707153320312, -0.101837158203125, -0.08820724487304688, -0.07457733154296875, -0.060947418212890625, -0.0473175048828125, -0.033687591552734375, -0.02005767822265625, -0.006427764892578125, 0.0072021484375, 0.020832061767578125, 0.03446197509765625, 0.048091888427734375, 0.0617218017578125, 0.07535171508789062, 0.08898162841796875, 0.10261154174804688, 0.116241455078125, 0.12987136840820312, 0.14350128173828125, 0.15713119506835938, 0.1707611083984375, 0.18439102172851562, 0.19802093505859375, 0.21165084838867188, 0.22528076171875, 0.23891067504882812, 0.25254058837890625, 0.2661705017089844, 0.2798004150390625, 0.2934303283691406, 0.30706024169921875, 0.3206901550292969, 0.334320068359375, 0.3479499816894531, 0.36157989501953125, 0.3752098083496094, 0.3888397216796875, 0.4024696350097656, 0.41609954833984375, 0.4297294616699219, 0.443359375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 8.0, 6.0, 7.0, 4.0, 8.0, 5.0, 10.0, 10.0, 2.0, 18.0, 16.0, 24.0, 30.0, 39.0, 42.0, 56.0, 52.0, 76.0, 67.0, 83.0, 57.0, 65.0, 47.0, 42.0, 39.0, 27.0, 22.0, 16.0, 16.0, 19.0, 17.0, 9.0, 13.0, 9.0, 6.0, 3.0, 6.0, 4.0, 3.0, 6.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.72265625, -0.7010116577148438, -0.6793670654296875, -0.6577224731445312, -0.636077880859375, -0.6144332885742188, -0.5927886962890625, -0.5711441040039062, -0.54949951171875, -0.5278549194335938, -0.5062103271484375, -0.48456573486328125, -0.462921142578125, -0.44127655029296875, -0.4196319580078125, -0.39798736572265625, -0.3763427734375, -0.35469818115234375, -0.3330535888671875, -0.31140899658203125, -0.289764404296875, -0.26811981201171875, -0.2464752197265625, -0.22483062744140625, -0.20318603515625, -0.18154144287109375, -0.1598968505859375, -0.13825225830078125, -0.116607666015625, -0.09496307373046875, -0.0733184814453125, -0.05167388916015625, -0.030029296875, -0.00838470458984375, 0.0132598876953125, 0.03490447998046875, 0.056549072265625, 0.07819366455078125, 0.0998382568359375, 0.12148284912109375, 0.14312744140625, 0.16477203369140625, 0.1864166259765625, 0.20806121826171875, 0.229705810546875, 0.25135040283203125, 0.2729949951171875, 0.29463958740234375, 0.3162841796875, 0.33792877197265625, 0.3595733642578125, 0.38121795654296875, 0.402862548828125, 0.42450714111328125, 0.4461517333984375, 0.46779632568359375, 0.48944091796875, 0.5110855102539062, 0.5327301025390625, 0.5543746948242188, 0.576019287109375, 0.5976638793945312, 0.6193084716796875, 0.6409530639648438, 0.66259765625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 7.0, 5.0, 11.0, 10.0, 15.0, 28.0, 18.0, 30.0, 51.0, 79.0, 104.0, 168.0, 248.0, 429.0, 872.0, 1800.0, 4956.0, 19461.0, 212000.0, 773846.0, 24317.0, 5807.0, 2042.0, 966.0, 479.0, 240.0, 159.0, 120.0, 78.0, 46.0, 52.0, 29.0, 23.0, 13.0, 10.0, 10.0, 7.0, 7.0, 4.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.05438232421875, -0.05257368087768555, -0.050765037536621094, -0.04895639419555664, -0.04714775085449219, -0.045339107513427734, -0.04353046417236328, -0.04172182083129883, -0.039913177490234375, -0.03810453414916992, -0.03629589080810547, -0.034487247467041016, -0.03267860412597656, -0.03086996078491211, -0.029061317443847656, -0.027252674102783203, -0.02544403076171875, -0.023635387420654297, -0.021826744079589844, -0.02001810073852539, -0.018209457397460938, -0.016400814056396484, -0.014592170715332031, -0.012783527374267578, -0.010974884033203125, -0.009166240692138672, -0.007357597351074219, -0.005548954010009766, -0.0037403106689453125, -0.0019316673278808594, -0.00012302398681640625, 0.0016856193542480469, 0.0034942626953125, 0.005302906036376953, 0.007111549377441406, 0.00892019271850586, 0.010728836059570312, 0.012537479400634766, 0.014346122741699219, 0.016154766082763672, 0.017963409423828125, 0.019772052764892578, 0.02158069610595703, 0.023389339447021484, 0.025197982788085938, 0.02700662612915039, 0.028815269470214844, 0.030623912811279297, 0.03243255615234375, 0.0342411994934082, 0.036049842834472656, 0.03785848617553711, 0.03966712951660156, 0.041475772857666016, 0.04328441619873047, 0.04509305953979492, 0.046901702880859375, 0.04871034622192383, 0.05051898956298828, 0.052327632904052734, 0.05413627624511719, 0.05594491958618164, 0.057753562927246094, 0.05956220626831055, 0.061370849609375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 4.0, 5.0, 5.0, 4.0, 7.0, 3.0, 10.0, 16.0, 24.0, 26.0, 51.0, 49.0, 57.0, 80.0, 84.0, 93.0, 92.0, 86.0, 67.0, 56.0, 33.0, 35.0, 28.0, 13.0, 16.0, 16.0, 6.0, 9.0, 7.0, 2.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.4809112548828125e-05, -3.34596261382103e-05, -3.211013972759247e-05, -3.076065331697464e-05, -2.941116690635681e-05, -2.8061680495738983e-05, -2.6712194085121155e-05, -2.5362707674503326e-05, -2.4013221263885498e-05, -2.266373485326767e-05, -2.131424844264984e-05, -1.9964762032032013e-05, -1.8615275621414185e-05, -1.7265789210796356e-05, -1.5916302800178528e-05, -1.45668163895607e-05, -1.3217329978942871e-05, -1.1867843568325043e-05, -1.0518357157707214e-05, -9.168870747089386e-06, -7.819384336471558e-06, -6.469897925853729e-06, -5.120411515235901e-06, -3.7709251046180725e-06, -2.421438694000244e-06, -1.0719522833824158e-06, 2.775341272354126e-07, 1.627020537853241e-06, 2.9765069484710693e-06, 4.325993359088898e-06, 5.675479769706726e-06, 7.0249661803245544e-06, 8.374452590942383e-06, 9.723939001560211e-06, 1.107342541217804e-05, 1.2422911822795868e-05, 1.3772398233413696e-05, 1.5121884644031525e-05, 1.6471371054649353e-05, 1.782085746526718e-05, 1.917034387588501e-05, 2.0519830286502838e-05, 2.1869316697120667e-05, 2.3218803107738495e-05, 2.4568289518356323e-05, 2.591777592897415e-05, 2.726726233959198e-05, 2.861674875020981e-05, 2.9966235160827637e-05, 3.1315721571445465e-05, 3.2665207982063293e-05, 3.401469439268112e-05, 3.536418080329895e-05, 3.671366721391678e-05, 3.806315362453461e-05, 3.9412640035152435e-05, 4.0762126445770264e-05, 4.211161285638809e-05, 4.346109926700592e-05, 4.481058567762375e-05, 4.616007208824158e-05, 4.7509558498859406e-05, 4.8859044909477234e-05, 5.020853132009506e-05, 5.155801773071289e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 5.0, 4.0, 1.0, 7.0, 5.0, 7.0, 12.0, 13.0, 19.0, 24.0, 29.0, 39.0, 58.0, 79.0, 141.0, 153.0, 274.0, 447.0, 740.0, 1268.0, 2408.0, 4994.0, 10902.0, 28721.0, 120816.0, 773195.0, 67366.0, 20038.0, 8184.0, 3890.0, 1934.0, 1082.0, 601.0, 353.0, 240.0, 163.0, 96.0, 73.0, 48.0, 33.0, 28.0, 13.0, 16.0, 11.0, 18.0, 5.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.0308990478515625, -0.029880285263061523, -0.028861522674560547, -0.02784276008605957, -0.026823997497558594, -0.025805234909057617, -0.02478647232055664, -0.023767709732055664, -0.022748947143554688, -0.02173018455505371, -0.020711421966552734, -0.019692659378051758, -0.01867389678955078, -0.017655134201049805, -0.016636371612548828, -0.015617609024047852, -0.014598846435546875, -0.013580083847045898, -0.012561321258544922, -0.011542558670043945, -0.010523796081542969, -0.009505033493041992, -0.008486270904541016, -0.007467508316040039, -0.0064487457275390625, -0.005429983139038086, -0.004411220550537109, -0.003392457962036133, -0.0023736953735351562, -0.0013549327850341797, -0.0003361701965332031, 0.0006825923919677734, 0.00170135498046875, 0.0027201175689697266, 0.003738880157470703, 0.00475764274597168, 0.005776405334472656, 0.006795167922973633, 0.00781393051147461, 0.008832693099975586, 0.009851455688476562, 0.010870218276977539, 0.011888980865478516, 0.012907743453979492, 0.013926506042480469, 0.014945268630981445, 0.015964031219482422, 0.0169827938079834, 0.018001556396484375, 0.01902031898498535, 0.020039081573486328, 0.021057844161987305, 0.02207660675048828, 0.023095369338989258, 0.024114131927490234, 0.02513289451599121, 0.026151657104492188, 0.027170419692993164, 0.02818918228149414, 0.029207944869995117, 0.030226707458496094, 0.03124547004699707, 0.03226423263549805, 0.03328299522399902, 0.0343017578125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 1.0, 3.0, 3.0, 5.0, 10.0, 10.0, 9.0, 14.0, 12.0, 28.0, 32.0, 43.0, 79.0, 133.0, 171.0, 136.0, 96.0, 60.0, 46.0, 27.0, 11.0, 14.0, 13.0, 7.0, 8.0, 5.0, 8.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0638427734375, -0.06182575225830078, -0.05980873107910156, -0.057791709899902344, -0.055774688720703125, -0.053757667541503906, -0.05174064636230469, -0.04972362518310547, -0.04770660400390625, -0.04568958282470703, -0.04367256164550781, -0.041655540466308594, -0.039638519287109375, -0.037621498107910156, -0.03560447692871094, -0.03358745574951172, -0.0315704345703125, -0.02955341339111328, -0.027536392211914062, -0.025519371032714844, -0.023502349853515625, -0.021485328674316406, -0.019468307495117188, -0.01745128631591797, -0.01543426513671875, -0.013417243957519531, -0.011400222778320312, -0.009383201599121094, -0.007366180419921875, -0.005349159240722656, -0.0033321380615234375, -0.0013151168823242188, 0.000701904296875, 0.0027189254760742188, 0.0047359466552734375, 0.006752967834472656, 0.008769989013671875, 0.010787010192871094, 0.012804031372070312, 0.014821052551269531, 0.01683807373046875, 0.01885509490966797, 0.020872116088867188, 0.022889137268066406, 0.024906158447265625, 0.026923179626464844, 0.028940200805664062, 0.03095722198486328, 0.0329742431640625, 0.03499126434326172, 0.03700828552246094, 0.039025306701660156, 0.041042327880859375, 0.043059349060058594, 0.04507637023925781, 0.04709339141845703, 0.04911041259765625, 0.05112743377685547, 0.05314445495605469, 0.055161476135253906, 0.057178497314453125, 0.059195518493652344, 0.06121253967285156, 0.06322956085205078, 0.06524658203125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 8.0, 13.0, 28.0, 39.0, 62.0, 156.0, 540.0, 77.0, 38.0, 16.0, 9.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.0018630027771, -4.896159648895264, -4.790456295013428, -4.684752464294434, -4.579049110412598, -4.473345756530762, -4.367642402648926, -4.26193904876709, -4.156235694885254, -4.050532341003418, -3.944828748703003, -3.839125394821167, -3.733421802520752, -3.627718448638916, -3.52201509475708, -3.416311740875244, -3.31060791015625, -3.204904556274414, -3.099200963973999, -2.993497610092163, -2.887794017791748, -2.782090663909912, -2.676387310028076, -2.5706839561462402, -2.464980363845825, -2.3592770099639893, -2.253573417663574, -2.1478700637817383, -2.0421667098999023, -1.9364631175994873, -1.8307597637176514, -1.7250562906265259, -1.6193530559539795, -1.513649582862854, -1.4079461097717285, -1.3022427558898926, -1.196539282798767, -1.0908358097076416, -0.9851323962211609, -0.8794289827346802, -0.7737255096435547, -0.6680220365524292, -0.5623186230659485, -0.4566151797771454, -0.3509117364883423, -0.2452082633972168, -0.13950484991073608, -0.03380143642425537, 0.07190203666687012, 0.17760547995567322, 0.2833089232444763, 0.3890123665332794, 0.4947158098220825, 0.600419282913208, 0.7061226963996887, 0.8118261098861694, 0.9175295829772949, 1.0232330560684204, 1.128936529159546, 1.2346398830413818, 1.3403433561325073, 1.4460468292236328, 1.5517501831054688, 1.6574536561965942, 1.7631571292877197]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 3.0, 4.0, 1.0, 5.0, 3.0, 10.0, 7.0, 13.0, 11.0, 20.0, 14.0, 16.0, 19.0, 23.0, 33.0, 26.0, 37.0, 89.0, 324.0, 104.0, 26.0, 18.0, 21.0, 26.0, 23.0, 26.0, 23.0, 23.0, 8.0, 11.0, 6.0, 6.0, 4.0, 6.0, 2.0, 5.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5587775707244873, -2.4887776374816895, -2.4187777042388916, -2.3487777709960938, -2.278778076171875, -2.208778142929077, -2.1387782096862793, -2.0687782764434814, -1.9987783432006836, -1.9287784099578857, -1.858778476715088, -1.7887786626815796, -1.7187787294387817, -1.6487787961959839, -1.5787789821624756, -1.5087790489196777, -1.4387791156768799, -1.368779182434082, -1.2987792491912842, -1.2287794351577759, -1.158779501914978, -1.0887795686721802, -1.0187797546386719, -0.948779821395874, -0.8787798881530762, -0.8087799549102783, -0.7387800812721252, -0.6687802076339722, -0.5987802743911743, -0.5287803411483765, -0.4587804675102234, -0.3887805640697479, -0.31878089904785156, -0.2487809956073761, -0.17878109216690063, -0.10878118872642517, -0.03878128528594971, 0.031218618154525757, 0.10121852159500122, 0.17121842503547668, 0.24121832847595215, 0.3112182319164276, 0.3812181353569031, 0.45121803879737854, 0.521217942237854, 0.5912178754806519, 0.6612177491188049, 0.731217622756958, 0.8012175559997559, 0.8712174892425537, 0.9412173628807068, 1.0112172365188599, 1.0812171697616577, 1.1512171030044556, 1.2212169170379639, 1.2912168502807617, 1.3612167835235596, 1.4312167167663574, 1.5012166500091553, 1.5712164640426636, 1.6412163972854614, 1.7112163305282593, 1.7812161445617676, 1.8512160778045654, 1.9212160110473633]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 6.0, 10.0, 16.0, 22.0, 34.0, 37.0, 48.0, 70.0, 211.0, 260.0, 69.0, 59.0, 41.0, 33.0, 24.0, 23.0, 10.0, 9.0, 5.0, 5.0, 2.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2271728515625, -0.2168598175048828, -0.20654678344726562, -0.19623374938964844, -0.18592071533203125, -0.17560768127441406, -0.16529464721679688, -0.1549816131591797, -0.1446685791015625, -0.1343555450439453, -0.12404251098632812, -0.11372947692871094, -0.10341644287109375, -0.09310340881347656, -0.08279037475585938, -0.07247734069824219, -0.062164306640625, -0.05185127258300781, -0.041538238525390625, -0.031225204467773438, -0.02091217041015625, -0.010599136352539062, -0.000286102294921875, 0.010026931762695312, 0.0203399658203125, 0.030652999877929688, 0.040966033935546875, 0.05127906799316406, 0.06159210205078125, 0.07190513610839844, 0.08221817016601562, 0.09253120422363281, 0.10284423828125, 0.11315727233886719, 0.12347030639648438, 0.13378334045410156, 0.14409637451171875, 0.15440940856933594, 0.16472244262695312, 0.1750354766845703, 0.1853485107421875, 0.1956615447998047, 0.20597457885742188, 0.21628761291503906, 0.22660064697265625, 0.23691368103027344, 0.24722671508789062, 0.2575397491455078, 0.267852783203125, 0.2781658172607422, 0.2884788513183594, 0.29879188537597656, 0.30910491943359375, 0.31941795349121094, 0.3297309875488281, 0.3400440216064453, 0.3503570556640625, 0.3606700897216797, 0.3709831237792969, 0.38129615783691406, 0.39160919189453125, 0.40192222595214844, 0.4122352600097656, 0.4225482940673828, 0.432861328125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 11.0, 10.0, 5.0, 16.0, 14.0, 20.0, 33.0, 24.0, 62.0, 171.0, 443.0, 2900.0, 8365785.0, 17554.0, 986.0, 260.0, 105.0, 52.0, 9.0, 10.0, 40.0, 14.0, 5.0, 18.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 3.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 5.0], "bins": [-3.53940749168396, -3.42431902885437, -3.3092308044433594, -3.1941423416137695, -3.079054117202759, -2.963965654373169, -2.848877429962158, -2.7337889671325684, -2.6187005043029785, -2.5036120414733887, -2.388523817062378, -2.273435354232788, -2.1583471298217773, -2.0432586669921875, -1.9281703233718872, -1.813081979751587, -1.6979937553405762, -1.5829054117202759, -1.4678170680999756, -1.3527286052703857, -1.237640380859375, -1.1225519180297852, -1.0074635744094849, -0.8923752307891846, -0.7772868871688843, -0.662198543548584, -0.5471101999282837, -0.4320217967033386, -0.31693345308303833, -0.20184510946273804, -0.08675670623779297, 0.028331637382507324, 0.14341998100280762, 0.2585083246231079, 0.3735966980457306, 0.48868507146835327, 0.6037734150886536, 0.7188617587089539, 0.8339501619338989, 0.9490385055541992, 1.0641268491744995, 1.1792151927947998, 1.2943035364151, 1.4093918800354004, 1.5244803428649902, 1.639568567276001, 1.7546570301055908, 1.8697453737258911, 1.9848337173461914, 2.0999221801757812, 2.215010404586792, 2.330098867416382, 2.4451870918273926, 2.5602755546569824, 2.6753640174865723, 2.790452241897583, 2.9055404663085938, 3.0206289291381836, 3.1357171535491943, 3.250805616378784, 3.365893840789795, 3.4809823036193848, 3.5960707664489746, 3.7111589908599854, 3.826247453689575]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 4.0, 1.0, 4.0, 2.0, 5.0, 1.0, 11.0, 2.0, 5.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 6.0, 4.0, 4.0, 4.0, 2.0, 4.0, 2.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.611243963241577, -2.531331777572632, -2.4514195919036865, -2.3715076446533203, -2.291595458984375, -2.2116832733154297, -2.1317710876464844, -2.051858901977539, -1.9719469547271729, -1.8920347690582275, -1.8121227025985718, -1.7322105169296265, -1.6522984504699707, -1.5723862648010254, -1.49247407913208, -1.4125620126724243, -1.332649827003479, -1.2527376413345337, -1.172825574874878, -1.0929133892059326, -1.0130013227462769, -0.9330891370773315, -0.853177011013031, -0.7732648849487305, -0.6933527588844299, -0.6134406328201294, -0.5335285067558289, -0.45361635088920593, -0.3737042248249054, -0.29379209876060486, -0.21387994289398193, -0.1339678168296814, -0.05405569076538086, 0.025856442749500275, 0.10576857626438141, 0.18568071722984314, 0.2655928432941437, 0.3455049693584442, 0.42541712522506714, 0.5053292512893677, 0.5852413773536682, 0.6651535034179688, 0.7450656294822693, 0.8249777555465698, 0.9048899412155151, 0.9848020076751709, 1.0647141933441162, 1.1446263790130615, 1.2245384454727173, 1.3044506311416626, 1.3843626976013184, 1.4642748832702637, 1.5441869497299194, 1.6240991353988647, 1.7040112018585205, 1.7839233875274658, 1.8638355731964111, 1.9437477588653564, 2.0236599445343018, 2.103571891784668, 2.1834840774536133, 2.2633962631225586, 2.343308448791504, 2.423220634460449, 2.5031325817108154]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 17.0, 6.0, 28.0, 35.0, 44.0, 61.0, 96.0, 147.0, 211.0, 439.0, 1019.0, 3458.0, 15066.0, 86356.0, 302223.0, 93687.0, 15754.0, 3320.0, 1056.0, 464.0, 243.0, 163.0, 111.0, 71.0, 56.0, 33.0, 14.0, 20.0, 14.0, 11.0, 10.0, 5.0, 4.0, 3.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.30859375, -2.245391845703125, -2.18218994140625, -2.118988037109375, -2.0557861328125, -1.992584228515625, -1.92938232421875, -1.866180419921875, -1.802978515625, -1.739776611328125, -1.67657470703125, -1.613372802734375, -1.5501708984375, -1.486968994140625, -1.42376708984375, -1.360565185546875, -1.29736328125, -1.234161376953125, -1.17095947265625, -1.107757568359375, -1.0445556640625, -0.981353759765625, -0.91815185546875, -0.854949951171875, -0.791748046875, -0.728546142578125, -0.66534423828125, -0.602142333984375, -0.5389404296875, -0.475738525390625, -0.41253662109375, -0.349334716796875, -0.2861328125, -0.222930908203125, -0.15972900390625, -0.096527099609375, -0.0333251953125, 0.029876708984375, 0.09307861328125, 0.156280517578125, 0.219482421875, 0.282684326171875, 0.34588623046875, 0.409088134765625, 0.4722900390625, 0.535491943359375, 0.59869384765625, 0.661895751953125, 0.72509765625, 0.788299560546875, 0.85150146484375, 0.914703369140625, 0.9779052734375, 1.041107177734375, 1.10430908203125, 1.167510986328125, 1.230712890625, 1.293914794921875, 1.35711669921875, 1.420318603515625, 1.4835205078125, 1.546722412109375, 1.60992431640625, 1.673126220703125, 1.736328125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 6.0, 5.0, 6.0, 8.0, 12.0, 18.0, 20.0, 38.0, 34.0, 41.0, 60.0, 62.0, 104.0, 112.0, 98.0, 99.0, 73.0, 51.0, 37.0, 19.0, 24.0, 23.0, 16.0, 10.0, 6.0, 3.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3095703125, -0.298492431640625, -0.28741455078125, -0.276336669921875, -0.2652587890625, -0.254180908203125, -0.24310302734375, -0.232025146484375, -0.220947265625, -0.209869384765625, -0.19879150390625, -0.187713623046875, -0.1766357421875, -0.165557861328125, -0.15447998046875, -0.143402099609375, -0.13232421875, -0.121246337890625, -0.11016845703125, -0.099090576171875, -0.0880126953125, -0.076934814453125, -0.06585693359375, -0.054779052734375, -0.043701171875, -0.032623291015625, -0.02154541015625, -0.010467529296875, 0.0006103515625, 0.011688232421875, 0.02276611328125, 0.033843994140625, 0.044921875, 0.055999755859375, 0.06707763671875, 0.078155517578125, 0.0892333984375, 0.100311279296875, 0.11138916015625, 0.122467041015625, 0.133544921875, 0.144622802734375, 0.15570068359375, 0.166778564453125, 0.1778564453125, 0.188934326171875, 0.20001220703125, 0.211090087890625, 0.22216796875, 0.233245849609375, 0.24432373046875, 0.255401611328125, 0.2664794921875, 0.277557373046875, 0.28863525390625, 0.299713134765625, 0.310791015625, 0.321868896484375, 0.33294677734375, 0.344024658203125, 0.3551025390625, 0.366180419921875, 0.37725830078125, 0.388336181640625, 0.3994140625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 7.0, 6.0, 23.0, 37.0, 87.0, 102.0, 107.0, 54.0, 17.0, 18.0, 4.0, 7.0, 2.0, 8.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6309139728546143, -1.5468950271606445, -1.4628762006759644, -1.3788572549819946, -1.294838309288025, -1.2108194828033447, -1.126800537109375, -1.0427815914154053, -0.9587627053260803, -0.8747438192367554, -0.7907248735427856, -0.7067059874534607, -0.6226871013641357, -0.538668155670166, -0.45464926958084106, -0.37063032388687134, -0.2866114377975464, -0.20259252190589905, -0.1185736209154129, -0.03455471992492676, 0.04946419596672058, 0.13348311185836792, 0.21750199794769287, 0.3015209436416626, 0.38553982973098755, 0.4695587456226349, 0.5535776615142822, 0.6375965476036072, 0.7216154336929321, 0.8056343793869019, 0.8896532654762268, 0.9736722111701965, 1.0576910972595215, 1.1417100429534912, 1.2257288694381714, 1.3097478151321411, 1.3937667608261108, 1.477785587310791, 1.5618045330047607, 1.6458234786987305, 1.7298424243927002, 1.81386137008667, 1.89788019657135, 1.9818991422653198, 2.06591796875, 2.1499369144439697, 2.2339558601379395, 2.317974805831909, 2.401993751525879, 2.4860126972198486, 2.5700316429138184, 2.654050350189209, 2.7380692958831787, 2.8220882415771484, 2.906107187271118, 2.990126132965088, 3.0741448402404785, 3.1581637859344482, 3.242182731628418, 3.3262014389038086, 3.4102203845977783, 3.494239330291748, 3.5782582759857178, 3.6622772216796875, 3.7462961673736572]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 4.0, 5.0, 5.0, 7.0, 9.0, 8.0, 13.0, 29.0, 44.0, 49.0, 68.0, 67.0, 78.0, 35.0, 15.0, 18.0, 14.0, 3.0, 5.0, 5.0, 7.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.592702627182007, -2.52793288230896, -2.463163375854492, -2.3983936309814453, -2.3336238861083984, -2.2688541412353516, -2.204084634780884, -2.139314889907837, -2.074545383453369, -2.0097756385803223, -1.945006012916565, -1.8802363872528076, -1.8154666423797607, -1.7506970167160034, -1.685927391052246, -1.6211576461791992, -1.5563879013061523, -1.491618275642395, -1.4268485307693481, -1.3620789051055908, -1.297309160232544, -1.2325395345687866, -1.1677699089050293, -1.1030001640319824, -1.038230538368225, -0.973460853099823, -0.9086911678314209, -0.8439215421676636, -0.7791518568992615, -0.7143821716308594, -0.649612545967102, -0.5848428606987, -0.5200729370117188, -0.45530325174331665, -0.39053359627723694, -0.3257639408111572, -0.2609942555427551, -0.19622457027435303, -0.13145491480827332, -0.0666852593421936, -0.001915574073791504, 0.0628540962934494, 0.1276237666606903, 0.1923934370279312, 0.2571631073951721, 0.3219327926635742, 0.38670244812965393, 0.45147210359573364, 0.5162417888641357, 0.5810114741325378, 0.6457811594009399, 0.7105507850646973, 0.7753204703330994, 0.8400901556015015, 0.9048597812652588, 0.9696294665336609, 1.034399151802063, 1.0991687774658203, 1.1639385223388672, 1.2287081480026245, 1.2934777736663818, 1.3582475185394287, 1.423017144203186, 1.4877867698669434, 1.5525565147399902]}, "eval/loss": 4.200125694274902, "eval/wer": 1.9598968663228877, "eval/runtime": 786.8447, "eval/samples_per_second": 3.358, "eval/steps_per_second": 0.281, "train/train_runtime": 5718.4377, "train/train_samples_per_second": 4.991, "train/train_steps_per_second": 0.104, "train/total_flos": 0.0, "train/train_loss": 4.336673439953865} \ No newline at end of file